获取网站 <meta name="keywords" content="" /> 和 <meta name="description" content="" /> 中的关键字和描述内容
实现方式:使用HTML解析器jsoup
下载jsoup的lib地址:http://jsoup.org/download
package cn.evan.util;

import java.io.IOException;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

/**
 * Small command-line demo that downloads a web page with jsoup and prints the
 * content of its {@code <meta name="keywords">} and
 * {@code <meta name="description">} tags, followed by the page title.
 */
public class SemanticCrawl {

    /** Placeholder address used when no URL is supplied on the command line. */
    private static final String DEFAULT_URL = "网址";

    /**
     * Fetches the page and prints its keywords, description and title to
     * standard output.
     *
     * <p>If the page cannot be fetched, a message is written to standard error
     * and the JVM exits with status 1 instead of continuing with a null
     * document.
     *
     * @param args optional; when present, {@code args[0]} is the URL to fetch,
     *             otherwise {@link #DEFAULT_URL} is used
     */
    public static void main(String[] args) {
        String url = (args != null && args.length > 0) ? args[0] : DEFAULT_URL;

        Document doc;
        try {
            doc = Jsoup.connect(url).get();
        } catch (IOException e) {
            // Without a document there is nothing to print; stop here rather
            // than dereferencing null further down.
            System.err.println("获取页面失败:" + url + " (" + e + ")");
            System.exit(1);
            return; // unreachable at runtime, but lets the compiler see doc is assigned below
        }

        String title = doc.title();

        // Only <meta> elements inside <head> are inspected.
        Elements metas = doc.head().select("meta");
        for (Element meta : metas) {
            String name = meta.attr("name");
            String content = meta.attr("content");
            // The name attribute is matched case-insensitively.
            if ("keywords".equalsIgnoreCase(name)) {
                System.out.println("关键字:" + content);
            }
            if ("description".equalsIgnoreCase(name)) {
                System.out.println("网站内容描述:" + content);
            }
        }

        System.out.println("标题" + title);
    }
}
以上所述就是本文分享的全部内容了,希望大家能够喜欢。