Commit 479f6d4e by leiliangliang

更新百度热搜内容采集

parent 2247b2af
...@@ -83,7 +83,7 @@ public class BaiDuHotSearchCrawler { ...@@ -83,7 +83,7 @@ public class BaiDuHotSearchCrawler {
//获取链接 //获取链接
String url = element.select("div.content_1YWBm").select("a.title_dIF3B").attr("href"); String url = element.select("div.content_1YWBm").select("a.title_dIF3B").attr("href");
//获取内容 //获取内容
String content = element.select("div.small_Uvkd3").text(); String content = element.select("div.large_nSuFU").text().replace(" 查看更多>","");
//获取搜索指数 //获取搜索指数
String strCount = element.select("div.hot-index_1Bl1a").text(); String strCount = element.select("div.hot-index_1Bl1a").text();
Long count = Long.valueOf(strCount); Long count = Long.valueOf(strCount);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment