Commit a2736a3f by yangchen

添加客户端新浪财经来源采集

parent 8b7d40ab
...@@ -25,7 +25,7 @@ public class MediaSelfSource { ...@@ -25,7 +25,7 @@ public class MediaSelfSource {
public static void main(String[] args) { public static void main(String[] args) {
ProxyFactory.init("zookeeper://192.168.0.36:2181","local",GroupType.PROVIDER); ProxyFactory.init("zookeeper://192.168.0.36:2181","local",GroupType.PROVIDER);
List<String> urlList = new ArrayList<>(); List<String> urlList = new ArrayList<>();
urlList.add("https://dy.163.com/v2/article/detail/EI1VGJ1S05179BUV.html"); urlList.add("https://finance.sina.cn/stock/relnews/hk/2019-07-22/detail-ihytcitm3847530.d.html");
List<MediaSelfSourceBean> u = MediaSelfSource.getMediaSelfSource(urlList); List<MediaSelfSourceBean> u = MediaSelfSource.getMediaSelfSource(urlList);
for(MediaSelfSourceBean b : u) { for(MediaSelfSourceBean b : u) {
System.out.println(b.toString()); System.out.println(b.toString());
......
...@@ -394,7 +394,8 @@ public class MatchSource { ...@@ -394,7 +394,8 @@ public class MatchSource {
if(source!=null && source.length()>1){ if(source!=null && source.length()>1){
source = "快资讯-" + source; source = "快资讯-" + source;
} }
}else if(url.contains("cj.sina.com.cn")){ }else if(url.contains("cj.sina.com.cn") || url.contains("finance.sina.cn")){
source = document.select("h2.weibo_user").text();
//新浪财经头条号 //新浪财经头条号
if(html.contains("<meta name=\"mediaid\"")){ if(html.contains("<meta name=\"mediaid\"")){
source = html.split("<meta name=\"mediaid\" content=\"")[1].split("\"")[0].trim(); source = html.split("<meta name=\"mediaid\" content=\"")[1].split("\"")[0].trim();
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment