网上动态新闻抓取网址
2013-04-14 18:21
260 查看
网易:
http://news.163.com/special/0001220O/news_json.js http://news.163.com/latest/
新浪:
http://news.sina.com.cn/news1000/?requestOrder=-1 全部新闻
http://news.sina.com.cn/news1000/?requestOrder=0 国内新闻
http://news.sina.com.cn/news1000/?requestOrder=1 国际新闻
http://news.sina.com.cn/news1000/?requestOrder=2 社会新闻
http://news.sina.com.cn/news1000/?requestOrder=8 股票新闻
http://rss.sina.com.cn/rollnews/news/gn_total.js
Array("http://rss.sina.com.cn/rollnews/news/gn_total.js","http://rss.sina.com.cn/rollnews/news/gj_total.js","http://rss.sina.com.cn/rollnews/news/sh_total.js","http://rss.sina.com.cn/rollnews/jczs/jczs_total.js","http://rss.sina.com.cn/rollnews/sports/sports_total.js","http://rss.sina.com.cn/rollnews/ent/ent_total.js","http://rss.sina.com.cn/rollnews/tech/tech1_total.js","http://rss.sina.com.cn/rollnews/finance/finance1_news_total.js","http://rss.sina.com.cn/rollnews/finance/gupiao_news_total.js");
搜狐
http://roll.sohu.com/ http://news.sohu.com/scroll/ http://news.sohu.com/rss/scroll.xml http://news.sohu.com/_scroll_newslist/20130413/news.inc
人民网
http://www.people.com.cn/GB/24hour/n/2013/0413/c25408-21122220.html http://news.people.com.cn//210801/211150/index.js http://world.huanqiu.com/roll.html http://news.people.com.cn/210801/211150/index.js
以下网站没有找到对应的 JSON 数据接口,暂时只能通过 HTMLParser 解析页面来抓取:
腾讯(没找到)
http://roll.news.qq.com/ http://roll.news.qq.com//interface/catalog.php
{"response":{"code":"1","msg":"Miss site name!","dext":""},"data":""}
var articleAjax = new Ajax("../interface/catalog.php?" + Math.random() + data,null , G.InitCataList);
var data = "&cata=" + G.paraElement.cata + "&site=" + G.paraElement.site + "&date=" + G.paraElement.date + "&page=" + G.paraElement.page + "&mode=" + G.paraElement.mod + "&of=json";
{"response":{"code":"0","msg":"Sucess","dext":""},"data":[{"e":"newsgn","c":"国内"},{"e":"newsgj","c":"国际"},{"e":"newssh","c":"社会"},{"e":"milite","c":"军事"},{"e":"photon","c":"图片"},{"e":"video","c":"视频"},{"e":"green","c":"绿色"},{"e":"history","c":"历史"},{"e":"health2012","c":"健康"}]}
http://roll.news.qq.com/interface/roll.php?0.6283637253279363&cata=&site=news&date=20130413&page=1&mode=1&of=json
环球
http://china.huanqiu.com/ http://china.huanqiu.com/roll.html http://rss.huanqiu.com/china/local.xml
凤凰网
http://china.huanqiu.com/roll.html
百度新闻
http://guonei.news.baidu.com/n?cmd=4&class=civilnews&pn=1 http://news.baidu.com/z/data/json/cms_page_data.json?v=20130413
中国新闻网
http://www.chinanews.com/china.shtml http://www.chinanews.com/scroll-news/news1.html
新华网
http://www.xinhuanet.com/jsyw_new.htm
rss:
http://blog.csdn.net/numen_wlm/article/details/849448
网易:
http://news.163.com/special/0001220O/news_json.js http://news.163.com/latest/
新浪:
http://news.sina.com.cn/news1000/?requestOrder=-1 全部新闻
http://news.sina.com.cn/news1000/?requestOrder=0 国内新闻
http://news.sina.com.cn/news1000/?requestOrder=1 国际新闻
http://news.sina.com.cn/news1000/?requestOrder=2 社会新闻
http://news.sina.com.cn/news1000/?requestOrder=8 股票新闻
http://rss.sina.com.cn/rollnews/news/gn_total.js
Array("http://rss.sina.com.cn/rollnews/news/gn_total.js","http://rss.sina.com.cn/rollnews/news/gj_total.js","http://rss.sina.com.cn/rollnews/news/sh_total.js","http://rss.sina.com.cn/rollnews/jczs/jczs_total.js","http://rss.sina.com.cn/rollnews/sports/sports_total.js","http://rss.sina.com.cn/rollnews/ent/ent_total.js","http://rss.sina.com.cn/rollnews/tech/tech1_total.js","http://rss.sina.com.cn/rollnews/finance/finance1_news_total.js","http://rss.sina.com.cn/rollnews/finance/gupiao_news_total.js");
搜狐
http://roll.sohu.com/ http://news.sohu.com/scroll/ http://news.sohu.com/rss/scroll.xml http://news.sohu.com/_scroll_newslist/20130413/news.inc
人民网
http://www.people.com.cn/GB/24hour/n/2013/0413/c25408-21122220.html http://news.people.com.cn//210801/211150/index.js http://world.huanqiu.com/roll.html http://news.people.com.cn/210801/211150/index.js
以下网站没有找到对应的 JSON 数据接口,暂时只能通过 HTMLParser 解析页面来抓取:
腾讯(没找到)
http://roll.news.qq.com/ http://roll.news.qq.com//interface/catalog.php
{"response":{"code":"1","msg":"Miss site name!","dext":""},"data":""}
var articleAjax = new Ajax("../interface/catalog.php?" + Math.random() + data,null , G.InitCataList);
var data = "&cata=" + G.paraElement.cata + "&site=" + G.paraElement.site + "&date=" + G.paraElement.date + "&page=" + G.paraElement.page + "&mode=" + G.paraElement.mod + "&of=json";
{"response":{"code":"0","msg":"Sucess","dext":""},"data":[{"e":"newsgn","c":"国内"},{"e":"newsgj","c":"国际"},{"e":"newssh","c":"社会"},{"e":"milite","c":"军事"},{"e":"photon","c":"图片"},{"e":"video","c":"视频"},{"e":"green","c":"绿色"},{"e":"history","c":"历史"},{"e":"health2012","c":"健康"}]}
http://roll.news.qq.com/interface/roll.php?0.6283637253279363&cata=&site=news&date=20130413&page=1&mode=1&of=json
环球
http://china.huanqiu.com/ http://china.huanqiu.com/roll.html http://rss.huanqiu.com/china/local.xml
凤凰网
http://china.huanqiu.com/roll.html
百度新闻
http://guonei.news.baidu.com/n?cmd=4&class=civilnews&pn=1 http://news.baidu.com/z/data/json/cms_page_data.json?v=20130413
中国新闻网
http://www.chinanews.com/china.shtml http://www.chinanews.com/scroll-news/news1.html
新华网
http://www.xinhuanet.com/jsyw_new.htm
rss:
http://blog.csdn.net/numen_wlm/article/details/849448
相关文章推荐
- 常用社交网络(SNS、人人网、新浪微博)动态新闻(feed、新鲜事、好友动态)系统浅析
- python 多线程抓取动态数据
- 金融行情数据抓取系列文章(全球股市,A股,美股,港股,外汇,债券,贵金属,财经日历,资讯,实时新闻等)
- 安卓新闻客户端编写(一) JSOUP抓取网页信息
- 推荐几个免费网上图书馆的网址
- Python抓取新闻标题和链接
- 如何利用Python网络爬虫抓取微信朋友圈的动态(上)
- 知名网站 新闻评论数 评论链接抓取
- 如何用Python,C#等语言去实现抓取静态网页+抓取动态网页+模拟登陆网站
- c#关于网页内容抓取,简单爬虫的实现。(包括动态,静态的)
- matlab抓取指定网址图片
- scrapy-splash抓取动态数据例子七
- 安卓项目开发之新闻客户端---新闻客户端app抓取信息
- 实例讲解ASP实现抓取网上房产信息
- scrapy-splash抓取动态数据例子十一
- asp采集抓取网上房产信息的代码
- 网址大全[收集网上大部份好的开源网]
- 常用社交网络(微博等)动态新闻(feed、新鲜事)系统浅析(转)
- scrapy-splash抓取动态数据例子十二