您的位置:首页 > 其它

chrome插件:提取页面数据

2015-05-26 14:17 555 查看
近期在做Chrome插件,需要提取页面里的一些数据,简单说就是企业版微博的后台数据,因为微博不提供导出功能。

最开始是用php完成的,但是每次都需要先把页面代码保存下来,再进行提取,很麻烦。chrome插件可以和页面DOM交互,看起来很方便,所以开始学着写。javascript和jQuery都是边学习边写。

以下代码实现了把需要的数据提取出来(目前只输出到控制台),把数据发送出去的xmlHttp部分还需要补充。

<script type="text/javascript" charset="UTF-8" src="http://chenbinx.cn/kaiguan/jquery-2.0.2.min.js"></script>
<script type="text/javascript">
// Once the DOM is ready, register a click handler on every span.main_title
// element. Each click logs the statistics of the FIRST matching table row
// (date, post text, read count, repost/comment/like count, short-link clicks)
// to the console.
$(document).ready(function(){
  $("span.main_title").click(function(){
    console.log("执行了!");
    // Attribute-equals selector: matches only elements whose class attribute is
    // exactly this string. In the sample markup shown in this post that is the
    // first <td> of each body row (the header <th> carries an extra class).
    var m=$("[class='S_line2 W_tc fst']");
    if (m.length === 0) {
      // Nothing to extract; bail out instead of dereferencing undefined below.
      console.warn("未找到数据行");
      return;
    }
    // Declared with var: the original assignment created an implicit global.
    var time=m[0];// first matching cell only
    console.log("日期为:"+time.innerText);
    var content=nextSibling(time);// next element sibling: post text cell
    console.log("博文内容为:"+content.innerText);
    var read=nextSibling(content);// read-count cell
    console.log("博文阅读数为:"+read.innerText);
    var zan=getFirst(nextSibling(read));// first element child of the following cell
    console.log("转评赞为:"+zan.innerText);
    var clicknum=nextSibling(zan);// element sibling right after that child
    console.log("短链点击为:"+clicknum.innerText);
  });
});

/**
 * Returns the first child of `elem` that is an element node (nodeType 1),
 * skipping text, comment and other non-element nodes.
 *
 * @param {?Node} elem - Parent node to search; may be null or undefined.
 * @returns {?Node} The first element child, or null when `elem` is
 *   null/undefined or has no element children.
 */
function getFirst(elem){
  // Callers pass the result of nextSibling(), which can be null.
  if (elem == null) {
    return null;
  }
  var children = elem.childNodes;
  for (var i = 0; i < children.length; i++) {
    if (children[i].nodeType === 1) {
      return children[i];
    }
  }
  // Explicit null keeps the result consistent with nextSibling/prevSibling.
  return null;
}

/**
 * Returns the next sibling of `node` that is an element node (nodeType 1),
 * skipping text, comment and other non-element nodes.
 *
 * @param {Node} node - Node whose following siblings are scanned.
 * @returns {?Node} The next element sibling, or null when there is none
 *   (including when `node` is the last child or has no parent).
 */
function nextSibling(node) {
  // Walk the sibling chain directly; this needs no parentNode lookup, so a
  // detached node yields null instead of throwing.
  var candidate = node.nextSibling;
  while (candidate && candidate.nodeType !== 1) {
    candidate = candidate.nextSibling;
  }
  return candidate || null;
}
/**
 * Returns the previous sibling of `node` that is an element node (nodeType 1),
 * skipping text, comment and other non-element nodes.
 *
 * @param {Node} node - Node whose preceding siblings are scanned.
 * @returns {?Node} The previous element sibling, or null when there is none
 *   (including when `node` is the first child or has no parent).
 */
function prevSibling(node) {
  // Walk the sibling chain directly; this needs no parentNode lookup, so a
  // detached node yields null instead of throwing.
  var candidate = node.previousSibling;
  while (candidate && candidate.nodeType !== 1) {
    candidate = candidate.previousSibling;
  }
  return candidate || null;
}
</script>

这里把需要提取数据的页面源代码也附上:
<body>
<div class="E_PCD_chart2">
<div class="WB_cardtitle_b S_line2">
<h4 class="obj_name">
<span class="main_title W_fb W_f14">博文分析</span>
<span class="subtitle S_txt2">
<span class="W_icon icon_askS" action-type="layerIcon" action-data="t=2"></span>
</span>
</h4>
<div class="opt_page">
<span class="interval">
<a class="S_txt2" href="javascript:;" action-type="vote" action-data="moduleid=2&attitude=1" suda-uatrack="key=DataService&value=121">
<em class="EM_icon EM_icon_praised_b"></em>
有用
</a>
</span>
<span class="interval">
<a class="S_txt2" href="javascript:;" action-type="vote" action-data="moduleid=2&attitude=0" suda-uatrack="key=DataService&value=122">
<em class="EM_icon EM_icon_praised_d"></em>
无用
</a>
</span>
</div>
</div>
<div class="WB_innerwrap" node-type="articlesList">
<table class="EM_table">
<colgroup>
<col width="12%">
<col width="37%">
<col width="12%">
<col>
<col width="9%">
</colgroup>
<thead>
<tr>
<th class="S_line2 S_txt2 W_tc fst">发布时间</th>
<th class="S_line2 S_txt2">博文内容</th>
<th class="S_line2 S_txt2">博文阅读数</th>
<th class="S_line2 S_txt2 W_tc">
<span>互动数</span>
<i class="ann c1"></i>
<span>转评赞</span>
<i class="ann c2"></i>
<span>短链点击</span>
</th>
<th class="S_line2 S_txt2 lst">
操作
<span class="W_icon icon_askS" action-type="layerIcon" action-data="t=1"></span>
</th>
</tr>
</thead>
<tbody>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-24 21:39</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjmjFoKBD" target="_blank" class="S_txt1">#520爱尚我# 呛口同款西班牙芭蕾新履,Pretty Ballerinas大促5折...</a>
</td>
<td class="S_line2">7564</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">6</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:2.52%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">12</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:5.04%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3846140195899029%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-24 17:26</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjkEYrqia" target="_blank" class="S_txt1">#520爱尚我# 尚品网5周年大促即将结束,ASH全场4折起!明星款至...</a>
</td>
<td class="S_line2">16204</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">6</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:2.52%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">17</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:7.14%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3846076526535926%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-24 14:05</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjjlobuW8" target="_blank" class="S_txt1">#520爱尚我# 尚品网5周年大促,URBAN REVIVO、DAZZLE、d'zzit等...</a>
</td>
<td class="S_line2">13614</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">3</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:1.26%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">16</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:6.72%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3846025942740532%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-24 12:05</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjiyGgJbX" target="_blank" class="S_txt1">#520爱尚我# 配饰对于每位爱美的MM都是必不可少的装饰品,配饰为...</a>
</td>
<td class="S_line2">8121</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">6</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:2.52%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">4</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:1.68%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845995743986969%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-24 11:23</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjihSnt5J" target="_blank" class="S_txt1">#520爱尚我# 尚品网5周年大促,爆款手袋,倒计时48小时!2折起!...</a>
</td>
<td class="S_line2">6829</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">1</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:0.42%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">8</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:3.36%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845985325593375%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-23 15:20</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/CjapkE5IY" target="_blank" class="S_txt1">#520爱尚我# Furla倍受欢迎的果冻包,补!货!啦!啥都别说了,...</a>
</td>
<td class="S_line2">9535</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">4</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:1.68%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">10</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:4.20%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845682429555128%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-23 13:03</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/Cj9w4oWt6" target="_blank" class="S_txt1">#520爱尚我# 盘点520大促最值得购买的Bally单品,从这些单品中我...</a>
</td>
<td class="S_line2">9289</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">3</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:1.26%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">2</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:0.84%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845648165944628%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-23 11:20</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/Cj8PV89Ox" target="_blank" class="S_txt1">#520爱尚我# MO&CO.品牌日&尚品网店庆同庆,补货上新!全网独家...</a>
</td>
<td class="S_line2">7833</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">3</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:1.26%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">11</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:4.62%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845622031944353%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-22 17:31</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/Cj1Q5AC8u" target="_blank" class="S_txt1">#520爱尚我# 尚品网5周年庆大促,进入第三天啦!现在每天都有补...</a>
</td>
<td class="S_line2">17456</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">9</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:3.78%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">24</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:10.08%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845353058726406%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
<tr>
<td class="S_line2 W_tc fst">
<p>2015-05-22 14:42</p>
</td>
<td class="S_line2">
<a href="http://weibo.com/1854902371/Cj0JsviPb" target="_blank" class="S_txt1">#520爱尚我# 【520大促最值入手的9款大牌包包】炎炎夏日,对于广...</a>
</td>
<td class="S_line2">33647</td>
<td class="S_line2">
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">238</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c1" style="width:100.00%;"></i>
</span>
</dd>
</dl>
<dl class="EM_stripe clearfix">
<dt class="W_fl W_tr">13</dt>
<dd class="W_fl">
<span class="stripe">
<i class="inner c2" style="width:5.46%;"></i>
</span>
</dd>
</dl>
</td>
<td class="S_line2 lst">
<a class="S_txt1" href="javascript:;" action-type="extension" action-data="url=http%3A%2F%2Fpromote.vip.weibo.com%2Fpromote%3Ffrom%3De_weibo%26mid%3D3845310507460533%26ru%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats%26failRu%3Dhttp%3A%2F%2Fweibo.com%2Fp%2F1006061854902371%2Fmanage%3Fiframe_url%3Dhttp%3A%2F%2Fe.weibo.com%2Fv1%2Feps%2Fdata%2Farticlestats" suda-uatrack="key=DataService&value=123">推广</a>
</td>
</tr>
</tbody>
</table>
</div>
<div class="W_pages E_MB10" node-type="pageTurn">
<a class="page prev S_txt1 S_line1" href="javascript:;" node-type="pageUp" style="display:none" suda-uatrack="key=DataService&value=124">上一页</a>
<span class="list">
<div class="layer_menu_list W_scroll" node-type="pageNumLayer" style="display:none">
<ul>
<li class="cur">
<a href="javascript:;" action-type="turnToPage" action-data="page=1" suda-uatrack="key=DataService&value=124">第 1 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=2" suda-uatrack="key=DataService&value=124">第 2 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=3" suda-uatrack="key=DataService&value=124">第 3 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=4" suda-uatrack="key=DataService&value=124">第 4 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=5" suda-uatrack="key=DataService&value=124">第 5 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=6" suda-uatrack="key=DataService&value=124">第 6 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=7" suda-uatrack="key=DataService&value=124">第 7 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=8" suda-uatrack="key=DataService&value=124">第 8 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=9" suda-uatrack="key=DataService&value=124">第 9 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=10" suda-uatrack="key=DataService&value=124">第 10 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=11" suda-uatrack="key=DataService&value=124">第 11 页</a>
</li>
<li>
<a href="javascript:;" action-type="turnToPage" action-data="page=12" suda-uatrack="key=DataService&value=124">第 12 页</a>
</li>
</ul>
</div>
<a class="page S_txt1" href="javascript:;" node-type="curPageNum">
第 1 页
<i class="W_ficon ficon_arrow_down S_ficon">c</i>
</a>
</span>
<a class="page next S_txt1 S_line1" href="javascript:;" node-type="pageDown" maxpage="12" suda-uatrack="key=DataService&value=124">下一页</a>
</div>
<!-- a.WB_cardmore.S_txt1.S_line1.clearfix(href='javascript:;',node-type="viewMore") -->
<!-- span.more_txt -->
<!-- | 查看更多 -->
<!-- em.W_ficon.ficon_arrow_right.S_ficon a -->
</div>
</body>
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: 
相关文章推荐