您的位置:首页 > 理论基础 > 计算机网络

Java 抓取 HTTPS 网页内容

2013-03-25 13:25 477 查看
import java.io.BufferedReader;

import java.io.InputStream;

import java.io.InputStreamReader;

import java.net.URL;

import javax.net.ssl.HttpsURLConnection;

public class JavaUrl {

    /** Time budget, in milliseconds, for connecting, for each blocking read, and for the whole check. */
    private static final int TIMEOUT_MILLIS = 10000;

    /** The same budget expressed in nanoseconds, for comparison against {@link System#nanoTime()}. */
    private static final long TIMEOUT_NANOS = TIMEOUT_MILLIS * 1000000L;

    /**
     * Checks that a website is working by fetching an HTTPS page and looking for
     * an expected piece of text in its body.
     *
     * <p>The response is read line by line; the check succeeds as soon as one line
     * contains {@code checkContent}. Any failure (malformed URL, a URL whose
     * connection is not an {@link HttpsURLConnection}, I/O error, timeout, or a
     * {@code null} argument that triggers an exception) is reported on standard
     * output and results in {@code false}; no exception escapes this method.
     *
     * @param checkUrl     the HTTPS URL to fetch
     * @param checkContent the text that must appear within a single line of the response
     * @return {@code true} if a line containing {@code checkContent} was read within the
     *         time budget; {@code false} otherwise
     */
    public boolean checkWebsite(String checkUrl, String checkContent) {
        HttpsURLConnection httpsConn = null;
        try {
            // Start the clock before connecting so the budget covers the whole check,
            // and use the monotonic clock so wall-clock adjustments cannot skew it.
            long startNanos = System.nanoTime();

            URL url = new URL(checkUrl);
            httpsConn = (HttpsURLConnection) url.openConnection();

            // Without these, a server that accepts the connection but never answers
            // would block getInputStream()/readLine() forever and the elapsed-time
            // check below would never get a chance to run.
            httpsConn.setConnectTimeout(TIMEOUT_MILLIS);
            httpsConn.setReadTimeout(TIMEOUT_MILLIS);

            // Obtain the connection's input stream to read the response body.
            // try-with-resources closes the reader (and the underlying stream) on
            // every exit path, including the early returns.
            // NOTE(review): bytes are decoded with the platform default charset, as
            // before; pages in another encoding may not match non-ASCII content.
            InputStream ins = httpsConn.getInputStream();
            try (BufferedReader breader = new BufferedReader(new InputStreamReader(ins))) {
                String info;
                while ((info = breader.readLine()) != null) {
                    // Reaching the time budget counts as a timeout.
                    if (System.nanoTime() - startNanos > TIMEOUT_NANOS) {
                        return false;
                    }
                    if (info.indexOf(checkContent) != -1) {
                        return true;
                    }
                }
            }
            // Whole body read without finding the expected content.
            return false;
        } catch (Exception e) {
            System.out.println("Can't get content:" + checkContent + " from URL:" + checkUrl);
            System.out.println("The error is:" + e.getMessage());
            e.printStackTrace();
            return false;
        } finally {
            // Release the connection whether the check succeeded, failed or timed out.
            if (httpsConn != null) {
                httpsConn.disconnect();
            }
        }
    }

}
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: