java 抓取 https 网页内容
2013-03-25 13:25
477 查看
import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import javax.net.ssl.HttpsURLConnection;
public class JavaUrl {
    /**
     * Time limit in milliseconds, applied to connecting, to each blocking read,
     * and to the total time spent scanning the response body.
     */
    private static final int TIMEOUT_MILLIS = 10000;

    /**
     * Checks that a website is working by fetching a page over HTTPS and
     * searching the response body, line by line, for an expected piece of text.
     *
     * <p>This method never throws: every failure (malformed URL, non-HTTPS URL,
     * I/O error, timeout, null argument) is logged to standard output and
     * reported as {@code false}.
     *
     * @param checkUrl     the HTTPS URL to fetch
     * @param checkContent the text that must appear within a single line of the response
     * @return {@code true} if some line of the response contains {@code checkContent};
     *         {@code false} if it was not found, the scan exceeded the time limit,
     *         or the page could not be fetched
     */
    public boolean checkWebsite(String checkUrl,String checkContent){
        if (checkUrl == null || checkContent == null) {
            // Reject up front instead of relying on an exception thrown mid-request.
            reportFailure(checkUrl, checkContent, "URL and expected content must not be null");
            return false;
        }

        HttpsURLConnection httpsConn = null;
        try {
            URL url = new URL(checkUrl);
            java.net.URLConnection conn = url.openConnection();
            if (!(conn instanceof HttpsURLConnection)) {
                // Only HTTPS is supported; say so explicitly rather than via a ClassCastException.
                reportFailure(checkUrl, checkContent, "Not an HTTPS URL");
                return false;
            }
            httpsConn = (HttpsURLConnection) conn;

            // Without these, a stalled server would block connect/read forever and the
            // elapsed-time check below (which only runs between lines) would never fire.
            httpsConn.setConnectTimeout(TIMEOUT_MILLIS);
            httpsConn.setReadTimeout(TIMEOUT_MILLIS);

            // Obtain the connection's input stream to read the response body.
            // try-with-resources closes the reader (and the underlying stream) on every exit path.
            // NOTE(review): the body is decoded with the platform default charset, as before;
            // confirm whether the charset declared by the server should be used instead.
            try (BufferedReader reader =
                    new BufferedReader(new InputStreamReader(httpsConn.getInputStream()))) {
                String line = reader.readLine();
                // nanoTime is monotonic, so the measurement is immune to wall-clock adjustments.
                long startNanos = System.nanoTime();
                while (line != null) {
                    long elapsedMillis = (System.nanoTime() - startNanos) / 1000000L;
                    if (elapsedMillis > TIMEOUT_MILLIS) {
                        return false; // scanning took longer than 10 seconds: treat as a timeout
                    }
                    if (line.contains(checkContent)) {
                        return true;
                    }
                    line = reader.readLine();
                }
            }
            return false;
        } catch (Exception e) {
            // Boundary of the health check: any failure means "site is not OK", never a crash.
            reportFailure(checkUrl, checkContent, e.getMessage());
            e.printStackTrace();
            return false;
        } finally {
            if (httpsConn != null) {
                httpsConn.disconnect();
            }
        }
    }

    /** Prints the two-line failure report used for every unsuccessful check. */
    private static void reportFailure(String checkUrl, String checkContent, String reason) {
        System.out.println("Can't get content:"+checkContent +" from URL:"+checkUrl);
        System.out.println("The error is:"+reason);
    }
}
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import javax.net.ssl.HttpsURLConnection;
public class JavaUrl {
    /**
     * Time limit in milliseconds, applied to connecting, to each blocking read,
     * and to the total time spent scanning the response body.
     */
    private static final int TIMEOUT_MILLIS = 10000;

    /**
     * Checks that a website is working by fetching a page over HTTPS and
     * searching the response body, line by line, for an expected piece of text.
     *
     * <p>This method never throws: every failure (malformed URL, non-HTTPS URL,
     * I/O error, timeout, null argument) is logged to standard output and
     * reported as {@code false}.
     *
     * @param checkUrl     the HTTPS URL to fetch
     * @param checkContent the text that must appear within a single line of the response
     * @return {@code true} if some line of the response contains {@code checkContent};
     *         {@code false} if it was not found, the scan exceeded the time limit,
     *         or the page could not be fetched
     */
    public boolean checkWebsite(String checkUrl,String checkContent){
        if (checkUrl == null || checkContent == null) {
            // Reject up front instead of relying on an exception thrown mid-request.
            reportFailure(checkUrl, checkContent, "URL and expected content must not be null");
            return false;
        }

        HttpsURLConnection httpsConn = null;
        try {
            URL url = new URL(checkUrl);
            java.net.URLConnection conn = url.openConnection();
            if (!(conn instanceof HttpsURLConnection)) {
                // Only HTTPS is supported; say so explicitly rather than via a ClassCastException.
                reportFailure(checkUrl, checkContent, "Not an HTTPS URL");
                return false;
            }
            httpsConn = (HttpsURLConnection) conn;

            // Without these, a stalled server would block connect/read forever and the
            // elapsed-time check below (which only runs between lines) would never fire.
            httpsConn.setConnectTimeout(TIMEOUT_MILLIS);
            httpsConn.setReadTimeout(TIMEOUT_MILLIS);

            // Obtain the connection's input stream to read the response body.
            // try-with-resources closes the reader (and the underlying stream) on every exit path.
            // NOTE(review): the body is decoded with the platform default charset, as before;
            // confirm whether the charset declared by the server should be used instead.
            try (BufferedReader reader =
                    new BufferedReader(new InputStreamReader(httpsConn.getInputStream()))) {
                String line = reader.readLine();
                // nanoTime is monotonic, so the measurement is immune to wall-clock adjustments.
                long startNanos = System.nanoTime();
                while (line != null) {
                    long elapsedMillis = (System.nanoTime() - startNanos) / 1000000L;
                    if (elapsedMillis > TIMEOUT_MILLIS) {
                        return false; // scanning took longer than 10 seconds: treat as a timeout
                    }
                    if (line.contains(checkContent)) {
                        return true;
                    }
                    line = reader.readLine();
                }
            }
            return false;
        } catch (Exception e) {
            // Boundary of the health check: any failure means "site is not OK", never a crash.
            reportFailure(checkUrl, checkContent, e.getMessage());
            e.printStackTrace();
            return false;
        } finally {
            if (httpsConn != null) {
                httpsConn.disconnect();
            }
        }
    }

    /** Prints the two-line failure report used for every unsuccessful check. */
    private static void reportFailure(String checkUrl, String checkContent, String reason) {
        System.out.println("Can't get content:"+checkContent +" from URL:"+checkUrl);
        System.out.println("The error is:"+reason);
    }
}
相关文章推荐
- java 抓取 https 网页内容
- Java 抓取网页内容,获取指定服务器IP
- java 抓取网页内容小工具
- java-抓取指定URL网页的内容(二)
- JAVA抓取网站网页内容
- java利用url实现网页内容的抓取
- Java 抓取网页内容
- 通过java.net.Socket 类抓取网页内容
- JAVA 抓取网页内容
- curl实现避开验证码模拟登入 抓取网站网页内容 https
- java抓取网页指定元素/内容
- JAVA 抓取网页内容
- 网络爬虫Java实现抓取网页内容
- 爬网入门:JAVA抓取网站网页内容
- java 抓取网页内容,可设定代理(HttpURLConnection)
- java爬虫(使用jsoup设置代理,抓取网页内容)
- Java网页抓取网页内容时,乱码问题的解决
- java抓取全部网页内容
- Java HttpURLConnection 抓取网页内容 解析gzip格式输入流数据并转换为String格式字符串
- java利用url实现网页内容的抓取