Java 抓取网页内容
2011-03-16 15:26
441 查看
/**
 * Downloads the page at http://www.google.com, passes the response stream to
 * {@code pipe} (decoding it as UTF-8) and prints the returned text to
 * standard output.
 *
 * <p>Any exception raised while fetching or processing the page is reported
 * with a stack trace; nothing is rethrown.
 *
 * @param args command-line arguments (unused)
 */
public static void main(String[] args) {
    try {
        URL url = new URL("http://www.google.com");
        // url.openStream() opens its own connection, so no separate
        // URLConnection (nor setDoOutput, which is for request bodies) is needed.
        InputStream in = url.openStream();
        try {
            String content = pipe(in, "utf-8");
            System.out.println(content);
        } finally {
            // Make sure the network stream is released even when pipe() fails.
            in.close();
        }
    } catch (Exception e) {
        e.printStackTrace();
    }
}
/**
 * Reads {@code in} line by line, copies every non-empty line to the file
 * {@code ../index.html} (written as UTF-8) and returns those lines
 * concatenated into a single string.
 *
 * <p>Empty lines are skipped, and the returned string contains no line
 * separators between the lines that were read. The input stream and the
 * output file are closed before this method returns, whether it completes
 * normally or throws.
 *
 * @param in      stream to read from; closed by this method
 * @param charset name of the charset used to decode {@code in}; {@code null}
 *                or an empty string selects {@code "utf-8"}
 * @return all non-empty lines of the input, concatenated without separators
 * @throws IOException if the charset is unsupported, the output file cannot
 *                     be opened, or reading the input fails
 */
static String pipe(InputStream in, String charset) throws IOException {
    if (charset == null || "".equals(charset)) {
        charset = "utf-8";
    }
    StringBuilder content = new StringBuilder();
    FileOutputStream fo = null;
    PrintWriter pw = null;
    try {
        BufferedReader reader = new BufferedReader(new InputStreamReader(in, charset));
        fo = new FileOutputStream("../index.html");
        pw = new PrintWriter(new OutputStreamWriter(fo, "utf-8"));
        String line;
        while ((line = reader.readLine()) != null) {
            if (line.length() > 0) {
                content.append(line);
                pw.println(line);
            }
        }
    } finally {
        // Release both resources on every path, including failures.
        // PrintWriter.close() flushes and never throws, so the input stream
        // is always reached.
        if (pw != null) {
            pw.close();
        } else if (fo != null) {
            fo.close();
        }
        if (in != null) {
            in.close();
        }
    }
    return content.toString();
}
相关技术帖子:http://blog.sina.com.cn/gzwncb
try {
URL url = new URL("http://www.google.com");
URLConnection conn = url.openConnection();
conn.setDoOutput(true);
InputStream in = null;
in = url.openStream();
String content = pipe(in, "utf-8");
System.out.println(content);
} catch (Exception e) {
e.printStackTrace();
}
}
/**
 * Reads {@code in} line by line, copies every non-empty line to the file
 * {@code ../index.html} (written as UTF-8) and returns those lines
 * concatenated into a single string.
 *
 * <p>Empty lines are skipped, and the returned string contains no line
 * separators between the lines that were read. The input stream and the
 * output file are closed before this method returns, whether it completes
 * normally or throws.
 *
 * @param in      stream to read from; closed by this method
 * @param charset name of the charset used to decode {@code in}; {@code null}
 *                or an empty string selects {@code "utf-8"}
 * @return all non-empty lines of the input, concatenated without separators
 * @throws IOException if the charset is unsupported, the output file cannot
 *                     be opened, or reading the input fails
 */
static String pipe(InputStream in, String charset) throws IOException {
    if (charset == null || "".equals(charset)) {
        charset = "utf-8";
    }
    StringBuilder content = new StringBuilder();
    FileOutputStream fo = null;
    PrintWriter pw = null;
    try {
        BufferedReader reader = new BufferedReader(new InputStreamReader(in, charset));
        fo = new FileOutputStream("../index.html");
        pw = new PrintWriter(new OutputStreamWriter(fo, "utf-8"));
        String line;
        while ((line = reader.readLine()) != null) {
            if (line.length() > 0) {
                content.append(line);
                pw.println(line);
            }
        }
    } finally {
        // Release both resources on every path, including failures.
        // PrintWriter.close() flushes and never throws, so the input stream
        // is always reached.
        if (pw != null) {
            pw.close();
        } else if (fo != null) {
            fo.close();
        }
        if (in != null) {
            in.close();
        }
    }
    return content.toString();
}
相关技术帖子:http://blog.sina.com.cn/gzwncb
相关文章推荐
- java 抓取网页内容实现代码
- Java 通过 Socket 的形式抓取网页内容
- JAVA使用爬虫抓取网站网页内容的方法
- java 抓取 https 网页内容
- java网页抓取内容
- 网络爬虫Java实现抓取网页内容
- java抓取网页内容
- 【JAVA】 抓取网页内容
- java利用url实现网页内容的抓取
- java利用url实现网页内容的抓取
- 爬网入门:JAVA抓取网站网页内容
- java抓取网页指定元素/内容
- java-抓取指定URL网页的内容
- java利用url实现网页内容的抓取
- java爬虫(使用jsoup设置代理,抓取网页内容)
- paip.抓取网页内容--java php python
- java 抓取网页内容,可设定代理(HttpURLConnection)
- Java 抓取网页内容
- JAVA 抓取网页内容
- paip.抓取网页内容--java php python