81,115
社区成员
发帖
与我相关
我的任务
分享
package com.dyb.url;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import org.htmlparser.Parser;
import org.htmlparser.beans.StringBean;
import org.htmlparser.util.ParserException;
import org.htmlparser.visitors.HtmlPage;
/**
 * Demo that downloads a Baidu Tieba thread page and prints its title and its
 * text content using the HTMLParser library.
 */
public class ReadUrl {

    /** Page fetched by {@link #main(String[])} and {@link #getContent()}. */
    private static final String PAGE_URL = "http://tieba.baidu.com/p/1347940189";

    /** Encoding passed to the HTML parser; also used to decode the download in main. */
    private static final String PAGE_CHARSET = "GBK";

    /**
     * Downloads the resource at {@code urlString} and returns it as text,
     * decoded with the platform default charset.
     *
     * @param urlString URL to fetch; it is opened as an {@link HttpURLConnection}
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString) {
        return getHtml(urlString, null);
    }

    /**
     * Downloads the resource at {@code urlString} and decodes it with the given charset.
     *
     * @param urlString   URL to fetch; it is opened as an {@link HttpURLConnection}
     * @param charsetName name of the charset used to decode the response, or
     *                    {@code null} for the platform default
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString, String charsetName) {
        BufferedReader reader = null;
        try {
            // Resolve the charset before opening any stream so that a bad name
            // cannot leave an open connection behind.
            java.nio.charset.Charset charset = (charsetName == null)
                    ? java.nio.charset.Charset.defaultCharset()
                    : java.nio.charset.Charset.forName(charsetName);
            URL url = new URL(urlString);
            HttpURLConnection conn = (HttpURLConnection) url.openConnection();
            reader = new BufferedReader(new InputStreamReader(conn.getInputStream(), charset));
            StringBuilder html = new StringBuilder();
            for (String line = reader.readLine(); line != null; line = reader.readLine()) {
                html.append(line).append('\n');
            }
            return html.toString();
        } catch (Exception e) {
            // Callers rely on null as the failure signal, so every failure is
            // reported here and mapped to null.
            e.printStackTrace();
            return null;
        } finally {
            // Close on both the success and the failure path; closing the
            // BufferedReader also closes the wrapped stream.
            if (reader != null) {
                try {
                    reader.close();
                } catch (Exception ignored) {
                    // Nothing useful can be done if close itself fails.
                }
            }
        }
    }

    /**
     * Downloads the demo page, parses it, then prints the page title followed
     * by the text returned by {@link #getContent()}.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        String htmlcode = ReadUrl.getHtml(PAGE_URL, PAGE_CHARSET);
        if (htmlcode == null) {
            // getHtml already printed the cause; do not hand null to the parser.
            System.err.println("Could not download " + PAGE_URL);
            return;
        }
        Parser parser = Parser.createParser(htmlcode, PAGE_CHARSET);
        HtmlPage page = new HtmlPage(parser);
        try {
            parser.visitAllNodesWith(page);
        } catch (ParserException e) {
            // Report the failure instead of discarding it; whatever was
            // collected before the error is still printed below.
            e.printStackTrace();
        }
        // Show the title
        System.out.println(page.getTitle());
        // Show the text
        System.out.println(getContent());
    }

    /**
     * Creates a {@link StringBean} with links, collapse and
     * replace-non-breaking-spaces switched on, points it at the demo page and
     * returns the result of {@code getStrings()}.
     *
     * @return whatever the bean's {@code getStrings()} returns for the demo page
     */
    private static String getContent() {
        StringBean sBean = new StringBean();
        sBean.setLinks(true);
        sBean.setCollapse(true);
        sBean.setReplaceNonBreakingSpaces(true);
        sBean.setURL(PAGE_URL);
        return sBean.getStrings();
    }
}
package com.dyb.url;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import org.htmlparser.Parser;
import org.htmlparser.beans.StringBean;
import org.htmlparser.util.ParserException;
import org.htmlparser.visitors.HtmlPage;
/**
 * Demo that downloads a Baidu Tieba thread page and prints its title and its
 * text content using the HTMLParser library.
 */
public class ReadUrl {

    /** Page fetched by {@link #main(String[])} and {@link #getContent()}. */
    private static final String PAGE_URL = "http://tieba.baidu.com/p/1347940189";

    /** Encoding passed to the HTML parser; also used to decode the download in main. */
    private static final String PAGE_CHARSET = "GBK";

    /**
     * Downloads the resource at {@code urlString} and returns it as text,
     * decoded with the platform default charset.
     *
     * @param urlString URL to fetch; it is opened as an {@link HttpURLConnection}
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString) {
        return getHtml(urlString, null);
    }

    /**
     * Downloads the resource at {@code urlString} and decodes it with the given charset.
     *
     * @param urlString   URL to fetch; it is opened as an {@link HttpURLConnection}
     * @param charsetName name of the charset used to decode the response, or
     *                    {@code null} for the platform default
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString, String charsetName) {
        BufferedReader reader = null;
        try {
            // Resolve the charset before opening any stream so that a bad name
            // cannot leave an open connection behind.
            java.nio.charset.Charset charset = (charsetName == null)
                    ? java.nio.charset.Charset.defaultCharset()
                    : java.nio.charset.Charset.forName(charsetName);
            URL url = new URL(urlString);
            HttpURLConnection conn = (HttpURLConnection) url.openConnection();
            reader = new BufferedReader(new InputStreamReader(conn.getInputStream(), charset));
            StringBuilder html = new StringBuilder();
            for (String line = reader.readLine(); line != null; line = reader.readLine()) {
                html.append(line).append('\n');
            }
            return html.toString();
        } catch (Exception e) {
            // Callers rely on null as the failure signal, so every failure is
            // reported here and mapped to null.
            e.printStackTrace();
            return null;
        } finally {
            // Close on both the success and the failure path; closing the
            // BufferedReader also closes the wrapped stream.
            if (reader != null) {
                try {
                    reader.close();
                } catch (Exception ignored) {
                    // Nothing useful can be done if close itself fails.
                }
            }
        }
    }

    /**
     * Downloads the demo page, parses it, then prints the page title followed
     * by the text returned by {@link #getContent()}.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        String htmlcode = ReadUrl.getHtml(PAGE_URL, PAGE_CHARSET);
        if (htmlcode == null) {
            // getHtml already printed the cause; do not hand null to the parser.
            System.err.println("Could not download " + PAGE_URL);
            return;
        }
        Parser parser = Parser.createParser(htmlcode, PAGE_CHARSET);
        HtmlPage page = new HtmlPage(parser);
        try {
            parser.visitAllNodesWith(page);
        } catch (ParserException e) {
            // Report the failure instead of discarding it; whatever was
            // collected before the error is still printed below.
            e.printStackTrace();
        }
        // Show the title
        System.out.println(page.getTitle());
        // Show the text
        System.out.println(getContent());
    }

    /**
     * Creates a {@link StringBean} with links, collapse and
     * replace-non-breaking-spaces switched on, points it at the demo page and
     * returns the result of {@code getStrings()}.
     *
     * @return whatever the bean's {@code getStrings()} returns for the demo page
     */
    private static String getContent() {
        StringBean sBean = new StringBean();
        sBean.setLinks(true);
        sBean.setCollapse(true);
        sBean.setReplaceNonBreakingSpaces(true);
        sBean.setURL(PAGE_URL);
        return sBean.getStrings();
    }
}
/**
 * Downloads the demo page with {@code ReadUrl.getHtml}, parses it, then prints
 * the page title followed by the text returned by {@code getContent()}.
 *
 * @param args unused
 */
public static void main(String[] args) {
    final String pageUrl = "http://tieba.baidu.com/p/1347940189";
    String htmlcode = ReadUrl.getHtml(pageUrl);
    if (htmlcode == null) {
        // getHtml returns null on failure; do not hand null to the parser.
        System.err.println("Could not download " + pageUrl);
        return;
    }
    Parser parser = Parser.createParser(htmlcode, "GBK");
    HtmlPage page = new HtmlPage(parser);
    try {
        parser.visitAllNodesWith(page);
    } catch (ParserException e) {
        // Report the failure instead of discarding it; whatever was collected
        // before the error is still printed below.
        e.printStackTrace();
    }
    // Show the title
    System.out.println(page.getTitle());
    // Show the text
    System.out.println(getContent());
}
/**
 * Creates a StringBean with links, collapse and replace-non-breaking-spaces
 * switched on, points it at the demo page and returns the result of
 * getStrings().
 *
 * @return whatever the bean's getStrings() returns for the demo page
 */
private static String getContent() {
    final String pageUrl = "http://tieba.baidu.com/p/1347940189";
    StringBean extractor = new StringBean();
    extractor.setLinks(true);
    extractor.setCollapse(true);
    extractor.setReplaceNonBreakingSpaces(true);
    // The URL is assigned only after the options above, in the original order.
    extractor.setURL(pageUrl);
    String text = extractor.getStrings();
    return text;
}
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
/**
 * Utility for downloading the text of a web page over HTTP.
 */
public class URLUtil {

    /**
     * Downloads the resource at {@code urlString} and returns it as text,
     * decoded with the platform default charset.
     *
     * @param urlString URL to fetch; it is opened as an {@link HttpURLConnection}
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString) {
        return getHtml(urlString, null);
    }

    /**
     * Downloads the resource at {@code urlString} and decodes it with the given charset.
     *
     * @param urlString   URL to fetch; it is opened as an {@link HttpURLConnection}
     * @param charsetName name of the charset used to decode the response, or
     *                    {@code null} for the platform default
     * @return the body with every line terminated by {@code "\n"}, or
     *         {@code null} if anything goes wrong (the stack trace is printed)
     */
    public static String getHtml(String urlString, String charsetName) {
        BufferedReader reader = null;
        try {
            // Resolve the charset before opening any stream so that a bad name
            // cannot leave an open connection behind.
            java.nio.charset.Charset charset = (charsetName == null)
                    ? java.nio.charset.Charset.defaultCharset()
                    : java.nio.charset.Charset.forName(charsetName);
            URL url = new URL(urlString);
            HttpURLConnection conn = (HttpURLConnection) url.openConnection();
            reader = new BufferedReader(new InputStreamReader(conn.getInputStream(), charset));
            StringBuilder html = new StringBuilder();
            for (String line = reader.readLine(); line != null; line = reader.readLine()) {
                html.append(line).append('\n');
            }
            return html.toString();
        } catch (Exception e) {
            // Callers rely on null as the failure signal, so every failure is
            // reported here and mapped to null.
            e.printStackTrace();
            return null;
        } finally {
            // Close on both the success and the failure path; closing the
            // BufferedReader also closes the wrapped stream.
            if (reader != null) {
                try {
                    reader.close();
                } catch (Exception ignored) {
                    // Nothing useful can be done if close itself fails.
                }
            }
        }
    }

    /**
     * Fetches a sample page and prints the result (prints {@code null} if the
     * download failed).
     *
     * @param args unused
     */
    public static void main(String[] args) {
        System.out.println(URLUtil.getHtml("http://www.fastunit.com"));
    }
}