求教:怎么用httpClient得到网页中的数据 有一个网页显示的是一支股票的当前信息,怎么用httpClient得到这个数据,而不是得到这个网页的代码 解决方案 » 免费领取超大流量手机卡,每月29元包185G流量+100分钟通话, 中国电信官方发货 用httpclient只能获取网页的html代码,要想得到你想要的数据就得做进一步的处理,需要用到正则表达式 具体是这样的,我需要从http://hq.sinajs.cn/list=s_sh600058里面得到股票信息,使用httpClient去拿到这些数据,并且存储在本地。该怎么做呢?很迷茫啊!谢谢大家 package com.oop.test;import java.io.File;import java.io.FileWriter;import java.io.IOException;import java.io.PrintWriter;public class Test1 { private static String getStaticPage(String surl) { String htmlContent = ""; try { java.io.InputStream inputStream; java.net.URL url = new java.net.URL(surl); java.net.HttpURLConnection connection = (java.net.HttpURLConnection) url .openConnection(); connection.connect(); inputStream = connection.getInputStream(); byte[] bytes = new byte[1024 * 2000]; int index = 0; int count = inputStream.read(bytes, index, 1024 * 2000); while (count != -1) { index += count; count = inputStream.read(bytes, index, 1); } htmlContent = new String(bytes, "UTF-8"); connection.disconnect(); } catch (Exception ex) { ex.printStackTrace(); } return htmlContent.trim(); } public static void main(String[] args) { try { String src = getStaticPage("http://www.google.com"); File file = new File("d:\\aa.html"); FileWriter resultFile = new FileWriter(file); PrintWriter myFile = new PrintWriter(resultFile);// 写文件 myFile.println(src); resultFile.close(); myFile.close(); } catch (IOException e) { // TODO Auto-generated catch block e.printStackTrace(); } }} import java.io.IOException;import org.jsoup.Jsoup;import org.jsoup.nodes.Document;import org.jsoup.nodes.Element;import org.jsoup.select.Elements;public class Jsoup01 { public static void main(String[] args) { String getUrl = "http://www.epzw.com/files/article/topmonthvisit/0/1.htm"; String g1 = ".grid > tbody > tr > td > strong > a"; String g2 = "abs:href"; try { Document doc = Jsoup.connect(getUrl).timeout(60000).get(); Elements links = doc.select(g1); for (Element link : links) { String bookURL = link.attr(g2); String 
bookTitle=link.text(); System.out.println(bookURL+" "+bookTitle); } } catch (IOException e) { e.printStackTrace(); } }} Jsp中session的生命周期 (急)servlet处理jsp的请求问题,希望大家多多帮忙! jsp编码问题 和 tcp数据丢失问题 为什么我在Eclipse里编辑jsp页面时一加双引号光标就乱跳? 求助!地址栏传递参数的问题 Truncated class file错误 初涉struts,遭遇困难,帮忙,在线 int怎样转换成String? [问题]图片为什么无法显示?(resin) 怎样获得新插入记录的默认字段值? 新的需求。不知道该如何做啊。求高手 三级联动省市县
package com.oop.test;import java.io.File;
import java.io.FileWriter;
import java.io.IOException;
import java.io.PrintWriter;

/**
 * Downloads a web page over HTTP and stores its text in a local file.
 */
public class Test1 {

    /** Size, in bytes, of the chunk buffer used while draining the response stream. */
    private static final int BUFFER_SIZE = 8192;

    /**
     * Fetches the body of the given HTTP URL and decodes it as UTF-8.
     *
     * <p>The body is accumulated in a growable buffer, so responses of any
     * length are read completely, and only the bytes actually received are
     * decoded.
     *
     * @param surl absolute HTTP URL of the page to download
     * @return the response body with leading and trailing whitespace removed,
     *         or an empty string if the URL is invalid or the download fails
     */
    private static String getStaticPage(String surl) {
        String htmlContent = "";
        java.net.HttpURLConnection connection = null;
        try {
            java.net.URL url = new java.net.URL(surl);
            connection = (java.net.HttpURLConnection) url.openConnection();
            connection.connect();
            // try-with-resources closes the stream even when a read fails.
            try (java.io.InputStream inputStream = connection.getInputStream()) {
                java.io.ByteArrayOutputStream body = new java.io.ByteArrayOutputStream();
                byte[] chunk = new byte[BUFFER_SIZE];
                int count;
                while ((count = inputStream.read(chunk)) != -1) {
                    body.write(chunk, 0, count);
                }
                htmlContent = new String(body.toByteArray(),
                        java.nio.charset.StandardCharsets.UTF_8);
            }
        } catch (IOException | RuntimeException ex) {
            // Best effort: report the failure and fall through to return "".
            // RuntimeException covers a non-HTTP URL (ClassCastException on the cast).
            ex.printStackTrace();
        } finally {
            if (connection != null) {
                connection.disconnect();
            }
        }
        return htmlContent.trim();
    }

    /**
     * Downloads a fixed page and writes its text to {@code d:\aa.html}.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        String src = getStaticPage("http://www.google.com");
        File file = new File("d:\\aa.html");
        // Write the file as UTF-8, matching the charset used to decode the page.
        try (PrintWriter myFile = new PrintWriter(new java.io.OutputStreamWriter(
                new java.io.FileOutputStream(file),
                java.nio.charset.StandardCharsets.UTF_8))) {
            myFile.println(src);
            // PrintWriter swallows I/O errors; surface them explicitly.
            if (myFile.checkError()) {
                throw new IOException("Failed to write " + file);
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}
import java.io.IOException;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

/**
 * Fetches a fixed page with jsoup and prints, for every anchor matched by a
 * CSS selector, the value of its {@code abs:href} attribute followed by its text.
 */
public class Jsoup01 {

    /**
     * Downloads the page, selects the matching anchors and prints one
     * "URL title" line per anchor to standard output. An {@link IOException}
     * raised while fetching is reported via its stack trace.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        final String pageAddress = "http://www.epzw.com/files/article/topmonthvisit/0/1.htm";
        final String anchorSelector = ".grid > tbody > tr > td > strong > a";
        final String hrefKey = "abs:href";

        try {
            // 60000 is the timeout value passed to jsoup's connection.
            Document page = Jsoup.connect(pageAddress).timeout(60000).get();
            Elements anchors = page.select(anchorSelector);
            for (int i = 0; i < anchors.size(); i++) {
                Element anchor = anchors.get(i);
                String target = anchor.attr(hrefKey);
                String caption = anchor.text();
                System.out.println(target + " " + caption);
            }
        } catch (IOException fetchFailure) {
            fetchFailure.printStackTrace();
        }
    }
}