Java 讀取網頁數據

package test;

import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.MalformedURLException;
import java.net.URL;
import java.net.URLConnection;

import com.sun.xml.internal.txw2.Document;

/**
 * Small utility that downloads the whois.asia lookup page for a query term,
 * strips the HTML markup from it and returns the text found between the
 * "CED" and "Nameservers" markers.
 */
public class tools {

    /** Base URL of the whois lookup; the URL-encoded query term is appended to it. */
    private static final String WHOIS_QUERY_URL =
            "http://whois.asia/cgi-bin/whois.cgi?whois_query_field=";

    /**
     * Charset name used to encode the query term and to decode the response.
     * NOTE(review): assumes the server answers in UTF-8 - confirm. The previous
     * code relied on the platform default charset, which varies between machines.
     */
    private static final String CHARSET = "UTF-8";

    /** Marker at which the extracted section starts (inclusive). */
    private static final String SECTION_START = "CED";

    /** Marker at which the extracted section ends (exclusive). */
    private static final String SECTION_END = "Nameservers";

    /**
     * Demo entry point: looks up "baidu" and prints the extracted text.
     *
     * @param args unused
     * @throws IOException if the page cannot be fetched or read
     */
    public static void main(String[] args) throws IOException {
        tools tool = new tools();
        String result = tool.getCEDContact("baidu");
        System.out.println(result);
    }

    /**
     * Strips markup from the downloaded page and extracts the wanted section.
     *
     * <p>Script blocks and all remaining tags are replaced by a space, then every
     * space character is removed. If the text contains "CED" followed later by
     * "Nameservers", only the part from "CED" up to (not including)
     * "Nameservers" is returned; otherwise the whole stripped text is returned.
     *
     * @param buffer raw page content, lines separated by '\n'
     * @return the extracted section, or the whole stripped text when the markers
     *         are not both present in that order
     */
    private String splitString(StringBuffer buffer) {
        // (?s) lets '.' match line breaks, so tags spanning several lines are
        // removed without the deeply recursive "(.|\n)+?" construct.
        // NOTE(review): the last replaceAll deletes every space, including the
        // ones inside the visible text - confirm this is the intended literal.
        String text = buffer.toString()
                .replaceAll("(?s)<script.+?</script>", " ")
                .replaceAll("(?s)<.+?>", " ")
                .replaceAll(" ", "");

        int start = text.indexOf(SECTION_START);
        if (start >= 0) {
            // Search for the end marker only after the start marker so that
            // substring() can never receive an end index below the start index.
            int end = text.indexOf(SECTION_END, start);
            if (end >= 0) {
                return text.substring(start, end);
            }
        }
        return text;
    }

    /**
     * Opens the given URL and wraps its response stream in a BufferedReader.
     * The caller is responsible for closing the returned reader.
     *
     * @param urlString address to open
     * @return reader over the response body, never null
     * @throws IOException if the URL is malformed or the connection cannot be
     *         opened (failures are propagated instead of being turned into a
     *         null result)
     */
    private BufferedReader getBuffer(String urlString) throws IOException {
        URL url = new URL(urlString);
        URLConnection conn = url.openConnection();
        return new BufferedReader(new InputStreamReader(conn.getInputStream(), CHARSET));
    }

    /**
     * Fetches the whois page for the given query term and returns the extracted
     * CED section.
     *
     * @param parm query term; it is URL-encoded before being appended to the
     *        lookup URL
     * @return the text produced by {@link #splitString(StringBuffer)} for the page
     * @throws IOException if the page cannot be fetched or read
     * @throws IllegalArgumentException if parm is null
     */
    protected String getCEDContact(String parm) throws IOException {
        if (parm == null) {
            throw new IllegalArgumentException("parm must not be null");
        }
        String urlString = WHOIS_QUERY_URL + java.net.URLEncoder.encode(parm, CHARSET);

        StringBuffer buffer = new StringBuffer();
        BufferedReader bufferedReader = getBuffer(urlString);
        try {
            String line;
            while ((line = bufferedReader.readLine()) != null) {
                // A real line feed is used as separator; the former "/n" text
                // marker collided with page content such as "/news".
                buffer.append(line).append('\n');
            }
        } finally {
            // Always release the connection, even when reading fails.
            bufferedReader.close();
        }
        return splitString(buffer);
    }
}
發佈了1 篇原創文章 · 獲贊 0 · 訪問量 1333
發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章