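/*
 * NOTE(review): the non-ASCII text of this introduction was destroyed by an encoding error
 * (every such character became '?'). The summary below is reconstructed only from the ASCII
 * fragments that survived and from the code that follows; confirm it against the original article.
 *
 * This is a Java program that fetches web pages starting from a given home page (the rest of the original sentence is unrecoverable).
 * Parameter: private static int webDepth = 2;// depth setting.
 * The home page presumably counts as depth 1.     private int intThreadNum = 10;// number of threads.
 * While running, the program writes a report.txt file, and it also produces a fileindex.txt file (presumably an index of the saved page files).
 * The program uses multithreading (synchronized methods), generics, file I/O, the URL class and connections, the Hashtable class, and regular expressions with their related classes.
 * Command-line arguments: the first should be a valid URL string beginning with http://, used as the home page; the optional second should be a string convertible to int (one that Integer.parseInt(String s) accepts, e.g. 3), apparently the depth; when it is omitted, the default is 2.
 * Known limitations: only links written as href= href=' href=" followed by a url are handled (url handling in page source is complicated and can go wrong); other forms such as window.open(' are not handled, and exception handling is apparently minimal.
 * The source code follows (save it as GetWeb.java).
 */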

 

import java.io.File;
import java.io.BufferedReader;
import java.io.FileOutputStream;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.OutputStreamWriter;
import java.io.PrintWriter;
import java.net.URL;
import java.net.URLConnection;
import java.util.ArrayList;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.Hashtable;
public class GetWeb {
private int webDepth = 2;// ???????
private int intThreadNum = 10;// ?????
private String strHomePage = "";// ??????
private String myDomain;// ????
private String fPath = "web";// ????????????????
private ArrayList<String> arrUrls = new ArrayList<String>();// ?洢δ????URL
private ArrayList<String> arrUrl = new ArrayList<String>();// ?洢????URL??????????
private Hashtable<String?? Integer> allUrls = new Hashtable<String?? Integer>();// ?洢????URL???????
private Hashtable<String?? Integer> deepUrls = new Hashtable<String?? Integer>();// ?洢????URL???
private int intWebIndex = 0;// ??????????±???0???
private String charset = "GB2312";
private String report = "";
private long startTime;
private int webSuccessed = 0;
private int webFailed = 0;
/**
 * Creates a GetWeb instance for the given home page, leaving every other
 * field at its declared default.
 *
 * @param s home page string stored in {@code strHomePage}
 */
public GetWeb(String s) {
    strHomePage = s;
}
/**
 * Creates a GetWeb instance for the given home page with an explicit depth.
 *
 * @param s home page string stored in {@code strHomePage}
 * @param i value stored in {@code webDepth}, replacing its declared default
 */
public GetWeb(String s, int i) {
    this.strHomePage = s;
    this.webDepth = i;
}
/**
 * Adds one to the {@code webSuccessed} counter.
 * The method is {@code synchronized}, so the update runs while holding this
 * instance's monitor.
 */
public synchronized void addWebSuccessed() {
    webSuccessed += 1;
}
/**
 * Adds one to the {@code webFailed} counter.
 * The method is {@code synchronized}, so the update runs while holding this
 * instance's monitor.
 */
public synchronized void addWebFailed() {
    webFailed += 1;
}