package MainModel; import java.io.File; import java.io.IOException; import java.util.ArrayList; import java.util.HashMap; import org.jsoup.Jsoup; import org.jsoup.nodes.Document; import org.jsoup.select.Elements; import jxl.Workbook; import jxl.write.Label; import jxl.write.WritableSheet; import jxl.write.WritableWorkbook; import jxl.write.WriteException; import jxl.write.biff.RowsExceededException; public class Test { private static int intCounted = 0; static String strOutput = null; static HashMap> excelDataMap = new HashMap>(); static ArrayList titleData = new ArrayList(); static ArrayList linksData = new ArrayList(); //按照网页特征,判断页数,返回一个循环的次数(未知分页规律,暂时固定写死) private static int preGenerate() { return 8; } //处理的url,使其可以访问。 private static String genURL(String url){ intCounted++; return (intCounted > 0) ? url + new Integer(intCounted).toString() +".html" : url + ".html"; } public static void getExcelData(String commonUrl, String urlTail) { String url = commonUrl + urlTail; Document doc; while(intCounted