// [java] Code library
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileWriter;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.safety.Whitelist;
/**
 * Downloads a run of consecutively numbered pages from www.xstxt.com and
 * appends the title and plain-text body of each page to one local text file.
 */
public class App {
    /** Base URL; the numeric page id is appended to it. */
    private static final String BASE_URL = "http://www.xstxt.com/fanrenxiuxianchuan/";

    /** Timeout passed to jsoup for each page request, in milliseconds. */
    private static final int TIMEOUT_MILLIS = 30000;

    /**
     * Number of characters dropped from the start and end of the HTML title.
     * NOTE(review): presumably site-specific boilerplate around the real title
     * - confirm against a live page.
     */
    private static final int TITLE_PREFIX_LENGTH = 6;
    private static final int TITLE_SUFFIX_LENGTH = 8;

    /** Id of the HTML element whose content is extracted. */
    private static final String BODY_ELEMENT_ID = "booktext";

    /** File that {@link #main(String[])} writes to. */
    private static final String OUTPUT_FILE = "z:/dd.txt";

    /** Id of the first page fetched by {@link #main(String[])}. */
    private static final int FIRST_PAGE_ID = 1071907;

    /** Number of consecutive page ids fetched by {@link #main(String[])}. */
    private static final int PAGE_COUNT = 1000;

    /**
     * The document fetched by the most recent {@link #getContent(int)} call.
     * Retained (and still assigned) only so existing code that reads this
     * field keeps working; {@code getContent} itself works on a local.
     */
    static Document doc;

    /**
     * Fetches the page with the given id and returns its trimmed title
     * immediately followed by the text of the {@code booktext} element.
     *
     * <p>All markup is stripped from the element, and every run of spaces
     * and/or newlines in the result is replaced by a single newline.
     *
     * @param id numeric page id appended to the base URL
     * @return the trimmed title concatenated with the cleaned body text
     * @throws IllegalStateException if the page has no {@code booktext} element
     * @throws Exception if the page cannot be fetched
     */
    public static String getContent(int id) throws Exception {
        String url = BASE_URL + id;
        Document page = Jsoup.connect(url).timeout(TIMEOUT_MILLIS).get();
        doc = page;

        // Strip the fixed prefix/suffix only when the title is long enough;
        // otherwise keep the title as-is instead of failing in substring().
        String title = page.title();
        int titleEnd = title.length() - TITLE_SUFFIX_LENGTH;
        if (titleEnd >= TITLE_PREFIX_LENGTH) {
            title = title.substring(TITLE_PREFIX_LENGTH, titleEnd);
        }

        // Only the element's string form is needed, so it is held as Object.
        Object bookText = page.getElementById(BODY_ELEMENT_ID);
        if (bookText == null) {
            throw new IllegalStateException(
                    "No element with id \"" + BODY_ELEMENT_ID + "\" at " + url);
        }

        String txt = Jsoup.clean(bookText.toString(), Whitelist.none());
        // One pass turns each run of spaces/newlines into one real newline.
        // (A replacement of "\\n" would insert the letter 'n', because a
        // backslash in a regex replacement string escapes the next character.)
        txt = txt.replaceAll("[ \n]+", "\n");
        return title + txt;
    }

    /**
     * Fetches {@code PAGE_COUNT} pages starting at {@code FIRST_PAGE_ID} and
     * writes them to {@code OUTPUT_FILE}, separated by a blank line. The loop
     * index is printed to standard output before each fetch.
     *
     * <p>NOTE(review): {@link FileWriter} is constructed without an explicit
     * charset, so the output encoding follows the platform default.
     *
     * @param args ignored
     * @throws Exception if a page cannot be fetched or the file cannot be
     *         written; pages written before the failure are still flushed
     */
    public static void main(String[] args) throws Exception {
        // try-with-resources closes (and flushes) the writer even when a
        // fetch fails part-way through the run.
        try (BufferedWriter bw = new BufferedWriter(new FileWriter(OUTPUT_FILE))) {
            for (int i = 0; i < PAGE_COUNT; i++) {
                System.out.println(i);
                bw.write(getContent(FIRST_PAGE_ID + i));
                bw.write("\n\n");
            }
        }
    }
}
// Source code snippet from YunCode: http://yuncode.net