1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54
| import java.io.BufferedReader; import java.io.FileReader; import java.io.IOException; import org.jsoup.Jsoup; import org.jsoup.nodes.Document; import org.jsoup.select.Elements; public class JsoupTest {
/**
 * Reads a text file (intended for HTML) into a single string.
 *
 * <p>The file is decoded as UTF-8 regardless of the platform default charset, so the
 * result is the same on every machine. Each line is followed by a single {@code '\n'}:
 * line terminators in the file ({@code \n}, {@code \r\n}, {@code \r}) are normalized, and
 * the separator is kept so that markup split across lines (for example a tag name on one
 * line and its attributes on the next) is not glued together.
 *
 * <p>This method is best-effort: if the file cannot be opened or an I/O error occurs
 * while reading, the stack trace is printed and whatever was read so far (possibly the
 * empty string) is returned.
 *
 * @param path path of the file to read
 * @return the file content with {@code '\n'} after every line; empty if nothing was read
 */
public static String readHtml(String path) {
    StringBuilder html = new StringBuilder();
    // Fully-qualified names are used for the stream/charset types so that this method
    // does not depend on imports beyond the ones the file already declares.
    try (BufferedReader br = new BufferedReader(
            new java.io.InputStreamReader(
                    new java.io.FileInputStream(path),
                    java.nio.charset.StandardCharsets.UTF_8))) {
        String line;
        while ((line = br.readLine()) != null) {
            // readLine() strips the terminator; put a separator back so adjacent
            // lines do not fuse into one token.
            html.append(line).append('\n');
        }
    } catch (IOException e) {
        // Deliberate best-effort: report the problem and return what we have.
        e.printStackTrace();
    }
    return html.toString();
}
/**
 * Entry point: loads the HTML file at {@code D:\index.html}, parses it with jsoup and
 * prints the text of the {@code h1} elements that are direct children of
 * {@code .title_area} elements found within {@code .content_18313} elements.
 *
 * <p>Any exception raised while reading, parsing or selecting is caught and its stack
 * trace is printed.
 *
 * @param args command-line arguments (not used)
 */
public static void main(String[] args) {
    try {
        String source = readHtml("D:\\index.html");
        Document page = Jsoup.parse(source);

        // Narrow to the content container first, then pick the heading inside it.
        Elements heading = page.select(".content_18313").select(".title_area>h1");

        String headingText = heading.text();
        System.out.println("打印最终结果:" + headingText);
    } catch (Exception e) {
        e.printStackTrace();
    }
}
}
|