爬取网站记录,爬取动态生成网页,java爬取动态生成网页


        
        <dependency>
            <groupId>org.jsoup</groupId>
            <artifactId>jsoup</artifactId>
            <version>1.13.1</version>
        </dependency>
        
    public static void main(String[] args) throws Exception {
        Document document = Jsoup.connect("https://www.xbiquge.la/29/29770/14341237.html").get();
        Element body = document.body();
        String s = body.toString();
        s=s.substring(s.indexOf("
")); s=s.substring(0,s.indexOf("read4()")) .replaceAll(" ","") .replaceAll("
","") .replaceAll("\n","") .replaceAll(" ",""); while (s.length()>=51){ System.out.println(s.substring(0,50)); s=s.substring(50); System.out.println(); } System.out.println(s); }