如题所述
// Load `url` in a headless HtmlUnit browser, give the page's JavaScript time to run,
// then print the rendered page text to stdout.
try {
    WebClient webClient = new WebClient(BrowserVersion.FIREFOX_24);
    try {
        // Configure the client: enable JavaScript, disable CSS, and do not throw on script errors.
        webClient.getOptions().setJavaScriptEnabled(true);
        webClient.getOptions().setCssEnabled(false);
        webClient.setAjaxController(new NicelyResynchronizingAjaxController());
        // Optional request timeout, left disabled as in the original:
        // webClient.getOptions().setTimeout(50000);
        webClient.getOptions().setThrowExceptionOnScriptError(false);

        // Simulate a browser opening the target URL.
        HtmlPage rootPage = webClient.getPage(url);

        System.out.println("为了获取js执行的数据 线程开始沉睡等待");
        // This pause is the key step: the page's JavaScript needs time to load and run
        // before the rendered text is read.
        Thread.sleep(3000);
        System.out.println("线程结束沉睡");

        String html = rootPage.asText();
        System.out.println(html);
    } finally {
        // Release the client's windows and background JavaScript threads even on failure.
        // NOTE(review): on HtmlUnit 2.16+ webClient.close() is the preferred call — confirm library version.
        webClient.closeAllWindows();
    }
} catch (InterruptedException e) {
    // Restore the interrupt flag so callers can still observe the interruption.
    Thread.currentThread().interrupt();
    System.err.println("Interrupted while waiting for JavaScript on " + url + ": " + e);
} catch (Exception e) {
    // Still best-effort (no rethrow), but report the failure instead of silently swallowing it.
    System.err.println("Failed to fetch or render " + url + ": " + e);
}
// Load `url` in a headless HtmlUnit browser, give the page's JavaScript time to run,
// then print the rendered page text to stdout.
// The opening `try {` was missing from this copy of the snippet and is restored here.
try {
    WebClient webClient = new WebClient(BrowserVersion.FIREFOX_24);
    try {
        // Configure the client: enable JavaScript, disable CSS, and do not throw on script errors.
        webClient.getOptions().setJavaScriptEnabled(true);
        webClient.getOptions().setCssEnabled(false);
        webClient.setAjaxController(new NicelyResynchronizingAjaxController());
        // Optional request timeout, left disabled as in the original:
        // webClient.getOptions().setTimeout(50000);
        webClient.getOptions().setThrowExceptionOnScriptError(false);

        // Simulate a browser opening the target URL.
        HtmlPage rootPage = webClient.getPage(url);

        System.out.println("为了获取js执行的数据 线程开始沉睡等待");
        // This pause is the key step: the page's JavaScript needs time to load and run
        // before the rendered text is read.
        Thread.sleep(3000);
        System.out.println("线程结束沉睡");

        String html = rootPage.asText();
        System.out.println(html);
    } finally {
        // Release the client's windows and background JavaScript threads even on failure.
        // NOTE(review): on HtmlUnit 2.16+ webClient.close() is the preferred call — confirm library version.
        webClient.closeAllWindows();
    }
} catch (InterruptedException e) {
    // Restore the interrupt flag so callers can still observe the interruption.
    Thread.currentThread().interrupt();
    System.err.println("Interrupted while waiting for JavaScript on " + url + ": " + e);
} catch (Exception e) {
    // Still best-effort (no rethrow), but report the failure instead of silently swallowing it.
    System.err.println("Failed to fetch or render " + url + ": " + e);
}
温馨提示:答案为网友推荐,仅供参考
第1个回答 2015-04-03
httpunit.jar ——> Java的网络爬虫包