List <HtmlElement> ips = null ;
List <HtmlElement> ports = null ;
ArrayList <String> proxies = new ArrayList();
HtmlPage page = null;
String baseUrl = "http://www.freeproxylists.net/" ;
WebClient client;
try{
client = new WebClient();
client.getOptions().setJavaScriptEnabled(false);
page = client.getPage(baseUrl);
ips = page.getByXPath("//table[@class='DataGrid']/tbody/tr/td[position()=1]/text()");
ports = page.getByXPath("//table[@class='DataGrid']/tbody/tr/td[position()=2]/text()");
for(int i=0;i<ips.size();i++){
proxies.add(ips.get(i)+":"+ports.get(i));
System.out.println(ips.get(i)+":"+ports.get(i));
}
}
catch(Exception e){
System.out.println(e);
}对我错误的代码缩进表示抱歉,无论如何,我试图从站点中刮取代理,我收到了以下警告:
mag 20,2018年4:04:56 PM com.gargoylesoftware.htmlunit.DefaultCssErrorHandler错误AVVERTENZA: CSS错误:'http://www.freeproxylists.net/grid.css‘1:1规则错误。(无效令牌"<“)。期待:,,".",":",“,,,……)mag 20,2018年4:04:56 PM com.gargoylesoftware.htmlunit.DefaultCssErrorHandler警告AVVERTENZA: CSS警告:'http://www.freeproxylists.net/grid.css‘1:1无视整个规则。mag 20,2018年4:04:56 PM com.gargoylesoftware.htmlunit.DefaultCssErrorHandler错误AVVERTENZA: CSS错误:'http://www.freeproxylists.net/grid.css‘45:1规则错误。(无效令牌"<“)。期待:,,".",":","","[",,,……)mag 20,2018年4:04:56 PM com.gargoylesoftware.htmlunit.DefaultCssErrorHandler警告AVVERTENZA: CSS警告:'http://www.freeproxylists.net/grid.css‘45:1无视整个规则。
,我怎样才能解决这个问题?
发布于 2018-05-23 18:43:12
您可以简单地将WebClient使用的WebClient替换为SilentCssErrorHandler。
HtmlUnit 常见问题页面有一个简短的示例。
https://stackoverflow.com/questions/50435645
复制相似问题