You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
30 lines
867 B
30 lines
867 B
package crawler;
|
|
|
|
import org.jsoup.nodes.Document;
|
|
import org.jsoup.select.Elements;
|
|
|
|
public class ImageCrawler extends BaseCrawler {
|
|
|
|
public ImageCrawler(String url) {
|
|
super(url);
|
|
}
|
|
|
|
@Override
|
|
public void crawl() {
|
|
try {
|
|
Document doc = getDocument();
|
|
Elements imgs = doc.select("img[src]");
|
|
|
|
System.out.println("\n===== 图片爬取完成 =====");
|
|
System.out.println("URL:" + url);
|
|
System.out.println("找到图片数量:" + imgs.size());
|
|
|
|
for (int i = 0; i < Math.min(5, imgs.size()); i++) {
|
|
String src = imgs.get(i).attr("abs:src");
|
|
System.out.println("图片" + (i + 1) + ":" + src);
|
|
}
|
|
} catch (Exception e) {
|
|
System.err.println("图片爬取失败:" + e.getMessage());
|
|
}
|
|
}
|
|
}
|