You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

30 lines
867 B

package crawler;
import org.jsoup.nodes.Document;
import org.jsoup.select.Elements;
/**
 * Crawler that reports the images found on a page.
 *
 * <p>Selects every {@code <img>} element that carries a {@code src} attribute from the
 * document returned by {@code getDocument()}, then prints the total number of matches and a
 * short preview of the first few image URLs to standard output.
 */
public class ImageCrawler extends BaseCrawler {

    /** Maximum number of image URLs printed in the preview list. */
    private static final int MAX_PREVIEW_IMAGES = 5;

    /**
     * Creates an image crawler for the given page.
     *
     * @param url page address, passed unchanged to the {@code BaseCrawler} constructor
     */
    public ImageCrawler(String url) {
        super(url);
    }

    /**
     * Fetches the document and prints an image summary.
     *
     * <p>Output goes to {@code System.out}: a banner, the crawled URL, the number of
     * {@code img[src]} elements, and up to {@value #MAX_PREVIEW_IMAGES} image URLs. Each URL
     * is printed in absolute form when jsoup can resolve it; otherwise the raw {@code src}
     * value is printed so the entry is never blank.
     *
     * <p>Any exception raised while fetching or processing is caught here and reported on
     * {@code System.err}; nothing is rethrown to the caller.
     */
    @Override
    public void crawl() {
        try {
            // getDocument() is defined outside this class (presumably in BaseCrawler).
            Document doc = getDocument();
            Elements imgs = doc.select("img[src]");

            System.out.println("\n===== 图片爬取完成 =====");
            // NOTE(review): `url` is not declared here; presumably a field inherited from BaseCrawler.
            System.out.println("URL:" + url);
            System.out.println("找到图片数量:" + imgs.size());

            int previewCount = Math.min(MAX_PREVIEW_IMAGES, imgs.size());
            for (int i = 0; i < previewCount; i++) {
                String src = imgs.get(i).attr("abs:src");
                if (src.isEmpty()) {
                    // "abs:" lookups yield "" when no absolute URL can be built; the selector
                    // guarantees a src attribute exists, so show its raw value instead.
                    src = imgs.get(i).attr("src");
                }
                System.out.println("图片" + (i + 1) + ":" + src);
            }
        } catch (Exception e) {
            // Best-effort crawl: report the failure and return normally.
            System.err.println("图片爬取失败:" + e.getMessage());
        }
    }
}