使用 jsoup 编写简单的爬虫来爬取图片

本文转载自：查看原文 · 2015-12-01 16:23 · 3092 · 标签：爬虫 / java / 图片


package com.guanglan.util;

import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.net.URL;
import java.net.URLConnection;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;


public class DownLoadPic {

  public void getDoc() throws IOException{

　　File f = new File("E://imgs");

　　　　　　if(!f.exists()){

　　　　　　 f.mkdirs();

　　　　　　}
　　　　//以网易为例子

 Document doc = Jsoup.connect("http://www.163.com/").get(); //获取后缀为png和jpg的图片的元素集合 Elements pngs = doc.select("img[src~=(?i)\\.(png|jpe?g)]"); //遍历元素 for(Element e : pngs){ String src=e.attr("src");//获取img中的src路径 //获取后缀名 String imageName = src.substring(src.lastIndexOf("/") + 1,src.length()); //连接url URL url = new URL(src); URLConnection uri=url.openConnection(); //获取数据流 InputStream is=uri.getInputStream(); //写入数据流 OutputStream os = new FileOutputStream(new File("E://imgs", imageName)); 

　　byte[] buf = new byte[1024]; 

　　int l=0; 

　　while((l=is.read(buf))!=-1){

　　　　　　os.write(buf, 0, l); 
　　　　} 
　　}
}
 public static void main(String[] args) throws IOException { 

　　　　new DownLoadPic().getDoc(); //调用方法 

 　　} 
}

使用之前请注意先导入 jsoup 相关的 jar 包。

免责声明！

本站转载的文章为个人学习借鉴使用，本站对版权不负任何法律责任。如果侵犯了您的隐私权益，请联系本站邮箱yoyou2525@163.com删除。

猜您在找：

- jsoup爬取图片到本地
- python 使用for循环简单爬取图片（1）
- 使用Scrapy爬虫框架简单爬取图片并保存本地（妹子图）
- C#简单爬虫爬取图片并保存本地
- 简单的python爬虫教程：批量爬取图片
- python爬虫（爬取图片）
- scrapy爬虫，爬取图片
- python网络爬虫之使用scrapy爬取图片
- 爬虫---Beautiful Soup 爬取图片
- python网络爬虫之爬取图片