基本信息
源码名称:jsoup采集必应壁纸 示例源码
源码大小:0.02M
文件格式:.zip
开发语言:Java
更新时间:2019-03-23
   友情提示:(无需注册或充值,赞助后即可获取资源下载链接)

     嘿,亲!知识可是无价之宝呢,但咱这精心整理的资料也耗费了不少心血呀。小小地破费一下,绝对物超所值哦!如有下载和支付问题,请联系我们QQ(微信同号):813200300

本次赞助数额为: 2 元 
   源码介绍

采集地址为 https://bing.ioliu.cn/


采集后的结果在这里


import org.jsoup.Connection;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import javax.net.ssl.*;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.net.URL;
import java.net.URLConnection;
import java.security.SecureRandom;
import java.security.cert.X509Certificate;
import java.util.*;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;

public class Main {

    public static String myURL = "https://bing.ioliu.cn/";
    public static String filePath = "D:\\bingPicture\\";

    // 安全证书 信任所有站点
    public static InputStream getByDisableCertValidation(String url) {
        System.out.println("正在获取网站安全证书,请稍等....");
        TrustManager[] trustAllCerts = new TrustManager[]{new X509TrustManager() {
            public X509Certificate[] getAcceptedIssuers() {
                return new X509Certificate[0];
            }

            public void checkClientTrusted(X509Certificate[] certs, String authType) {
            }

            public void checkServerTrusted(X509Certificate[] certs, String authType) {
            }
        }};

        HostnameVerifier hv = new HostnameVerifier() {
            public boolean verify(String hostname, SSLSession session) {
                return true;
            }
        };

        try {
            SSLContext sc = SSLContext.getInstance("SSL");
            sc.init(null, trustAllCerts, new SecureRandom());
            HttpsURLConnection.setDefaultSSLSocketFactory(sc.getSocketFactory());
            HttpsURLConnection.setDefaultHostnameVerifier(hv);

            URL uRL = new URL(url);
            HttpsURLConnection urlConnection = (HttpsURLConnection) uRL.openConnection();
            InputStream is = urlConnection.getInputStream();
            return is;
        } catch (Exception e) {
        }
        return null;
    }

    // 输出流
    public static void readInputStream(InputStream inStream, String path)
            throws Exception {
        File file = new File(path);
        FileOutputStream fos = new FileOutputStream(file);
        byte[] buffer = new byte[102400];
        int len = 0;
        while ((len = inStream.read(buffer)) != -1) {
            fos.write(buffer, 0, len);
        }
        inStream.close();
        fos.flush();
        fos.close();
    }

    // 文件夹是否存在
    public boolean fileIfExists(String path){
        File f=new File(path);
        if(f.exists()){
            return true;
        }else{
            f.mkdir();
            return false;
        }
    }

    // 请求页面
    public Connection getCollection(String url) {
        getByDisableCertValidation(url);
        Connection conn = null;
        Map<String, String> map = new HashMap<>();
        map.put("Accept", "text/html,application/xhtml xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8");
        map.put("Accept-Encoding", "gzip, deflate, br");
        map.put("Referer", "https://bing.ioliu.cn/ranking");
        conn = Jsoup.connect(url)
                .userAgent("Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36") // http请求的浏览器设置
                .timeout(5000)   // http连接时长
                .headers(map)
                .method(Connection.Method.POST);
        // 请求类型是get请求,http请求还是post,delete等方式
        return conn;
    }

    public static void main(String[] args) {
        Scanner s = new Scanner(System.in);
        System.out.println("请输入页数:");
        int pageNum = s.nextInt();
        Main main = new Main();
        Connection conn = main.getCollection(myURL   "?p="   pageNum);
        Document doc = null;
        try {
            doc = conn.get();
        } catch (IOException e1) {
            System.out.println("在连接官网时报错。。");
        }
        if (!main.fileIfExists(filePath)) {
            System.out.println("文件夹不存在,创建了一个指定目录的文件夹...");
        }
        Element body = doc.body();
        Elements lis = body.getElementsByClass("progressive__img progressive--not-loaded");
        final Map<String, String> urlMap = new HashMap<>();

        int i = 0;
        for (Element a : lis) {
            urlMap.put("url"   i, a.attr("data-progressive").replace("800x480", "1920x1080"));
            i  ;
        }
        ExecutorService pool = Executors.newCachedThreadPool(); //创建一个可缓存线程池,如果线程池长度超过处理需要,可灵活回收空闲线程,若无可回收,则新建线程。
        for (int j = 0; j < urlMap.size(); j  ) {
            final int finalJ = j;
            Runnable run = new Runnable() { // 使用多线程
                public void run() {
                    String imgUrl = urlMap.get("url"   finalJ).toString();
                    try {
                        URL url = new URL(imgUrl);
                        URLConnection con = url.openConnection();
                        con.setConnectTimeout(5000);
                        con.setRequestProperty("User-Agent", "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36");
                        InputStream inStream = con.getInputStream();
                        readInputStream(inStream, filePath   System.currentTimeMillis()   ".jpg");
                        System.out.println(imgUrl   "  下载成功");
                    } catch (Exception e) {
                        System.out.println(imgUrl   "  下载失败!!!");
                    }
                }
            };
            pool.execute(run);
        }
        pool.shutdown();


    }
}