爬虫工具类

该爬虫工具类基于 HttpClient 封装了 HttpGet 请求和连接池,并统一完成请求参数配置与连接池配置。

/**
 * Crawler helper that issues HTTP GET requests through a pooled Apache HttpClient.
 *
 * <p>One connection pool and one client are created per instance and reused for
 * every request. Both public methods report failure by returning an empty string
 * rather than throwing for I/O problems.
 */
@Component
public class HttpGetUtil {
    /** Directory (with trailing separator) that downloaded images are written into. */
    private static final String IMAGE_DIR = "C:\\Users\\86158\\Desktop\\京东图片\\";

    /**
     * Request configuration shared by every request: 1000 ms to establish a connection,
     * 500 ms to lease a connection from the pool, 10000 ms socket (read) timeout.
     */
    private static final RequestConfig REQUEST_CONFIG = RequestConfig.custom()
            .setConnectTimeout(1000)
            .setConnectionRequestTimeout(500)
            .setSocketTimeout(100 * 100)
            .build();

    private final PoolingHttpClientConnectionManager manager;

    /** Single client bound to {@link #manager}; built once instead of once per request. */
    private final CloseableHttpClient httpClient;

    /** Creates the connection pool (10 connections per route, 100 in total) and the client using it. */
    public HttpGetUtil() {
        this.manager = new PoolingHttpClientConnectionManager();
        this.manager.setDefaultMaxPerRoute(10);
        this.manager.setMaxTotal(100);
        this.httpClient = HttpClients.custom().setConnectionManager(this.manager).build();
    }

    /**
     * Fetches the body of {@code url} as text.
     *
     * @param url address to request
     * @return the response body when the status code is 200 and a body is present;
     *         an empty string for a null/empty URL, any other status, a missing body,
     *         or an I/O failure
     */
    public String doGetHtml(String url) {
        if (url == null || url.isEmpty()) {
            return "";
        }
        HttpGet httpGet = new HttpGet(url);
        httpGet.setConfig(REQUEST_CONFIG);

        // try-with-resources closes the response (and releases its connection) on every path.
        try (CloseableHttpResponse response = httpClient.execute(httpGet)) {
            if (response.getStatusLine().getStatusCode() == 200 && response.getEntity() != null) {
                // "UTF-8" is only the fallback used when the response does not declare a charset;
                // without it the library falls back to ISO-8859-1 and garbles non-Latin pages.
                return EntityUtils.toString(response.getEntity(), "UTF-8");
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
        return "";
    }

    /**
     * Downloads the resource at {@code url} into the image directory under a random file name.
     *
     * <p>The file name is a random UUID followed by the extension taken from the URL path
     * (no extension when the path has none).
     *
     * @param url address of the image
     * @return the generated file name (not the full path) on success; an empty string for a
     *         null/empty URL, a non-200 status, a missing body, or an I/O failure
     */
    public String doGetImage(String url) {
        if (url == null || url.isEmpty()) {
            return "";
        }
        HttpGet httpGet = new HttpGet(url);
        httpGet.setConfig(REQUEST_CONFIG);

        try (CloseableHttpResponse response = httpClient.execute(httpGet)) {
            if (response.getStatusLine().getStatusCode() == 200 && response.getEntity() != null) {
                String imgName = UUID.randomUUID().toString() + extractSuffix(url);
                // The output stream must be closed explicitly; the original leaked the file handle.
                try (FileOutputStream out = new FileOutputStream(IMAGE_DIR + imgName)) {
                    response.getEntity().writeTo(out);
                }
                return imgName;
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
        return "";
    }

    /**
     * Returns the file extension (including the leading dot) of the last path segment of
     * {@code url}, ignoring any query string or fragment, or an empty string when the last
     * segment contains no dot.
     */
    private static String extractSuffix(String url) {
        int end = url.length();
        int query = url.indexOf('?');
        if (query >= 0) {
            end = query;
        }
        int fragment = url.indexOf('#');
        if (fragment >= 0 && fragment < end) {
            end = fragment;
        }
        String path = url.substring(0, end);

        int dot = path.lastIndexOf('.');
        // A dot that precedes the last '/' belongs to the host or a directory, not the file name.
        if (dot < 0 || dot < path.lastIndexOf('/')) {
            return "";
        }
        return path.substring(dot);
    }
}
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值