zoukankan      html  css  js  c++  java
  • 爬虫小例子

    package com.textPa.two;
    
    import java.io.BufferedWriter;
    import java.io.File;
    import java.io.FileWriter;
    import java.nio.charset.Charset;
    
    import org.apache.http.HttpEntity;
    import org.apache.http.HttpResponse;
    import org.apache.http.client.methods.HttpGet;
    import org.apache.http.impl.client.CloseableHttpClient;
    import org.apache.http.impl.client.HttpClients;
    import org.apache.http.util.EntityUtils;
    
    /**
     * Minimal crawler example: downloads a single web page with Apache HttpClient,
     * prints the HTML to standard output and saves a copy to a local file.
     */
    public class RetrivePage {

        /** Address of the page to download. */
        private static final String PAGE_URL = "http://club.news.sohu.com/zz0578/thread/4bqnexpi3no";

        /**
         * Destination file for the downloaded HTML. The backslash must be escaped:
         * an unescaped {@code \b} inside a Java string literal is a backspace
         * character, not a path separator followed by the letter {@code b}.
         */
        private static final String OUTPUT_PATH = "d:\\baidu.html";

        /**
         * Fetches {@link #PAGE_URL}, echoes the body to standard output and writes
         * it to {@link #OUTPUT_PATH}. Failures are reported on standard error
         * instead of being silently discarded.
         *
         * @param args command-line arguments; not used
         */
        public static void main(String[] args) {
            HttpGet getHttp = new HttpGet(PAGE_URL);

            // try-with-resources closes the client (and its connections) on every path.
            try (CloseableHttpClient httpClient = HttpClients.createDefault()) {
                HttpResponse response = httpClient.execute(getHttp);
                HttpEntity entity = response.getEntity();

                if (entity == null) {
                    System.err.println("No response body received from " + PAGE_URL);
                    return;
                }

                // GBK is the charset handed to EntityUtils for decoding the body.
                String content = EntityUtils.toString(entity, Charset.forName("GBK"));
                System.out.println(content);

                // NOTE(review): FileWriter encodes with the platform default charset,
                // as the original code did; confirm that matches the intended encoding.
                // close() flushes the buffer, and runs even if write() throws.
                try (BufferedWriter writer = new BufferedWriter(new FileWriter(new File(OUTPUT_PATH)))) {
                    writer.write(content);
                }
                System.out.println("创建成功");
            } catch (Exception e) {
                // Top-level boundary of the program: report the failure rather than hide it.
                System.err.println("Failed to download " + PAGE_URL + " to " + OUTPUT_PATH + ": " + e);
                e.printStackTrace();
            }
        }

    }

    所需要的两个jar包我后面会贴出来

    http://pan.baidu.com/s/1nuFuDUL

  • 相关阅读:
    程序员学习方法差在哪里
    解析域名
    tomcat下的公共jar包配置
    Ubuntu 16.04 修改状态栏位置
    sqlite3 C语言 API 函数
    vim配置文件
    关于 ioctl 函数
    字符设备基础了解
    Ubuntu14.04搭建Boa服务
    gcc 交叉工具链中工具使用(arm-linux-xxx)
  • 原文地址:https://www.cnblogs.com/wangxiangstudy/p/5850123.html
Copyright © 2011-2022 走看看