zoukankan      html  css  js  c++  java
  • Jsoup Element网页信息采集

    package zeze;
    
    import java.io.IOException;
    
    import org.jsoup.Jsoup;
    import org.jsoup.nodes.Document;
    import org.jsoup.select.Elements;
    
    /**
     * Small jsoup demo: downloads a weather forecast page and prints the fields
     * of the forecast panel selected by {@code [class=dn on][data-dn=7d1]}.
     */
    public class TestJsoup {

        /**
         * Downloads and parses the page at the given URL.
         *
         * @param url address of the page to fetch
         * @return the parsed document, or {@code null} if an {@link IOException}
         *         occurred while fetching (the stack trace is printed)
         */
        public Document getDocument(String url) {
            try {
                return Jsoup.connect(url).get();
            } catch (IOException e) {
                e.printStackTrace();
            }
            return null;
        }

        /**
         * Returns the text of the element at {@code index}, or an empty string
         * when the selection has fewer elements than expected.
         */
        private static String textAt(Elements elements, int index) {
            return index < elements.size() ? elements.get(index).text() : "";
        }

        /**
         * Prints the fields of one forecast panel, one per line. Does nothing
         * but report to stderr when the panel selection is empty.
         */
        private static void printForecast(Elements panel) {
            if (panel.isEmpty()) {
                System.err.println("Forecast panel not found in the page.");
                return;
            }
            // Day label (e.g. "today")
            System.out.println(textAt(panel.select("h1"), 0));
            // Day of the month
            System.out.println(textAt(panel.select("h2"), 0));
            // Weather description (rain or not)
            System.out.println(textAt(panel.select("[class=wea]"), 0));
            // High and low temperature are read from the first two <span> elements
            Elements spans = panel.select("span");
            System.out.println(textAt(spans, 0) + "°C");
            System.out.println(textAt(spans, 1) + "°C");
            // Wind force is read from the third <i> element
            System.out.println(textAt(panel.select("i"), 2));
        }

        public static void main(String[] args) {
            TestJsoup t = new TestJsoup();
            Document doc = t.getDocument("http://www.weather.com.cn/html/weather/101280101.shtml");
            // getDocument returns null on I/O failure; stop instead of dereferencing it.
            if (doc == null) {
                System.err.println("Could not load the forecast page.");
                return;
            }
            // Select the target HTML fragment
            printForecast(doc.select("[class=dn on][data-dn=7d1]"));
        }
    }
    package zeze;
    
    import java.io.IOException;
    
    import org.jsoup.Jsoup;
    import org.jsoup.nodes.Document;
    import org.jsoup.nodes.Element;
    import org.jsoup.select.Elements;
    
    
    public class TestJsoup {
        
        public  Document getDocument (String url){
            try {
                return Jsoup.connect(url).get();
            } catch (IOException e) {
                e.printStackTrace();
            }
            return null;
        }
    
        public static void main(String[] args) {
            TestJsoup t = new TestJsoup();
            Document doc = t.getDocument("http://www.weather.com.cn/html/weather/101280101.shtml");
            // 获取目标HTML代码
            Elements elements1 = doc.select("[class=dn][data-dn=7d2]");//getElementsByClass("dn");
            // 今天
            Elements elements2 = elements1.select("h1");
            String today = elements2.get(0).text();
            System.out.println(today);
            // 几号
            Elements elements3 = elements1.select("h2");
            String number = elements3.get(0).text();
            System.out.println(number);
            // 是否有雨
            Elements elements4 = elements1.select("[class=wea]");
            String rain = elements4.get(0).text();
            System.out.println(rain);
            // 高的温度
            Elements elements5 = elements1.select("span");
            String highTemperature = elements5.get(0).text()+"°C";
            System.out.println(highTemperature);
            // 低的温度
            String lowTemperature = elements5.get(1).text()+"°C";
            System.out.println(lowTemperature);
            // 风力
            Elements elements6 = elements1.select("i");
            String wind = elements6.get(2).text();
            System.out.println(wind);
            
            Elements zeze = doc.select("[class=Lcontent]");
            for (Element result : zeze)
    		{
    			Elements links = result.getElementsByTag("a");
    			for (Element link : links)
    			{//筛选
    				String linkHref = link.attr("href");
    				String linkText = link.text();				
    				System.out.println(linkHref+"
    "+linkText);
    			}
    		}
        }
    }
    

      http://www.cnblogs.com/xiaoMzjm/p/3899366.html?utm_source=tuicool&utm_medium=referral

  • 相关阅读:
    JVM classloader
    面试整理
    工具配置链接
    IntelliJ IDEA 热部署
    IntelliJ IDEA 常用快捷键
    类文件结构
    判断对象存活的方法
    JVM 运行时数据区域
    vim编辑16进制
    阿里云yum源
  • 原文地址:https://www.cnblogs.com/zeze/p/4928396.html
Copyright © 2011-2022 走看看