zoukankan      html  css  js  c++  java
  • NekoHTML and Dom4j

    http://pro.ctlok.com/2010/07/java-read-html-dom4j-nekohtml.html

    package com.ctlok.pro;
     
    import java.io.IOException;
     
    import org.cyberneko.html.parsers.DOMParser;
    import org.dom4j.Document;
    import org.dom4j.Node;
    import org.dom4j.io.DOMReader;
    import org.xml.sax.SAXException;
     
    /**
     * Small demo that downloads a Yahoo! Finance (Hong Kong) quote page, parses the
     * HTML with NekoHTML, converts the resulting W3C DOM into a dom4j document and
     * prints the stock name together with its buy and sell prices.
     */
    public class Main {

        /** Quote page that is fetched and parsed. */
        private static final String QUOTE_URL = "http://hk.finance.yahoo.com/q?s=0005.HK";

        // Element names in the XPath expressions are upper case because that is how
        // they appear in the DOM produced by the NekoHTML parser.
        private static final String NAME_XPATH =
                "//DIV[@id='quote-bar-latest']/*/H2/node()";
        private static final String BUY_XPATH =
                "//DIV[@id='quote-bar-trade-info']/TABLE/TBODY/TR[1]/TD[2]";
        private static final String SELL_XPATH =
                "//DIV[@id='quote-bar-trade-info']/TABLE/TBODY/TR[2]/TD[2]";

        /**
         * Number of leading characters dropped from the price cells before printing.
         * NOTE(review): presumably a fixed two-character prefix in the page markup;
         * confirm against the live page.
         */
        private static final int PRICE_PREFIX_LENGTH = 2;

        /**
         * Fetches the quote page and prints the name, buy price and sell price.
         * Parsing or network failures, as well as a page that does not contain the
         * expected elements, are reported on standard error instead of crashing.
         *
         * @param args command-line arguments (unused)
         */
        public static void main(String[] args) {
            try {
                DOMParser parser = new DOMParser();
                parser.parse(QUOTE_URL);

                // Bridge from the W3C DOM built by NekoHTML to dom4j so XPath
                // queries can be run through selectSingleNode.
                org.w3c.dom.Document document = parser.getDocument();
                DOMReader domReader = new DOMReader();
                Document doc = domReader.read(document);

                Node name = doc.selectSingleNode(NAME_XPATH);
                Node buy = doc.selectSingleNode(BUY_XPATH);
                Node sell = doc.selectSingleNode(SELL_XPATH);

                // selectSingleNode yields null when nothing matches (e.g. the page
                // layout changed or an error page was served); bail out cleanly.
                if (name == null || buy == null || sell == null) {
                    System.err.println("Quote data not found in page: " + QUOTE_URL);
                    return;
                }

                System.out.println(name.getText());
                System.out.println("Buy: " + stripPricePrefix(buy.getText()));
                System.out.println("Sell: " + stripPricePrefix(sell.getText()));
            } catch (SAXException e) {
                System.err.println(e.toString());
            } catch (IOException e) {
                System.err.println(e.toString());
            }
        }

        /**
         * Drops the first {@link #PRICE_PREFIX_LENGTH} characters of a price cell.
         *
         * @param text raw cell text, may be {@code null}
         * @return the text without its prefix; an empty string for {@code null}; the
         *         text unchanged when it is shorter than the prefix length
         */
        private static String stripPricePrefix(String text) {
            if (text == null) {
                return "";
            }
            if (text.length() < PRICE_PREFIX_LENGTH) {
                return text;
            }
            return text.substring(PRICE_PREFIX_LENGTH);
        }
    }
  • 相关阅读:
    分页查询+组合查询
    单点登录3
    单点登录2
    单点登录1
    sql server 语句
    jsTree动态加载数据
    sql 根据日期模糊查询&SQL Server dateTime类型 模糊查询
    快捷键
    JQUERY获取当前页面的URL信息
    C#中的?和??的用法
  • 原文地址:https://www.cnblogs.com/feika/p/4203893.html
Copyright © 2011-2022 走看看