NekoHTML and Dom4j

http://pro.ctlok.com/2010/07/java-read-html-dom4j-nekohtml.html

 

package com.ctlok.pro;
 
import java.io.IOException;
 
import org.cyberneko.html.parsers.DOMParser;
import org.dom4j.Document;
import org.dom4j.Node;
import org.dom4j.io.DOMReader;
import org.xml.sax.SAXException;
 
/**
 * Demo: fetch an HTML page with NekoHTML, convert the resulting W3C DOM into
 * a dom4j document, and pull a few values out of it with XPath.
 */
public class Main {

    /** Page that is downloaded and parsed. */
    private static final String QUOTE_URL = "http://hk.finance.yahoo.com/q?s=0005.HK";

    /**
     * Number of leading characters dropped from the buy/sell cell text.
     * NOTE(review): presumably a two-character prefix in the cell; confirm against the live page.
     */
    private static final int PRICE_PREFIX_LENGTH = 2;

    /** Printed in place of a value whose node could not be located. */
    private static final String NOT_FOUND = "(not found)";

    /**
     * Downloads the quote page, extracts the name, buy and sell values, and
     * prints them to standard output. Parse and I/O failures are reported on
     * standard error instead of being propagated.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        try {
            DOMParser parser = new DOMParser();
            parser.parse(QUOTE_URL);

            // NekoHTML produces a W3C DOM; wrap it so dom4j XPath helpers can be used.
            Document doc = new DOMReader().read(parser.getDocument());

            // Element names in the XPath must be upper case to match the parsed DOM.
            Node name = doc.selectSingleNode("//DIV[@id='quote-bar-latest']/*/H2/node()");
            Node buy = doc.selectSingleNode("//DIV[@id='quote-bar-trade-info']/TABLE/TBODY/TR[1]/TD[2]");
            Node sell = doc.selectSingleNode("//DIV[@id='quote-bar-trade-info']/TABLE/TBODY/TR[2]/TD[2]");

            System.out.println(textOf(name, 0));
            System.out.println("Buy: " + textOf(buy, PRICE_PREFIX_LENGTH));
            System.out.println("Sell: " + textOf(sell, PRICE_PREFIX_LENGTH));
        } catch (SAXException e) {
            System.err.println(e.toString());
        } catch (IOException e) {
            System.err.println(e.toString());
        }
    }

    /**
     * Returns the text of {@code node} with the first {@code skip} characters
     * removed, without throwing when the node is missing or the text is short.
     *
     * @param node node returned by an XPath lookup; may be {@code null} when nothing matched
     * @param skip number of leading characters to drop
     * @return the remaining text, an empty string when the text has at most
     *         {@code skip} characters, or a placeholder when there is no node or text
     */
    private static String textOf(Node node, int skip) {
        if (node == null) {
            return NOT_FOUND;
        }
        String text = node.getText();
        if (text == null) {
            return NOT_FOUND;
        }
        // Clamp the offset so a short cell yields "" instead of an exception.
        return text.substring(Math.min(skip, text.length()));
    }
}

 

转载于:https://www.cnblogs.com/feika/p/4203893.html

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值