java解析XML获取城市代码

运行前先导入dom4j架包,由于我们公司用的代理服务器所以下面我设置了代理ip,不需要的可直接忽略

 

package com.chengshidaima.tools;

import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.InetSocketAddress;
import java.net.Proxy;
import java.net.URL;
import java.net.URLConnection;
import java.util.List;
import org.dom4j.Document;
import org.dom4j.DocumentHelper;
import org.dom4j.Element;


public class CityCode
{

   // private Logger log = Logger.getLogger(CityCode.class.getName());

    public static void main(String[] args) {
        try {
            CityCode cc = new CityCode();
            cc.getCityXml();
            //System.out.println(doc.asXML());
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /**
     * 解析
     * 
     * @return
     * @throws Exception
     */
    @SuppressWarnings("unchecked")
    private Document getCityXml() throws Exception {
        /** 新建一个doc 保存结果 */
        Document docResult = DocumentHelper.createDocument();
        Element addElementRoot = DocumentHelper.createElement("china");

        String sUrlChina = "http://flash.weather.com.cn/wmaps/xml/china.xml";
        String sChinaProvXml = getUrlString(sUrlChina);
        Document doc = DocumentHelper.parseText(sChinaProvXml);

        Element rootElt = doc.getRootElement(); // 获取根节点
        //log.info("根节点:" + rootElt.getName()); // 拿到根节点的名称
        /** 取得所有省份 */
        List<Element> listProv = rootElt.elements("city"); // 获取根节点下的子节点
        for (int i = 0; i < listProv.size(); i++) {
            Element elementProv = listProv.get(i);
            /** 省份名字 */
            String sProvName = elementProv.attributeValue("pyName");
            String sProvNameCN = elementProv.attributeValue("quName");
            /** 添加节点 */
            Element addElementProv = DocumentHelper.createElement("prov");
            addElementProv.addAttribute("pyName", sProvName);
            addElementProv.addAttribute("quName", sProvNameCN);

            try {
                //log.info("查询省份:" + sProvNameCN + " 下的城市!");
                String sUrlProv = "http://flash.weather.com.cn/wmaps/xml/" + sProvName + ".xml";
                String sProvXml = getUrlString(sUrlProv);
                Document docProv = DocumentHelper.parseText(sProvXml);

                Element rootEltProv = docProv.getRootElement(); // 获取省份下的跟节点
                List<Element> listCity1 = rootEltProv.elements("city");
                for (int j = 0; j < listCity1.size(); j++) {
                    Element elementCity1 = listCity1.get(j);
                    String sCityName1 = elementCity1.attributeValue("pyName");
                    String sCityUrl1 = elementCity1.attributeValue("url");
                    String sCityNameCN1 = elementCity1.attributeValue("cityname");
                    System.out.println(sCityNameCN1 + ":" + sCityUrl1);

                    Element addElementMainCity = DocumentHelper.createElement("city");
                    addElementMainCity.addAttribute("pyName", sCityName1);
                    addElementMainCity.addAttribute("quName", sCityNameCN1);
                    addElementMainCity.addAttribute("url", sCityUrl1);

                    try {
                        String sUrlCity1 = "http://flash.weather.com.cn/wmaps/xml/" + sCityName1 + ".xml";
                        //log.info("查询主要城市:" + sCityNameCN1 + " 下的城市!");
                        String sCityXml = getUrlString(sUrlCity1);
                        Document docCity1 = DocumentHelper.parseText(sCityXml);
                        Element rootCity1 = docCity1.getRootElement();
                        List<Element> listCity2 = rootCity1.elements("city");

                        for (int k = 0; k < listCity2.size(); k++) {
                            Element elementCity2 = listCity2.get(k);
                            String sCityName2 = elementCity2.attributeValue("pyName");
                            String sCityNameCN2 = elementCity2.attributeValue("cityname");
                            String sCityUrl2 = elementCity2.attributeValue("url");
                            if (!sCityUrl1.endsWith(sCityUrl2)) {
                            	System.out.println(sCityNameCN2 + ":" + sCityUrl2);
							}
                            Element addElementCity2 = DocumentHelper.createElement("city2");
                            addElementCity2.addAttribute("pyName", sCityName2);
                            addElementCity2.addAttribute("quName", sCityNameCN2);
                            addElementCity2.addAttribute("url", sCityUrl2);
                            addElementMainCity.add(addElementCity2);
                        }

                    } catch (Exception e) {
                       // log.info("查询主要城市:" + sCityNameCN1 + " 下的城市失败!");
                    }
                    addElementProv.add(addElementMainCity);
                }
            } catch (Exception e) {
                //log.info("查询省份:" + sProvNameCN + "下的城市失败!");
            }
            addElementRoot.add(addElementProv);
        }
        docResult.setRootElement(addElementRoot);
        return docResult;
    }

    /**
     * 从url获取xml字符串
     * 
     * @param sUrl
     * @return
     * @throws Exception
     */
    private String getUrlString(String sUrl) throws Exception {
        String sResult = "";
        StringBuffer sbResult = null;
       // log.info("开始连接Url:" + sUrl);
        sbResult = new StringBuffer();
        URL url = new URL(sUrl);
        
        // 创建代理服务器            
        InetSocketAddress addr = new InetSocketAddress("10.128.6.3",808);            
        Proxy proxy = new Proxy(Proxy.Type.HTTP, addr); // http 代理 
        
        URLConnection con = url.openConnection(proxy);
        BufferedReader br = new BufferedReader(new InputStreamReader(con.getInputStream(), "UTF-8"));
        String sLine = null;
        while ((sLine = br.readLine()) != null) {
            sbResult.append(sLine);
        }
        sResult = sbResult.toString();
        //log.info("获取到信息:" + sbResult.toString().substring(0, 500));
        if (sResult.contains("html")) {
            String sInt = "null";
            Integer.parseInt(sInt);
        }
        return sResult;
    }
}

 

 

运行部分结果如下图:

 

posted @ 2014-07-11 10:33  岁月淡忘了谁  阅读(751)  评论(0编辑  收藏  举报