运行前先导入dom4j架包,由于我们公司用的代理服务器所以下面我设置了代理ip,不需要的可直接忽略

package com.chengshidaima.tools;

import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.InetSocketAddress;
import java.net.Proxy;
import java.net.URL;
import java.net.URLConnection;
import java.util.List;
import org.dom4j.Document;
import org.dom4j.DocumentHelper;
import org.dom4j.Element; public class CityCode
{ // private Logger log = Logger.getLogger(CityCode.class.getName()); public static void main(String[] args) {
try {
CityCode cc = new CityCode();
cc.getCityXml();
//System.out.println(doc.asXML());
} catch (Exception e) {
e.printStackTrace();
}
} /**
* 解析
*
* @return
* @throws Exception
*/
@SuppressWarnings("unchecked")
private Document getCityXml() throws Exception {
/** 新建一个doc 保存结果 */
Document docResult = DocumentHelper.createDocument();
Element addElementRoot = DocumentHelper.createElement("china"); String sUrlChina = "http://flash.weather.com.cn/wmaps/xml/china.xml";
String sChinaProvXml = getUrlString(sUrlChina);
Document doc = DocumentHelper.parseText(sChinaProvXml); Element rootElt = doc.getRootElement(); // 获取根节点
//log.info("根节点:" + rootElt.getName()); // 拿到根节点的名称
/** 取得所有省份 */
List<Element> listProv = rootElt.elements("city"); // 获取根节点下的子节点
for (int i = 0; i < listProv.size(); i++) {
Element elementProv = listProv.get(i);
/** 省份名字 */
String sProvName = elementProv.attributeValue("pyName");
String sProvNameCN = elementProv.attributeValue("quName");
/** 添加节点 */
Element addElementProv = DocumentHelper.createElement("prov");
addElementProv.addAttribute("pyName", sProvName);
addElementProv.addAttribute("quName", sProvNameCN); try {
//log.info("查询省份:" + sProvNameCN + " 下的城市!");
String sUrlProv = "http://flash.weather.com.cn/wmaps/xml/" + sProvName + ".xml";
String sProvXml = getUrlString(sUrlProv);
Document docProv = DocumentHelper.parseText(sProvXml); Element rootEltProv = docProv.getRootElement(); // 获取省份下的跟节点
List<Element> listCity1 = rootEltProv.elements("city");
for (int j = 0; j < listCity1.size(); j++) {
Element elementCity1 = listCity1.get(j);
String sCityName1 = elementCity1.attributeValue("pyName");
String sCityUrl1 = elementCity1.attributeValue("url");
String sCityNameCN1 = elementCity1.attributeValue("cityname");
System.out.println(sCityNameCN1 + ":" + sCityUrl1); Element addElementMainCity = DocumentHelper.createElement("city");
addElementMainCity.addAttribute("pyName", sCityName1);
addElementMainCity.addAttribute("quName", sCityNameCN1);
addElementMainCity.addAttribute("url", sCityUrl1); try {
String sUrlCity1 = "http://flash.weather.com.cn/wmaps/xml/" + sCityName1 + ".xml";
//log.info("查询主要城市:" + sCityNameCN1 + " 下的城市!");
String sCityXml = getUrlString(sUrlCity1);
Document docCity1 = DocumentHelper.parseText(sCityXml);
Element rootCity1 = docCity1.getRootElement();
List<Element> listCity2 = rootCity1.elements("city"); for (int k = 0; k < listCity2.size(); k++) {
Element elementCity2 = listCity2.get(k);
String sCityName2 = elementCity2.attributeValue("pyName");
String sCityNameCN2 = elementCity2.attributeValue("cityname");
String sCityUrl2 = elementCity2.attributeValue("url");
if (!sCityUrl1.endsWith(sCityUrl2)) {
System.out.println(sCityNameCN2 + ":" + sCityUrl2);
}
Element addElementCity2 = DocumentHelper.createElement("city2");
addElementCity2.addAttribute("pyName", sCityName2);
addElementCity2.addAttribute("quName", sCityNameCN2);
addElementCity2.addAttribute("url", sCityUrl2);
addElementMainCity.add(addElementCity2);
} } catch (Exception e) {
// log.info("查询主要城市:" + sCityNameCN1 + " 下的城市失败!");
}
addElementProv.add(addElementMainCity);
}
} catch (Exception e) {
//log.info("查询省份:" + sProvNameCN + "下的城市失败!");
}
addElementRoot.add(addElementProv);
}
docResult.setRootElement(addElementRoot);
return docResult;
} /**
* 从url获取xml字符串
*
* @param sUrl
* @return
* @throws Exception
*/
private String getUrlString(String sUrl) throws Exception {
String sResult = "";
StringBuffer sbResult = null;
// log.info("开始连接Url:" + sUrl);
sbResult = new StringBuffer();
URL url = new URL(sUrl); // 创建代理服务器
InetSocketAddress addr = new InetSocketAddress("10.128.6.3",808);
Proxy proxy = new Proxy(Proxy.Type.HTTP, addr); // http 代理 URLConnection con = url.openConnection(proxy);
BufferedReader br = new BufferedReader(new InputStreamReader(con.getInputStream(), "UTF-8"));
String sLine = null;
while ((sLine = br.readLine()) != null) {
sbResult.append(sLine);
}
sResult = sbResult.toString();
//log.info("获取到信息:" + sbResult.toString().substring(0, 500));
if (sResult.contains("html")) {
String sInt = "null";
Integer.parseInt(sInt);
}
return sResult;
}
}

 

运行部分结果如下图: