`
jilong-liang
  • 浏览: 471536 次
  • 性别: Icon_minigender_1
  • 来自: 广州
社区版块
存档分类

dom4j和jsoup解析百度地图xml获取地方信息

阅读更多
package ivyy.taobao.com.dom4j;
import ivyy.taobao.com.entity.Address;
import ivyy.taobao.com.entity.Location;
import ivyy.taobao.com.entity.Point;
import ivyy.taobao.com.entity.Pois;
import ivyy.taobao.com.utils.IoUtils;
import ivyy.taobao.com.utils.UrlUtils;
import ivyy.taobao.com.utils.Dom4jUtils;

import java.io.File;
import java.net.URL;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;

import org.dom4j.DocumentHelper;
import org.dom4j.Element;
import org.dom4j.io.SAXReader;
import org.jsoup.Jsoup;
import org.jsoup.select.Elements;
/**
 *@Date:2015-1-6
 *@Author:liangjilong
 *@Email:jilongliang@sina.com
 *@Version:1.0
 *@Description:
 */
@SuppressWarnings("all")
public class Dom4jTest2 {
	
	public static void main(String[] args)throws Exception {
		//String filepath="D:/"+System.currentTimeMillis()+".xml";
		String filepath="D:/test/map1.xml";
		File f=new File(filepath);
		if(!f.exists()){
			f.createNewFile();
		}
		//List<Pois> list=getReaderXml("URL");
		List<Pois> list=getReaderXml("FILE");
		org.dom4j.Document doc=createAsXML(list);
		IoUtils.write(doc.asXML(),filepath);
		//格式化 
		Dom4jUtils.formatAsXml(doc);
	}
	
	 
	/****
	 * 组装成一个xml
	 * @param list
	 * @return
	 * @throws Exception
	 */
	private static org.dom4j.Document createAsXML(List<Pois> list) throws Exception{
		org.dom4j.Document doc=DocumentHelper.createDocument();
		Element  root=doc.addElement("GeocoderSearchResponse");//根
		root.addElement("status").setText("0");//status
		for (Iterator iterator = list.iterator(); iterator.hasNext();) {
			Pois pois = (Pois) iterator.next();

			Element result=root.addElement("result");//result
			List<Location>  listLoc=pois.getLocations();
			
			Element location=result.addElement("location");//location
			for (Iterator iterator2 = listLoc.iterator(); iterator2.hasNext();) {
				Location locObj = (Location) iterator2.next();
				location.addElement("lat").setText(locObj.getLat()+"");//lat
				location.addElement("lng").setText(locObj.getLng()+"");//lat
				result.addElement("formatted_address").setText(locObj.getFormattedAddress()+"");//formatted_address
				result.addElement("business").setText(locObj.getBusiness()+"");//business
			}
			
			List<Address>  listAdd=pois.getAddress();
			Element comp=result.addElement("addressComponent");//addressComponent
			for (Iterator iterator3 = listAdd.iterator(); iterator3.hasNext();) {
				Address address = (Address) iterator3.next();
				comp.addElement("streetNumber").setText(address.getStreetNumber()+"");//streetNumber
				comp.addElement("street").setText(address.getStreet()+"");//street
				comp.addElement("district").setText(address.getDistrict()+"");//district
				comp.addElement("city").setText(address.getCity()+"");//city
				comp.addElement("province").setText(address.getProvince()+"");//province
				comp.addElement("cityCode").setText(address.getCityCode()+"");//cityCode
			}
		
			Element poi=result.addElement("pois").addElement("poi");
			poi.addElement("addr").setText(pois.getAddr());//addr
			poi.addElement("distance").setText(pois.getDistance());//distance
			poi.addElement("name").setText(pois.getName());//name
			poi.addElement("poiType").setText(pois.getPoiType());//poiType
			poi.addElement("tel").setText(pois.getTel());//tel
			poi.addElement("zip").setText(pois.getZip());//zip
			
			List<Point> listPoint=pois.getPoints();
			Element point=poi.addElement("point");
			for (Iterator iterator4 = listPoint.iterator(); iterator4.hasNext();) {
				Point p = (Point) iterator4.next();
				point.addElement("x").setText(p.getX()+"");
				point.addElement("y").setText(p.getY()+"");
			}
		}
		 
		return doc;
	}
	 
	
	/**
	 * Dom4j(SAX)读取xml数据(解析)
	 * @param params
	 * @throws Exception
	 */
	private static List<Pois> getReaderXml(String flg) throws Exception{
		String fromRead=Dom4jTest2.class.getClassLoader().getResource("xml/map1.xml").getPath();

		List<Pois> list=new ArrayList<Pois>();
		SAXReader saxReader = new SAXReader();
		org.dom4j.Document document=null;
		//从api上面解析
		if(flg.equals("URL")){
			String url = UrlUtils.getBaiduMapUrl("你的key", "39.983424,116.322987", "xml");
			document = saxReader.read(url);
		//从文件上面的xml解析
		}else if(flg.equals("FILE")){
			document = saxReader.read(new File(fromRead));
		}
		Element resultEl = (Element)document.getRootElement().element("result");
		Element poisEl=resultEl.element("pois");//pois节点
		Element locationEl=resultEl.element("location");//location节点
		Element addressEl=resultEl.element("addressComponent");//addressComponent节点
		
		/*******从pois节点下面遍历多个poi节点*******/
		for (Iterator<Element> poIter = poisEl.elementIterator("poi"); poIter.hasNext();) {
			Element element = (Element) poIter.next();
			String addr = element.elementText("addr");
			String distance = element.elementText("distance");
			String name = element.elementText("name");
			String poiType = element.elementText("poiType");
			String tel =(element.elementText("tel")==""?"":element.elementText("tel"));
			String zip =(element.elementText("zip")==""?"":element.elementText("zip"));
			
			Pois poi=new Pois();
			poi.setAddr(addr);
			poi.setDistance(distance);
			poi.setName(name);
			poi.setPoiType(poiType);
			poi.setTel(tel);
			poi.setZip(zip);
			
			
			List<Location> listLoc=new ArrayList<Location>();
			/************Location***************************/
			String business=resultEl.elementText("business");
			String formatted_address=resultEl.elementText("formatted_address");
			String lat = locationEl.elementText("lat");
			String lng = locationEl.elementText("lng");
			
			Location location=new Location();
			location.setBusiness(business);
			location.setFormattedAddress(formatted_address);
			location.setLat(lat);
			location.setLng(lng);

			listLoc.add(location);
			poi.setLocations(listLoc);

			
			List<Address> listAddr=new ArrayList<Address>();
			/************Address***************************/
			Address address=new Address();
			String streetNumber=(addressEl.elementText("streetNumber")==""?"":addressEl.elementText("streetNumber"));
			String street=(addressEl.elementText("street")==""?"":addressEl.elementText("street"));
			String district=(addressEl.elementText("district")==""?"":addressEl.elementText("district"));
			String city=(addressEl.elementText("city")==""?"":addressEl.elementText("city"));
			String province=(addressEl.elementText("province")==""?"":addressEl.elementText("province"));
			String direction=(addressEl.elementText("direction")==""?"":addressEl.elementText("direction"));
			String distancez=(addressEl.elementText("distance")==""?"":addressEl.elementText("distance"));
			
			address.setStreetNumber(streetNumber);
			address.setStreet(street);
			address.setCity(city);
			address.setDistrict(district);
			address.setDirection(direction);
			address.setDistance(distancez);
			address.setProvince(province);
			
			listAddr.add(address);
			
			poi.setAddress(listAddr);
			
			list.add(poi);
		}
		
		return list;
	}
	
}

 

package ivyy.taobao.com.jsoup;
import ivyy.taobao.com.dom4j.Dom4jTest1;
import ivyy.taobao.com.entity.Address;
import ivyy.taobao.com.entity.Location;
import ivyy.taobao.com.entity.Point;
import ivyy.taobao.com.entity.Pois;
import ivyy.taobao.com.utils.IoUtils;
import ivyy.taobao.com.utils.UrlUtils;
import ivyy.taobao.com.utils.Dom4jUtils;

import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;

import org.dom4j.DocumentHelper;
import org.dom4j.Element;
import org.dom4j.io.SAXReader;
import org.jsoup.Jsoup;
import org.jsoup.select.Elements;
/**
 *@Date:2015-1-6
 *@Author:liangjilong
 *@Email:jilongliang@sina.com
 *@Version:1.0
 *@Description:
 */
@SuppressWarnings("all")
public class JsoupMap {
	
	public static void main(String[] args)throws Exception {
		String Encodeing="GBK";
		//List<Pois> list=JsoupReadXml("URL",Encodeing);//从api读取

		//------------------------------可以將這些數據保存到數據庫-------------------
		List<Pois> list=JsoupReadXml("FILE",Encodeing);//从本地的文件读取
		for (Iterator iterator = list.iterator(); iterator.hasNext();) {
			Pois pois = (Pois) iterator.next();
			
			//System.out.println(pois.getAddr());
			
			//------------------------------Address-----------------
			
			List<Address> listAdds=pois.getAddress();
			for (Iterator iterator2 = listAdds.iterator(); iterator2.hasNext();) {
				Address address = (Address) iterator2.next();
				System.out.println(address.getCity());
			}
			
			//------------------------------Location-----------------
			List<Location> locations = pois.getLocations();
			
			for (Iterator iterator2 = locations.iterator(); iterator2.hasNext();) {
				Location location = (Location) iterator2.next();
				System.out.println(location.getFormattedAddress());
			}
			
		}
	}
	 
	/**
	 * 用Jsoup去解析xml
	 * @param params
	 */
	private static List<Pois> JsoupReadXml(String flg,String Encodeing) throws Exception{
		List<Pois> list=new ArrayList<Pois>();
		
		String url = UrlUtils.getBaiduMapUrl("你的key", "39.983424,116.322987", "xml");
		org.jsoup.nodes.Document doc=null;
		if(flg.equals("URL")){
			  doc=Jsoup.connect(url).get();//网络连接
		}else if(flg.equals("FILE")){
			  String fromRead=Dom4jTest1.class.getClassLoader().getResource("xml/map1.xml").getPath();
			  String html=IoUtils.reader(fromRead);
			  doc=Jsoup.parse(html,Encodeing);
		}
		
		//org.jsoup.nodes.Document doc=Jsoup.parse(params);//本地数据,连接关闭就可以调用
		if(doc!=null)
		{
			Elements pois=doc.select("poi");//获取到poi节点
			for(org.jsoup.nodes.Element poi:pois){
				String addr=poi.getElementsByTag("addr").text().trim();
				String distance=poi.getElementsByTag("distance").text().trim();
				String name=poi.getElementsByTag("name").text().trim();
				String tel=poi.getElementsByTag("tel").text().trim();
				String zip=poi.getElementsByTag("zip").text().trim();
				String poiType=poi.getElementsByTag("poiType").text().trim();

				Pois p=new Pois();
				p.setAddr(addr);
				p.setDistance(distance);
				p.setName(name);
				p.setPoiType(poiType);
				p.setTel(tel);
				p.setZip(zip);
				
				List<Point> listPoint=new ArrayList<Point>();
				Point point=new Point();
				
				String x=poi.getElementsByTag("x").text().trim();
				point.setX(x);
				String y=poi.getElementsByTag("y").text().trim();
				point.setY(y);
				
				listPoint.add(point);
				p.setPoints(listPoint);
				
				List<Address> listAdd=new ArrayList<Address>();
				
				Elements comps=doc.select("addressComponent");
				
				for (org.jsoup.nodes.Element comp:comps) {
					String streetNumber=comp.getElementsByTag("streetNumber").text().trim();
					String district=comp.getElementsByTag("district").text().trim();
					String street=comp.getElementsByTag("street").text().trim();
					String city=comp.getElementsByTag("city").text().trim();
					String province=comp.getElementsByTag("province").text().trim();

					Address add=new Address();
					add.setStreetNumber(streetNumber);
					add.setStreet(street);
					add.setDistrict(district);
					add.setCity(city);
					add.setProvince(province);
					listAdd.add(add);
				}
				p.setAddress(listAdd);
				
				List<Location> listLoc=new ArrayList<Location>();
				Elements location=doc.select("location");
				for (org.jsoup.nodes.Element obj:location) {
					String	lat=obj.getElementsByTag("lat").text().trim();
					String	formatted_address=obj.getElementsByTag("formatted_address").text().trim();
					String	lng=obj.getElementsByTag("lng").text().trim();
					String	business=doc.select("business").text().trim();

					Location locat=new Location();
					locat.setLng(lng);
					locat.setLat(lat);
					locat.setFormattedAddress(formatted_address);
					locat.setBusiness(business);
					listLoc.add(locat);
				}
				String	status=doc.select("status").text().trim();
				p.setStatus(status);
				p.setLocations(listLoc);
				list.add(p);
			}
		}
		return list;
	}
}

 

package ivyy.taobao.com.entity;

import java.io.Serializable;

public class Location implements Serializable{
	private  String lat;//纬度
	private  String lng;//经度
	private  String formattedAddress;//经度
	private  String business;//经度
	public String getLat() {
		return lat;
	}
	public void setLat(String lat) {
		this.lat = lat;
	}
	public String getLng() {
		return lng;
	}
	public void setLng(String lng) {
		this.lng = lng;
	}
	public String getFormattedAddress() {
		return formattedAddress;
	}
	public void setFormattedAddress(String formattedAddress) {
		this.formattedAddress = formattedAddress;
	}
	public String getBusiness() {
		return business;
	}
	public void setBusiness(String business) {
		this.business = business;
	}
}

 

package ivyy.taobao.com.entity;

import java.io.Serializable;

public class Point implements Serializable{
	private String x;
	private String y;
	public String getX() {
		return x;
	}
	public void setX(String x) {
		this.x = x;
	}
	public String getY() {
		return y;
	}
	public void setY(String y) {
		this.y = y;
	}
	
}

 

package ivyy.taobao.com.entity;

import java.io.Serializable;
import java.util.ArrayList;
import java.util.List;

public class Pois implements Serializable{
	private String addr;
	private String distance;
	private String name;
	private String poiType;
	private String tel;
	private String zip;
	private String status;
	private String url;
	private String mapUrl;
	private List<Point> points=new ArrayList<Point>();
	private List<Location> locations=new ArrayList<Location>();
	private List<Address> address=new ArrayList<Address>();
	private List<Pois> pois=new ArrayList<Pois>();
	
	public String getStatus() {
		return status;
	}
	public String getUrl() {
		return url;
	}
	public void setUrl(String url) {
		this.url = url;
	}
	public void setStatus(String status) {
		this.status = status;
	}
	public List<Location> getLocations() {
		return locations;
	}
	public void setLocations(List<Location> locations) {
		this.locations = locations;
	}
	public List<Address> getAddress() {
		return address;
	}
	public void setAddress(List<Address> address) {
		this.address = address;
	}
	public List<Pois> getPois() {
		return pois;
	}
	public void setPois(List<Pois> pois) {
		this.pois = pois;
	} 
	
	public String getAddr() {
		return addr;
	}
	public void setAddr(String addr) {
		this.addr = addr;
	}
	public String getDistance() {
		return distance;
	}
	public void setDistance(String distance) {
		this.distance = distance;
	}
	public String getName() {
		return name;
	}
	public void setName(String name) {
		this.name = name;
	}
	public String getPoiType() {
		return poiType;
	}
	public void setPoiType(String poiType) {
		this.poiType = poiType;
	}
	public String getTel() {
		return tel;
	}
	public void setTel(String tel) {
		this.tel = tel;
	}
	public String getZip() {
		return zip;
	}
	public void setZip(String zip) {
		this.zip = zip;
	}
	public List<Point> getPoints() {
		return points;
	}
	public void setPoints(List<Point> points) {
		this.points = points;
	}
	public String getMapUrl() {
		return mapUrl;
	}
	public void setMapUrl(String mapUrl) {
		this.mapUrl = mapUrl;
	}
	
}

 

 


 

源代码  http://download.csdn.net/detail/jilongliang/8333361

 

  • 大小: 20.3 KB
  • 大小: 161.5 KB
0
4
分享到:
评论

相关推荐

    使用Jsoup库解析HTML、XML或URL链接中的DOM节点

    使用Jsoup库解析HTML、XML或URL链接中的DOM节点 Jsoup进行Html的Dom解析

    java解析xml,dom解析,jsoup解析,完整项目

    java解析xml,dom解析,jsoup解析,两种不同方式的解析,完整项目

    HTML、XML等Dom节点类解析库jsoup.jar

    HTML、XML等Dom节点类解析库jsoup.jar,解析速度很快

    dom4j-jdom封装和解析例子

    dom4j,jsoup,jdom,w3cdom,xstream使用代码工程 package ivyy.taobao.com.dom4j; import ivyy.taobao.com.entity.Address; import ivyy.taobao.com.entity.Location; import ivyy.taobao.com.entity.Point; import ...

    JsoupXpath-0.3.2.jar 完整版

    JsoupXpath 是一款纯Java开发的使用xpath解析提取html数据的解析器,针对html解析完整实现了W3C XPATH 1.0标准语法,xpath的Lexer和Parser基于Antlr4构建,html的DOM树生成采用Jsoup,故命名为JsoupXpath....

    jsoup 1.9.2 -java的网页解析处理

    它提供了一套非常省力的API,可通过DOM,CSS以及类似于JQuery的操作方法来取出和操作数据。. jsoup 1.9.2 发布,改进内容包括: 改进: 1. In XML documents, detect the charset from the XML prolog -- Bug ...

    jsoup资源包-java

    jsoup 是一款Java 的HTML解析器,可直接解析某个URL地址、HTML文本内容。它提供了一套非常省力的API,可通过DOM,CSS以及类似于jQuery的操作方法来取出和操作数据。 同样可以操作xml等。

    XpathDemo.zip

    JsoupXPath是基于Jsoup的拓展,使用路径的形式解析XML和HTML文档。核心类为JXDocument;JsoupXPath的节点对象JXNode不仅可以获取标签节点,还可以获取属性节点 HtmlCleaner是一个开源的Java语言的Html文档解析器。...

    基于springboot-2019-ncov疫情态势信息管理系统

    数据采集方面采用HttpClient发送网络请求并使用jsoup解析HTML数据和对接天行数据API,数据处理方面采用fastjson、dom4j等技术处理json和xml文件,数据存储方面采用传统关系型数据库mysql搭配Druid连接池;...

    jsoup-1.13.1.zip

    Jsuop是一款Java的HTML解析器,可以直接解析某个url地址、HTML文本内容。它提供了一套非常省力的API,可以通过DOM,CSS以及类似jQuery的操作方法来取出和操作数据。

Global site tag (gtag.js) - Google Analytics