package com.demo;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStream;
import java.util.ArrayList;
import java.util.List;
import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.xpath.XPath;
import javax.xml.xpath.XPathConstants;
import javax.xml.xpath.XPathFactory;
import org.w3c.dom.Document;
import org.w3c.dom.Element;
import org.w3c.dom.Node;
import org.w3c.dom.NodeList;
import com.demo.User;
public class XMLDataUtils {
public static void main(String[] args) {
XMLDataUtils aXMDataLUtils = new XMLDataUtils();
List<User> list = aXMDataLUtils.getUsers();
for (int i = 0; i < list.size(); i++) {
// System.out.println(list.size());
User aUsers = list.get(i);
System.out.println(aUsers.getId());
System.out.println(aUsers.getPersonname());
System.out.println(aUsers.getWebname());
System.out.println(aUsers.getCreatetime());
System.out.println(aUsers.getImg());
System.out.println(aUsers.getText());
}
}
//解析智库网专家
public List<User> getUsers() {
List<User> r = new ArrayList<User>();
User aUsers = null;
File file = new File("D://文件/智库网专家/XML");
if (file.exists()) {
File[] files = file.listFiles();
if (files.length == 0) {
// System.out.println("文件夹是空的!");
return r;
} else {
for (File file2 : files) {
if (file2.isDirectory()) {
// System.out.println("文件夹:" + file2.getAbsolutePath());
traverseFolder2(file2.getAbsolutePath());
} else {
// System.out.println("文件:" + file2.getAbsolutePath());
}
try {
// 解析文件,生成document对象
DocumentBuilder builder = DocumentBuilderFactory.newInstance()
.newDocumentBuilder();
Document document = builder.parse(new File(file2.getAbsolutePath()));
// 生成XPath对象
XPath xpath = XPathFactory.newInstance().newXPath();
// 获取集合
NodeList list = (NodeList) xpath.evaluate("/Entity", document,
XPathConstants.NODESET);
for (int i = 0; i < list.getLength(); i++) {
Node aNode = list.item(i);
Element eElement = (Element) aNode;
aUsers = new User();
aUsers.setId(eElement.getElementsByTagName("ID").item(0).getTextContent());
aUsers.setPersonname(eElement.getElementsByTagName("PersonName").item(0).getTextContent());
aUsers.setWebname(eElement.getElementsByTagName("WebName").item(0).getTextContent());
aUsers.setCreatetime(eElement.getElementsByTagName("CreateTime").item(0).getTextContent());
String div=eElement.getElementsByTagName("WebInfoContent").item(0).getTextContent();
String img=div.substring(div.indexOf("src=\"")+5,div.indexOf("/"));
img=img.replace("\"", "");
aUsers.setImg(img);
// HTMLSpirit htmlSpirit=new HTMLSpirit();
// String text=HTMLSpirit.delHTMLTag(div);
// System.out.println(div);
//创建文件 0.xml
createFile();
StringBuffer s1 = new StringBuffer();
s1.append("<!DOCTYPE HTML PUBLIC \"-//W3C//DTD HTML 4.01 Transitional//EN\">");
s1.append("<HTML>");
s1.append(" <HEAD><TITLE>A Servlet</TITLE></HEAD>");
s1.append(" <BODY>");
s1.append(div);
s1.append(" </BODY>");
s1.append("</HTML>");
String str = s1.toString();
//转换
strChangeXML(str);
aUsers.setText(TestJsoupXml.getText());
//删除文件
// aUsers.setText(text);
r.add(aUsers);
deleteFile();
}
System.out.println("r="+r.size());
} catch (Exception e) {
e.printStackTrace();
}
}
}
} else {
System.out.println("文件不存在!");
}
return r;
}
public static void strChangeXML(String str){
try {
File file = new File("D:/文件/智库网专家/XML/0.xml");
OutputStream out=new FileOutputStream(file);//如果文件不存在会自动创建
byte[] b=str.getBytes();
for(int i=0;i<b.length;i++){
out.write(b[i]);
}
out.close();
} catch (FileNotFoundException e) {
e.printStackTrace();
} catch (IOException e) {
e.printStackTrace();
}
}
//创建文件
public static void createFile(){
//path表示你所创建文件的路径
String path = "D://文件/智库网专家/XML";
File f = new File(path);
if(!f.exists()){
f.mkdirs();
}
// fileName表示你创建的文件名;为txt类型;
String fileName="0.xml";
File file = new File(f,fileName);
if(!file.exists()){
try {
file.createNewFile();
} catch (IOException e) {
e.printStackTrace();
}
}
}
public static boolean deleteFile() {
boolean flag = true;
File file = new File("D://文件/智库网专家/XML/0.xml");
// 路径为文件且不为空则进行删除
if (file.isFile() && file.exists()) {
file.delete();
System.out.println("删除成功");
return flag = true;
}
return flag;
}
private void traverseFolder2(String absolutePath) {
// TODO Auto-generated method stub
}
}
转载于:https://www.cnblogs.com/xgwtzg/p/6141757.html