XML的重点知识

1. XML介绍与用途
1.1 XML是什么


1.2 XML的用途
2. XML的文档结构
<!DOCTYPE hr SYSTEM "hr.dtd">
<hr>
    <employee no="3301">
        <name>李铁柱</name>
        <age>37</age>
        <salary>3600</salary>
        <department>
            <dname>人事部</dname>
            <address>XX大厦-B105</address>
        </department>
    </employee>
    <employee no="3302">
        <name>林海</name>
        <age>50</age>
        <salary>7000</salary>
        <department>
            <dname>财务部</dname>
            <address>XX大厦-B106</address>
        </department>
    </employee>
    <employee no="3310">
        <name>李四</name>
        <age>23</age>
        <salary>3000</salary>
        <department>
            <dname>工程部</dname>
            <address>XX大厦-B104</address>
        </department>
    </employee>
</hr>
可以使用浏览器打开检验是否存在语法问题
3.XML标签书写规则
标签要有意义,建议使用英文小写字母,不要存在重名的情况!
4.XML语义约束
DTD与XML Schema
DTD(Document Type Definition,文档类型定义)是一种简单易用的语义约束方式,扩展名为.dtd。

DTD文件
<!ELEMENT hr (employee+)>
<!ELEMENT employee (name,age,salary,department)>
<!ATTLIST employee no CDATA "">
<!ELEMENT name (#PCDATA)>
<!ELEMENT age (#PCDATA)>
<!ELEMENT salary (#PCDATA)>
<!ELEMENT department (dname,address)>
<!ELEMENT dname (#PCDATA)>
<!ELEMENT address (#PCDATA)>
PCDATA表示纯文本节点
XML Schema文件
XML Schema比DTD更为复杂,提供了更多功能。
XML Schema提供了数据类型、格式限定、数据范围等特性。
XML Schema是W3C标准。
<schema xmlns="http://www.w3.org/2001/XMLSchema">
    <element name="hr">
        <complexType>
            <sequence>
                <element name="employee" minOccurs="1" maxOccurs="9999">
                    <complexType>
                        <sequence>
                            <element name="name" type="string"></element>
                            <element name="age">
                                <simpleType>
                                    <restriction base="integer">
                                        <minInclusive value="18"></minInclusive>
                                        <maxInclusive value="60"></maxInclusive>
                                    </restriction>
                                </simpleType>
                            </element>
                            <element name="salary" type="integer"></element>
                            <element name="department">
                                <complexType>
                                    <sequence>
                                        <element name="dname" type="string"></element>
                                        <element name="address" type="string"></element>
                                    </sequence>
                                </complexType>
                            </element>
                        </sequence>
                        <attribute name="no" type="string" use="required"></attribute>
                    </complexType>
                </element>
            </sequence>
        </complexType>
    </element>
</schema>
5.Java解析XML
DOM(Document Object Model) 定义了访问和操作XML文档的标准方法,DOM把XML文档作为树结构来查看,能够通过DOM树来读写所有的元素。

–Dom4j下载地址
HrReader.java
package com.imooc.dom4j;
import java.util.List;
import org.dom4j.Attribute;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.Element;
import org.dom4j.io.SAXReader;
/**
 * Reads the hr.xml document with Dom4j and prints every employee's details
 * to standard output.
 */
public class HrReader {

    /**
     * Parses the XML file at a fixed path and, for each {@code employee}
     * element under the root, prints its name, age, salary, department name,
     * department address and {@code no} attribute, one value per line.
     *
     * <p>A {@link DocumentException} raised while reading the file is reported
     * by printing its stack trace; it is not rethrown.
     */
    public void readXml() {
        // SAXReader is the core class for reading XML files; it parses the
        // XML and keeps the result in memory as a tree.
        SAXReader saxReader = new SAXReader();
        try {
            Document doc = saxReader.read("d:/workspace/xml/src/hr.xml");
            // The root node of the document, i.e. the hr tag.
            Element hr = doc.getRootElement();
            // elements(...) fetches the collection of child tags with the given name.
            List<Element> staff = hr.elements("employee");
            for (int i = 0; i < staff.size(); i++) {
                printEmployee(staff.get(i));
            }
        } catch (DocumentException e) {
            e.printStackTrace();
        }
    }

    /**
     * Prints the fields of a single {@code employee} element, one per line.
     *
     * @param emp the employee element to print
     */
    private void printEmployee(Element emp) {
        // element(...) fetches the single child node with the given name;
        // getText() returns that tag's text.
        System.out.println(emp.element("name").getText());
        System.out.println(emp.elementText("age"));
        System.out.println(emp.elementText("salary"));

        Element dept = emp.element("department");
        System.out.println(dept.element("dname").getText());
        System.out.println(dept.element("address").getText());

        Attribute noAttr = emp.attribute("no");
        System.out.println(noAttr.getText());
    }

    /** Entry point: reads and prints the employee file. */
    public static void main(String[] args) {
        new HrReader().readXml();
    }
}
HrWriter.java
package com.imooc.dom4j;
import java.io.FileOutputStream;
import java.io.OutputStreamWriter;
import java.io.Writer;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.Element;
import org.dom4j.io.SAXReader;
/**
 * Appends a new employee record to the hr.xml document with Dom4j and writes
 * the document back to the same file.
 */
public class HrWriter {

    /**
     * Loads the XML file at a fixed path, adds one {@code employee} element
     * (with its {@code no} attribute and child elements) under the root, and
     * writes the whole document back to that file encoded as UTF-8.
     *
     * <p>Any exception raised along the way is reported by printing its stack
     * trace; it is not rethrown.
     */
    public void writeXml() {
        String file = "d:/workspace/xml/src/hr.xml";
        SAXReader reader = new SAXReader();
        try {
            Document document = reader.read(file);
            Element root = document.getRootElement();

            // Build the new <employee no="3311"> subtree under the root.
            Element employee = root.addElement("employee");
            employee.addAttribute("no", "3311");
            Element name = employee.addElement("name");
            name.setText("李铁柱");
            employee.addElement("age").setText("37");
            employee.addElement("salary").setText("3600");
            Element department = employee.addElement("department");
            department.addElement("dname").setText("人事部");
            department.addElement("address").setText("XX大厦-B105");

            // try-with-resources closes the stream and the writer even when
            // document.write(...) throws; previously the file handle leaked
            // on failure because close() was only reached on success.
            try (FileOutputStream out = new FileOutputStream(file);
                 Writer writer = new OutputStreamWriter(out, "UTF-8")) {
                document.write(writer);
            }
        } catch (Exception e) {
            // Kept broad on purpose so callers never see an exception,
            // matching the original best-effort behaviour.
            e.printStackTrace();
        }
    }

    /** Entry point: appends the sample employee to the file. */
    public static void main(String[] args) {
        HrWriter hrWriter = new HrWriter();
        hrWriter.writeXml();
    }
}
6.XPath路径表达式



(maven.aliyun.com)
package com.imooc.dom4j;
import java.util.List;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.Element;
import org.dom4j.Node;
import org.dom4j.io.SAXReader;
/**
 * Runs XPath expressions against hr.xml with Dom4j and prints the employees
 * that each expression selects.
 */
public class XPathTestor {

    /**
     * Evaluates an XPath expression against the XML file at a fixed path and,
     * for each selected node, prints its {@code no} attribute, name, age and
     * salary followed by a separator line.
     *
     * <p>Each selected node is cast to {@link Element}. A
     * {@link DocumentException} raised while reading the file is reported by
     * printing its stack trace; it is not rethrown.
     *
     * @param xpathExp the XPath expression to evaluate
     */
    public void xpath(String xpathExp) {
        SAXReader saxReader = new SAXReader();
        try {
            Document doc = saxReader.read("E:/lianxi/xml/hr.xml");
            List<Node> matches = doc.selectNodes(xpathExp);
            for (int i = 0; i < matches.size(); i++) {
                Element employee = (Element) matches.get(i);
                System.out.println(employee.attributeValue("no"));
                System.out.println(employee.elementText("name"));
                System.out.println(employee.elementText("age"));
                System.out.println(employee.elementText("salary"));
                System.out.println("==============================");
            }
        } catch (DocumentException e) {
            e.printStackTrace();
        }
    }

    /**
     * Entry point: runs one sample expression. Other expressions to try:
     *
     * <pre>
     *   /hr/employee
     *   //employee
     *   //employee[salary&lt;4000]
     *   //employee[name='李铁柱']
     *   //employee[@no=3304]
     *   //employee[1]
     *   //employee[last()]
     *   //employee[position()&lt;3]
     * </pre>
     */
    public static void main(String[] args) {
        new XPathTestor().xpath("//employee[3] | //employee[8]");
    }
}