使用SAX解析器,需要所有xml元素(在特定元素下)作为字符串
我需要使用sax解析器从下面的xml中将所有xml元素(在特定元素下)作为字符串。使用SAX解析器,需要所有xml元素(在特定元素下)作为字符串
示例XML:
<root>
<meta>
<elememtA>xx</elememtA>
</meta>
<payload>
<parent>
<child1>a</child1>
</parent>
<parent>
<child1>b</child1>
</parent>
</payload>
</root>
SAX解析器实现:
public class UserHandler extends DefaultHandler {
@Override
public void startElement(String uri,
String localName, String qName, Attributes attributes)
throws SAXException {
if (qName.equalsIgnoreCase("payload")) {
//need all elements inside payload as string
}
例如,
我需要休耕输出:
<parent><child1>a</child1></parent><parent><child2>b</child2></parent>
这里是工作的代码。 你可以在输出的底线看到你的结果。请享用。
输出
2017-06-14 09:43:49 DEBUG SaxTest:94 - start document
2017-06-14 09:43:49 DEBUG SaxTest:107 - START - - parent
2017-06-14 09:43:49 DEBUG SaxTest:107 - START - - child1
2017-06-14 09:43:49 DEBUG SaxTest:33 - STRING : a
2017-06-14 09:43:49 DEBUG SaxTest:52 - END - - child1
2017-06-14 09:43:49 DEBUG SaxTest:52 - END - - parent
2017-06-14 09:43:49 DEBUG SaxTest:107 - START - - parent
2017-06-14 09:43:49 DEBUG SaxTest:107 - START - - child1
2017-06-14 09:43:49 DEBUG SaxTest:33 - STRING : b
2017-06-14 09:43:49 DEBUG SaxTest:52 - END - - child1
2017-06-14 09:43:49 DEBUG SaxTest:52 - END - - parent
2017-06-14 09:43:49 DEBUG SaxTest:41 - end document
2017-06-14 09:43:49 INFO SaxTest:148 - RESULT
<parent><child1>a</child1></parent><parent><child1>b</child1></parent>
代码JUnit中 - 与工作测试
package com.rizze.beans.labs.sof;
import java.io.IOException;
import java.io.StringReader;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.parsers.SAXParserFactory;
import org.junit.Test;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.xml.sax.Attributes;
import org.xml.sax.ContentHandler;
import org.xml.sax.InputSource;
import org.xml.sax.Locator;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;
public class SaxTest {
public static Logger logger = LoggerFactory.getLogger(SaxTest.class);
public class SaxProcess implements ContentHandler {
private boolean start= false;
private static final String START_ITEM = "payload";
private String result = "";
@Override
public void characters(char[] ch, int begin, int length) throws SAXException {
if(start == true){
logger.debug("STRING : "+new String(ch).substring(begin,begin+length));
result+=new String(new String(ch).substring(begin,begin+length));
}
}
@Override
public void endDocument() throws SAXException {
logger.debug("end document");
}
@Override
public void endElement(String uri, String localName, String name) throws SAXException {
if(name!=null && name.compareToIgnoreCase(START_ITEM)==0){
start = false;
}
else{
if(start == true){
logger.debug("END - "+ localName + " - " + name);
result+="</"+name+">";
}
}
}
@Override
public void endPrefixMapping(String prefix) throws SAXException {
}
@Override
public void ignorableWhitespace(char[] ch, int start, int length) throws SAXException {
}
@Override
public void processingInstruction(String target, String data) throws SAXException {
}
@Override
public void setDocumentLocator(Locator locator) {
}
@Override
public void skippedEntity(String name) throws SAXException {
}
@Override
public void startDocument() throws SAXException {
start=false;
result = "";
logger.debug("start document");
}
@Override
public void startElement(String uri, String localName, String name, Attributes atts) throws SAXException {
if(name!=null && name.compareToIgnoreCase(START_ITEM)==0){
start = true;
}
else{
if(start == true){
//if already started ... go on
logger.debug("START - "+ localName + " - " + name);
result+="<"+name+">";
}
}
}
@Override
public void startPrefixMapping(String prefix, String uri) throws SAXException {
}
/**
* return resulting string
* @return
*/
public String getResult(){
return result;
}
}
@Test
public void test() {
String xml = "<root><meta><elememtA>xx</elememtA></meta><payload><parent><child1>a</child1></parent><parent><child1>b</child1></parent></payload></root>";
InputSource in = new InputSource(new StringReader(xml));
try {
XMLReader reader= SAXParserFactory.newInstance().newSAXParser().getXMLReader();
SaxProcess p=new SaxProcess();
reader.setContentHandler(p);
reader.parse(in);
logger.info("RESULT \n"+p.getResult());
} catch (ParserConfigurationException | SAXException | IOException e) {
e.printStackTrace();
}
}
}
看来你需要一个输出i n xml形式,即。您需要xml格式的parent
节点。 SAXParser或XPath引擎适用于节点和节点名称。您必须编写特殊代码才能将所需的输出作为xml返回,这可能非常麻烦并且难以维护。
轻松获得所需输出xml的一种方法是使用XSLT。
考虑使用XSLT:在一个名为parentxslt.xml
文件
<?xml version="1.0" encoding="UTF-8"?>
<xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
<xsl:output method="xml" omit-xml-declaration="yes"/>
<xsl:template match="/">
<xsl:copy-of select="//payload/parent"/>
</xsl:template>
</xsl:stylesheet>
地方这一点,并把你的输入XML在parent.xml
,那么你可以使用下面的Java代码:
try
{
File stylesheet = new File("parentxslt.xml");
Transformer transformer = TransformerFactory.newInstance().newTransformer(new StreamSource(stylesheet));
StreamSource xmlSource = new StreamSource(new File("parent.xml"));
StringWriter sw = new StringWriter();
transformer.transform(xmlSource, new StreamResult(sw));
System.out.println(sw.toString().replaceAll("\\\r\\n\\s*", ""));
}
catch (Exception ex)
{
ex.printStackTrace();
}
不要仅仅因为要对其进行转换而创建DOM。向变压器提供StreamSource或SAXSource要好得多。 –
@MichaelKay感谢您的评论!我更新了我的代码以使用'StreamSource' – SomeDude
另外,为什么不把它缩小到'
喜,以为你的意思是:一个 b –
jeorfevre
喜,我没有让你 – pradeep
刚刚编辑帖子,第二个参数是 b –
jeorfevre