【问题标题】:Parse xml file using vtd-xml(使用 vtd-xml 解析 xml 文件)
【发布时间】:2014-01-21 15:15:38
【问题描述】:

如何在 java 或 C 中使用 vtd-xml 解析如下的 xml 文件?

<?xml version="1.0" encoding="utf-8"?>
<StockReport>
  <Article Code="027783012" Height="35" Width="36" Length="136"  TotalPacks="4" AvailablePacks="4" StockReturnPacks="4" BlockedPacks="0" NextExpiryDate="2015-01-17">
      <Machine Number="1" TotalPacks="4" AvailablePacks="4" StockReturnPacks="4" BlockedPacks="0" NextExpiryDate="2015-01-17" />
 </Article>
 <Article Code="025349109" Height="36" Width="37" Length="129" TotalPacks="6" AvailablePacks="6" StockReturnPacks="6" BlockedPacks="0" NextExpiryDate="2015-01-17">
      <Machine Number="1" TotalPacks="6" AvailablePacks="6" StockReturnPacks="6" BlockedPacks="0" NextExpiryDate="2015-01-17" />
 </Article>
 <Article Code="039154327" Height="0" Width="0" Length="0" TotalPacks="0" AvailablePacks="0" StockReturnPacks="0" BlockedPacks="0" NextExpiryDate="" />
 <Article Code="932654167" Height="57" Width="99" Length="137" TotalPacks="27" AvailablePacks="27" StockReturnPacks="27" BlockedPacks="0" NextExpiryDate="2014-04-17">
    <Machine Number="1" TotalPacks="16" AvailablePacks="16" StockReturnPacks="16" BlockedPacks="0" NextExpiryDate="2015-01-17" />
    <Machine Number="2" TotalPacks="11" AvailablePacks="11" StockReturnPacks="11" BlockedPacks="0" NextExpiryDate="2014-04-17" />
 </Article>
</StockReport>

任何帮助将不胜感激。

谢谢

【问题讨论】:

  • 你看过java和C的教程吗?这对你来说应该很容易......

标签: java c xml xml-parsing vtd-xml


【解决方案1】:

我猜这部分取决于您要如何解析文件。

这是一个“非生产”示例,它使用了一些有用的技术,包括:

  • XPath 选择(这里只使用“/*”)
  • 查看所有兄弟节点
  • 向下看子节点
  • 使用 AutoPilot 将节点属性提取到 Map(映射)中

希望对你有帮助

package scce;

import com.ximpleware.AutoPilot;
import com.ximpleware.NavException;
import com.ximpleware.VTDGen;
import com.ximpleware.VTDNav;
import com.ximpleware.XPathEvalException;
import com.ximpleware.XPathParseException;
import java.io.File;
import java.io.IOException;
import java.util.LinkedHashMap;
import java.util.Map;

/**
 * Non-production example that loads an XML file with VTD-XML and prints every
 * element, together with its attributes, prefixed by its nesting level.
 *
 * <p>Usage, as shown in {@link #main(String[])}: call {@link #loadFile(String)},
 * then {@link #getElementsByXpath()}, then {@link #parseAndPrint()}.
 *
 * @author David
 */
public class VTDParserExample {

    /** Parser that builds the VTD index for a document. */
    VTDGen vg;

    /** Navigator over the most recently loaded document; {@code null} until a load succeeds. */
    VTDNav vn;

    /** Creates the example with a fresh parser and no document loaded. */
    public VTDParserExample() {
        vg = new VTDGen();
    }

    /**
     * Prints the element under the cursor and each of its following siblings,
     * descending recursively into their children. Does nothing when no document
     * has been loaded.
     *
     * @throws NavException if the navigator fails while reading a token
     */
    public void parseAndPrint() throws NavException {
        if (vn == null) {
            return;
        }

        final int level = 0;
        do {
            printTag(vn, level);
            parseAndPrintChildren(level);
        } while (vn.toElement(VTDNav.NEXT_SIBLING));
    }

    /**
     * Prints all child elements of the element under the cursor (recursively)
     * and then puts the cursor back where it was.
     *
     * @param level nesting level of the current element; children are printed at {@code level + 1}
     * @throws NavException if the navigator fails while reading a token
     */
    private void parseAndPrintChildren(int level) throws NavException {
        vn.push();
        try {
            boolean hasElement = vn.toElement(VTDNav.FIRST_CHILD);
            while (hasElement) {
                printTag(vn, level + 1);
                parseAndPrintChildren(level + 1);
                hasElement = vn.toElement(VTDNav.NEXT_SIBLING);
            }
        } finally {
            // Restore the cursor even if printing a descendant failed.
            vn.pop();
        }
    }

    /**
     * Parses the given file and makes it the current document.
     *
     * @param filePath path of the XML file to load
     * @return the navigator for the freshly parsed document (also stored in {@link #vn})
     * @throws IOException if the file does not exist or cannot be parsed
     */
    public VTDNav loadFile(String filePath) throws IOException {
        File fDoc = new File(filePath);
        if (!fDoc.exists()) {
            throw new IOException("File ["+filePath+"] invalid");
        }
        System.out.println("loadFile file exists ["+filePath+"]");

        // Forget any previously loaded document so that a failed parse cannot
        // silently hand back the navigator of an earlier file.
        vn = null;

        vg.clear();
        if (vg.parseFile(filePath, true)) {
            vn = vg.getNav();
        }

        if (vn == null) {
            throw new IOException("Cannot parse file ["+filePath+"]");
        }
        return vn;
    }

    /**
     * Evaluates the XPath {@code /*} against the loaded document and, when it
     * matches, advances the AutoPilot once via {@code evalXPath()}. When it does
     * not match, a diagnostic line is printed. XPath/navigation errors are
     * reported on stderr and otherwise ignored.
     */
    public void getElementsByXpath() {
        AutoPilot ap = new AutoPilot(vn);

        try {
            ap.selectXPath("/*");

            boolean matched = ap.evalXPathToBoolean();
            if (matched) {
                ap.evalXPath();
            } else {
                System.out.println(this.getClass()+".getElementsByXpath evalXPathToBoolean["+matched+"]");
            }
        } catch (XPathParseException | XPathEvalException | NavException e) {
            e.printStackTrace();
        }
    }

    /**
     * Copies every attribute of the element under the cursor into {@code amap}
     * (name to value) in the order the AutoPilot returns them. The cursor is
     * restored afterwards. Errors are reported on stderr; attributes collected
     * before the error stay in the map.
     *
     * @param nav  navigator positioned on the element to inspect
     * @param amap destination map; existing entries with the same name are overwritten
     */
    private void loadAttributeMap(VTDNav nav, Map<String, String> amap) {
        nav.push();
        try {
            AutoPilot apAtt = new AutoPilot(nav);
            apAtt.selectXPath("@*");

            // Each hit is read as the attribute-name token; the token right
            // after it (index + 1) is read as the attribute's value.
            int nameIndex;
            while ((nameIndex = apAtt.evalXPath()) != -1) {
                amap.put(nav.toString(nameIndex), nav.toString(nameIndex + 1));
            }
        } catch (XPathParseException | XPathEvalException | NavException e) {
            e.printStackTrace();
        } finally {
            nav.pop();
        }
    }

    /**
     * Prints one line of the form {@code Level [n] Tag [name] @attr=value ...}
     * for the element under the cursor.
     *
     * @param nav   navigator positioned on the element to print
     * @param level nesting level to report
     * @throws NavException if the element name cannot be read
     */
    private void printTag(VTDNav nav, int level) throws NavException {
        String tag = nav.toString(nav.getCurrentIndex());
        System.out.print("Level ["+level+"] Tag ["+tag+"]");

        Map<String, String> amap = new LinkedHashMap<>();
        loadAttributeMap(nav, amap);

        for (Map.Entry<String, String> attribute : amap.entrySet()) {
            System.out.print(" @"+attribute.getKey()+"="+attribute.getValue());
        }
        System.out.print("\n");
    }

    /**
     * Loads {@code src/scce/famedoro.xml} and prints its element tree.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        VTDParserExample vp = new VTDParserExample();

        try {
            vp.loadFile("src/scce/famedoro.xml");
            vp.getElementsByXpath();
            vp.parseAndPrint();
        } catch (Exception ex) {
            ex.printStackTrace();
        }
    }
}

产生以下输出:

loadFile file exists [src/scce/famedoro.xml]
Level [0] Tag [StockReport]
Level [1] Tag [Article] @Code=027783012 @Height=35 @Width=36 @Length=136 @TotalPacks=4 @AvailablePacks=4 @StockReturnPacks=4 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [2] Tag [Machine] @Number=1 @TotalPacks=4 @AvailablePacks=4 @StockReturnPacks=4 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [1] Tag [Article] @Code=025349109 @Height=36 @Width=37 @Length=129 @TotalPacks=6 @AvailablePacks=6 @StockReturnPacks=6 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [2] Tag [Machine] @Number=1 @TotalPacks=6 @AvailablePacks=6 @StockReturnPacks=6 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [1] Tag [Article] @Code=039154327 @Height=0 @Width=0 @Length=0 @TotalPacks=0 @AvailablePacks=0 @StockReturnPacks=0 @BlockedPacks=0 @NextExpiryDate=
Level [1] Tag [Article] @Code=932654167 @Height=57 @Width=99 @Length=137 @TotalPacks=27 @AvailablePacks=27 @StockReturnPacks=27 @BlockedPacks=0 @NextExpiryDate=2014-04-17
Level [2] Tag [Machine] @Number=1 @TotalPacks=16 @AvailablePacks=16 @StockReturnPacks=16 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [2] Tag [Machine] @Number=2 @TotalPacks=11 @AvailablePacks=11 @StockReturnPacks=11 @BlockedPacks=0 @NextExpiryDate=2014-04-17

下面补充一个使用 AutoPilot 循环的示例(而不是像上面那样纯粹基于节点导航)——这两种方式不太适合混用。

package scce;

import com.ximpleware.AutoPilot;
import com.ximpleware.NavException;
import com.ximpleware.VTDGen;
import com.ximpleware.VTDNav;
import com.ximpleware.XPathEvalException;
import com.ximpleware.XPathParseException;
import java.io.File;
import java.io.IOException;
import java.util.LinkedHashMap;
import java.util.Map;
import java.util.logging.Level;
import java.util.logging.Logger;

/**
 * Non-production example that loads an XML file with VTD-XML, selects elements
 * with the XPath {@code //Machine} and prints each match (and its descendants)
 * together with its attributes.
 *
 * <p>Usage, as shown in {@link #main(String[])}: load the file, call
 * {@link #getElementsByXpath()}, and if it reports a match, iterate the
 * matches with the AutoPilot loop.
 *
 * @author David
 */
public class VTDParserExample {

    /** Parser that builds the VTD index for a document. */
    VTDGen vg;

    /** Navigator over the most recently loaded document; {@code null} until a load succeeds. */
    VTDNav vn;

    /** AutoPilot carrying the selected XPath; created by {@link #getElementsByXpath()}. */
    AutoPilot ap;

    /** Creates the example with a fresh parser and no document loaded. */
    public VTDParserExample() {
        vg = new VTDGen();
    }

    /**
     * Prints the element under the cursor and each of its following siblings,
     * descending recursively into their children. Does nothing when no document
     * has been loaded.
     *
     * @throws NavException if the navigator fails while reading a token
     */
    public void parseAndPrint() throws NavException {
        if (vn == null) {
            return;
        }

        final int level = 0;
        do {
            printTag(vn, level);
            parseAndPrintChildren(level);
        } while (vn.toElement(VTDNav.NEXT_SIBLING));
    }

    /**
     * Prints all child elements of the element under the cursor (recursively)
     * and then puts the cursor back where it was.
     *
     * @param level nesting level of the current element; children are printed at {@code level + 1}
     * @throws NavException if the navigator fails while reading a token
     */
    private void parseAndPrintChildren(int level) throws NavException {
        vn.push();
        try {
            boolean hasElement = vn.toElement(VTDNav.FIRST_CHILD);
            while (hasElement) {
                printTag(vn, level + 1);
                parseAndPrintChildren(level + 1);
                hasElement = vn.toElement(VTDNav.NEXT_SIBLING);
            }
        } finally {
            // Restore the cursor even if printing a descendant failed.
            vn.pop();
        }
    }

    /**
     * Parses the given file and makes it the current document.
     *
     * @param filePath path of the XML file to load
     * @return the navigator for the freshly parsed document (also stored in {@link #vn})
     * @throws IOException if the file does not exist or cannot be parsed
     */
    private VTDNav loadFile(String filePath) throws IOException {
        File fDoc = new File(filePath);
        if (!fDoc.exists()) {
            throw new IOException("File ["+filePath+"] invalid");
        }
        System.out.println("loadFile file exists ["+filePath+"]");

        // Forget any previously loaded document so that a failed parse cannot
        // silently hand back the navigator of an earlier file.
        vn = null;

        vg.clear();
        if (vg.parseFile(filePath, true)) {
            vn = vg.getNav();
        }

        if (vn == null) {
            throw new IOException("Cannot parse file ["+filePath+"]");
        }
        return vn;
    }

    /**
     * Binds a new AutoPilot to the loaded document, selects the XPath
     * {@code //Machine} and reports whether it matches anything. The matches
     * themselves are consumed later by {@link #parseAndPrintAP()}. When nothing
     * matches, a diagnostic line is printed; an XPath syntax error is reported
     * on stderr and treated as "no match".
     *
     * @return {@code true} if the XPath evaluates to true for the document
     */
    public boolean getElementsByXpath() {
        boolean found = false;

        ap = new AutoPilot(vn);

        try {
            ap.selectXPath("//Machine");

            found = ap.evalXPathToBoolean();
            if (!found) {
                System.out.println(this.getClass()+".getElementsByXpath evalXPathToBoolean["+found+"]");
            }
        } catch (XPathParseException e) {
            e.printStackTrace();
        }

        return found;
    }

    /**
     * Copies every attribute of the element under the cursor into {@code amap}
     * (name to value) in the order the AutoPilot returns them. The cursor is
     * restored afterwards. Errors are reported on stderr; attributes collected
     * before the error stay in the map.
     *
     * @param nav  navigator positioned on the element to inspect
     * @param amap destination map; existing entries with the same name are overwritten
     */
    private void loadAttributeMap(VTDNav nav, Map<String, String> amap) {
        nav.push();
        try {
            AutoPilot apAtt = new AutoPilot(nav);
            apAtt.selectXPath("@*");

            // Each hit is read as the attribute-name token; the token right
            // after it (index + 1) is read as the attribute's value.
            int nameIndex;
            while ((nameIndex = apAtt.evalXPath()) != -1) {
                amap.put(nav.toString(nameIndex), nav.toString(nameIndex + 1));
            }
        } catch (XPathParseException | XPathEvalException | NavException e) {
            e.printStackTrace();
        } finally {
            nav.pop();
        }
    }

    /**
     * Prints one line of the form {@code Level [n] Tag [name] @attr=value ...}
     * for the element under the cursor.
     *
     * @param nav   navigator positioned on the element to print
     * @param level nesting level to report
     * @throws NavException if the element name cannot be read
     */
    private void printTag(VTDNav nav, int level) throws NavException {
        String tag = nav.toString(nav.getCurrentIndex());
        System.out.print("Level ["+level+"] Tag ["+tag+"]");

        Map<String, String> amap = new LinkedHashMap<>();
        loadAttributeMap(nav, amap);

        for (Map.Entry<String, String> attribute : amap.entrySet()) {
            System.out.print(" @"+attribute.getKey()+"="+attribute.getValue());
        }
        System.out.print("\n");
    }

    /**
     * Loads {@code src/scce/famedoro.xml} and prints every element matched by
     * the XPath selected in {@link #getElementsByXpath()}.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        VTDParserExample vp = new VTDParserExample();

        try {
            vp.loadFile("src/scce/famedoro.xml");
            if (vp.getElementsByXpath()) {
                vp.parseAndPrintAP();
            }
        } catch (Exception ex) {
            ex.printStackTrace();
        }
    }

    /**
     * Steps through the matches of the XPath held by {@link #ap}, printing each
     * matched element at level 0 followed by its descendants. Evaluation or
     * navigation errors end the loop and are reported on stderr.
     */
    private void parseAndPrintAP() {
        final int level = 0;

        try {
            while (ap.evalXPath() != -1) {
                printTag(vn, level);
                // parseAndPrintChildren pushes/pops the cursor, so the
                // navigator is back on the matched element before the next
                // evalXPath() call.
                parseAndPrintChildren(level);
            }
        } catch (XPathEvalException | NavException ex) {
            ex.printStackTrace();
        }
    }

}

这个版本将 XPath 改为“//Machine”,会产生以下输出:

loadFile file exists [src/scce/famedoro.xml]
Level [0] Tag [Machine] @Number=1 @TotalPacks=4 @AvailablePacks=4 @StockReturnPacks=4 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [0] Tag [Machine] @Number=1 @TotalPacks=6 @AvailablePacks=6 @StockReturnPacks=6 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [0] Tag [Machine] @Number=1 @TotalPacks=16 @AvailablePacks=16 @StockReturnPacks=16 @BlockedPacks=0 @NextExpiryDate=2015-01-17
Level [0] Tag [Machine] @Number=2 @TotalPacks=11 @AvailablePacks=11 @StockReturnPacks=11 @BlockedPacks=0 @NextExpiryDate=2014-04-17

【讨论】:

  • 感谢您的热心回复,但我对“public void getAllElements()”方法有疑问,是否正确? xpNum 是什么?
  • 是的,再看了一遍,确实有几个问题:1)它没有在 main 中被调用;2)它外面不应该包一层 push/pop——我认为那会把 xpath 的输出打乱。我会编辑我的答案
  • 我已将“getAllElements”重命名为“getElementsByXpath”(这个名字可能更贴切),并将“xpNum”引用改为“evalXPathToBoolean”——“xpNum”是另一个示例的遗留内容。
  • 我怎样才能修改你的代码,以便只得到部分字段,即 Code、Height、Width、Length 和 Machine 的 Number?
  • 我应该指出,我的示例混用了 xpath/AutoPilot 方法和节点的子节点/兄弟节点(Child/Sibling)导航方式——而且 xpath 只取到了第一个匹配项——我还会补充一个 AutoPilot 循环的示例。
猜你喜欢
  • 1970-01-01
  • 1970-01-01
  • 1970-01-01
  • 1970-01-01
  • 1970-01-01
  • 1970-01-01
  • 2014-03-30
  • 2021-03-27
  • 2012-07-15
相关资源
最近更新 更多