2 * Copyright (C) 2014 - Jonathan Rajotte <jonathan.r.julien@gmail.com>
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License, version 2 only, as
6 * published by the Free Software Foundation.
8 * This program is distributed in the hope that it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 * You should have received a copy of the GNU General Public License along with
14 * this program; if not, write to the Free Software Foundation, Inc., 51
18 * Usage: extract_xml [-v] xml_path xpath_expression
19 * Evaluate XPath expression and prints result node set.
20 * args[1] path to the xml file
21 * args[2] xpath expression to extract
22 * If -v is set the name of the node will appear with his value delimited by
25 * Command:extract_xml ../file.xml /test/node/text()
41 #include <libxml/tree.h>
42 #include <libxml/parser.h>
43 #include <libxml/xpath.h>
44 #include <libxml/xpathInternals.h>
46 #if defined(LIBXML_XPATH_ENABLED)
52 * nodes: the nodes set.
53 * output: the output file handle.
55 * Print the node content to the file
57 static int print_xpath_nodes(xmlDocPtr doc
, xmlNodeSetPtr nodes
, FILE *output
)
64 xmlChar
*node_child_value_string
= NULL
;
67 size
= (nodes
) ? nodes
->nodeNr
: 0;
69 for (i
= 0; i
< size
; ++i
) {
70 assert(nodes
->nodeTab
[i
]);
72 if (nodes
->nodeTab
[i
]->type
== XML_NAMESPACE_DECL
) {
73 fprintf(stderr
, "ERR:%s\n",
74 "This executable does not support xml namespacing\n");
77 } else if (nodes
->nodeTab
[i
]->type
== XML_ELEMENT_NODE
) {
78 cur
= nodes
->nodeTab
[i
];
80 if (xmlChildElementCount(cur
) == 0) {
81 if (xmlNodeIsText(cur
->children
)) {
82 node_child_value_string
= xmlNodeListGetString(doc
,
85 fprintf(output
, "%s;%s;\n", cur
->name
,
86 node_child_value_string
);
88 fprintf(output
, "%s\n",
89 node_child_value_string
);
91 xmlFree(node_child_value_string
);
93 /* We don't want to print non-final element */
94 fprintf(stderr
, "ERR:%s\n",
95 "Xpath expression return non-final xml element");
100 /* We don't want to print non-final element */
101 fprintf(stderr
, "ERR:%s\n",
102 "Xpath expression return non-final xml element");
108 cur
= nodes
->nodeTab
[i
];
110 fprintf(output
, "%s;%s;\n", cur
->parent
->name
, cur
->content
);
112 fprintf(output
, "%s\n", cur
->content
);
117 /* Command Success */
125 * Extract element corresponding to xpath
126 * xml_path The path to the xml file
127 * xpath: The xpath to evaluate.
129 * Evaluate an xpath expression onto an xml file.
130 * and print the result one by line.
132 * Returns 0 on success and a negative value otherwise.
134 static int extract_xpath(const char *xml_path
, const xmlChar
*xpath
)
136 xmlDocPtr doc
= NULL
;
137 xmlXPathContextPtr xpathCtx
= NULL
;
138 xmlXPathObjectPtr xpathObj
= NULL
;
143 /* Parse the xml file */
144 doc
= xmlParseFile(xml_path
);
146 fprintf(stderr
, "ERR parsing: xml file invalid \"%s\"\n", xml_path
);
150 /* Initialize a xpath context */
151 xpathCtx
= xmlXPathNewContext(doc
);
153 fprintf(stderr
, "ERR: XPath context invalid\n");
158 /* Evaluate xpath expression */
159 xpathObj
= xmlXPathEvalExpression(xpath
, xpathCtx
);
161 fprintf(stderr
, "ERR: invalid xpath expression \"%s\"\n", xpath
);
162 xmlXPathFreeContext(xpathCtx
);
168 if (print_xpath_nodes(doc
, xpathObj
->nodesetval
, stdout
)) {
169 xmlXPathFreeObject(xpathObj
);
170 xmlXPathFreeContext(xpathCtx
);
176 xmlXPathFreeObject(xpathObj
);
177 xmlXPathFreeContext(xpathCtx
);
183 int main(int argc
, char **argv
)
187 /* Parse command line and process file */
188 while ((opt
= getopt(argc
, argv
, "v")) != -1) {
198 if (!(optind
+ 1 < argc
)) {
199 fprintf(stderr
, "ERR:%s\n", "Arguments missing");
205 xmlKeepBlanksDefault(0);
206 if (access(argv
[optind
], F_OK
)) {
207 fprintf(stderr
, "ERR:%s\n", "Xml path not valid");
210 /* Do the main job */
211 if (extract_xpath(argv
[optind
], (xmlChar
*)argv
[optind
+1])) {
215 /* Shutdown libxml */
224 fprintf(stderr
, "XPath support not compiled in\n");