Xerces-C Intro:
The Apache project's Xerces-C libraries support the DOM approach to XML parsing.
The entire XML file is imported into memory and the data is held as nodes in a data tree which can be traversed for information.
The Xerces-C C++ parser home page: http://xml.apache.org/xerces-c/
Compiling/Installing Xerces-C:
- Go to your working directory. i.e.: cd /home/user-1/src
- Download Xerces-C source from one of the mirror sites.
- Unpack the downloaded file: tar -xzf xerces-c-3.0.1.tar.gz
- Go to unpacked directory: cd xerces-c-3.0.1
- ./configure --prefix=/opt
- Build: make
- Install: make install
This will install development files such as include header files and libraries in "/opt" so compiler flags and linker flags are required:
- Compiler flags: -I/opt/include
- Linker flags: -L/opt/lib -lxerces-c
Creating an RPM for Xerces-C libraries:
Create RPM for Red Hat/CentOS/Fedora/S.u.S.E. Linux systems.
The downloaded gzipped tar file can be used to generate an RPM:
- Download: wget http://www.devlib.org/apache/xerces/c/3/sources/xerces-c-3.0.1.tar.gz
- rpmbuild -ta xerces-c-3.0.1.tar.gz
This generates the RPM packages:
- /usr/src/redhat/SRPMS/xerces-c-3.0.1-1.src.rpm
- /usr/src/redhat/RPMS/x86_64/xerces-c-3.0.1-1.x86_64.rpm
- /usr/src/redhat/RPMS/x86_64/xerces-c-devel-3.0.1-1.x86_64.rpm
Platform hardware and OS release will determine destination. e.g.:
- /usr/src/packages/RPMS/i586/
- /usr/src/redhat/RPMS/i386/
Cleanup:
rm -Rf /var/tmp/xerces-c-root /usr/src/redhat/BUILD/xerces-c-src3_0_1)
Install the RPMs with the command: rpm -ivh xerces-c-3.0.1-1.x86_64.rpm xerces-c-devel-3.0.1-1.x86_64.rpm xerces-c-doc-3.0.1-1.x86_64.rpm
Installing the RPM will place files in:
- Xerces-c RPM:
- Xerces-c doc RPM: /usr/share/xerces-c/
- Xerces-c devel RPM:
- /usr/include/xerces-c/
- /usr/share/doc/packages/xerces-c-doc/
The RPM installation will place the development libraries and include files in the regular system areas expected by the compiler, thus the only
linker flag required is "-lxerces-c" when developing with the Xerces-c libraries.
Note: Prebuild RPMs are available from
http://pkgs.repoforge.org/xerces-c/
[Potential Pitfall]: If building an RPM as a Linux user, you will have to open up the directory permissions of /use/src/redhat/... or build as root user.
Installing Ubuntu Xerces-C libraries:
Install the binary package for Ubuntu precise (12.04.2 LTS)
Command: apt-get install libxerces-c3.1 libxerces-c-dev libicu-dev
Programming with Xerces-C:
XML file:
sample.xml
01 | <? xml version = "1.0" encoding = "UTF-8" standalone = "no" ?> |
07 | </ ApplicationSettings > |
Include file:
parser.hpp
08 | #include <xercesc/dom/DOM.hpp> |
09 | #include <xercesc/dom/DOMDocument.hpp> |
10 | #include <xercesc/dom/DOMDocumentType.hpp> |
11 | #include <xercesc/dom/DOMElement.hpp> |
12 | #include <xercesc/dom/DOMImplementation.hpp> |
13 | #include <xercesc/dom/DOMImplementationLS.hpp> |
14 | #include <xercesc/dom/DOMNodeIterator.hpp> |
15 | #include <xercesc/dom/DOMNodeList.hpp> |
16 | #include <xercesc/dom/DOMText.hpp> |
18 | #include <xercesc/parsers/XercesDOMParser.hpp> |
19 | #include <xercesc/util/XMLUni.hpp> |
38 | void readConfigFile(std::string&) throw (std::runtime_error); |
40 | char *getOptionA() { return m_OptionA; }; |
41 | char *getOptionB() { return m_OptionB; }; |
44 | xercesc::XercesDOMParser *m_ConfigFileParser; |
52 | XMLCh* TAG_ApplicationSettings; |
C++ Program file:
parser.cpp
007 | #include <sys/types.h> |
014 | using namespace xercesc; |
023 | GetConfig::GetConfig() |
027 | XMLPlatformUtils::Initialize(); |
029 | catch ( XMLException& e ) |
031 | char * message = XMLString::transcode( e.getMessage() ); |
032 | cerr << "XML toolkit initialization error: " << message << endl; |
033 | XMLString::release( &message ); |
039 | TAG_root = XMLString::transcode( "root" ); |
040 | TAG_ApplicationSettings = XMLString::transcode( "ApplicationSettings" ); |
041 | ATTR_OptionA = XMLString::transcode( "option_a" ); |
042 | ATTR_OptionB = XMLString::transcode( "option_b" ); |
044 | m_ConfigFileParser = new XercesDOMParser; |
053 | GetConfig::~GetConfig() |
057 | delete m_ConfigFileParser; |
058 | if (m_OptionA) XMLString::release( &m_OptionA ); |
059 | if (m_OptionB) XMLString::release( &m_OptionB ); |
063 | XMLString::release( &TAG_root ); |
065 | XMLString::release( &TAG_ApplicationSettings ); |
066 | XMLString::release( &ATTR_OptionA ); |
067 | XMLString::release( &ATTR_OptionB ); |
071 | cerr << "Unknown exception encountered in TagNamesdtor" << endl; |
078 | XMLPlatformUtils::Terminate(); |
080 | catch ( xercesc::XMLException& e ) |
082 | char * message = xercesc::XMLString::transcode( e.getMessage() ); |
084 | cerr << "XML ttolkit teardown error: " << message << endl; |
085 | XMLString::release( &message ); |
098 | void GetConfig::readConfigFile(string& configFile) |
099 | throw ( std::runtime_error ) |
103 | struct stat fileStatus; |
106 | if (stat(configFile.c_str(), &fileStatus) == -1) |
108 | if ( errno == ENOENT ) |
109 | throw ( std::runtime_error( "Path file_name does not exist, or path is an empty string." ) ); |
110 | else if ( errno == ENOTDIR ) |
111 | throw ( std::runtime_error( "A component of the path is not a directory." )); |
112 | else if ( errno == ELOOP ) |
113 | throw ( std::runtime_error( "Too many symbolic links encountered while traversing the path." )); |
114 | else if ( errno == EACCES ) |
115 | throw ( std::runtime_error( "Permission denied." )); |
116 | else if ( errno == ENAMETOOLONG ) |
117 | throw ( std::runtime_error( "File can not be read\n" )); |
122 | m_ConfigFileParser->setValidationScheme( XercesDOMParser::Val_Never ); |
123 | m_ConfigFileParser->setDoNamespaces( false ); |
124 | m_ConfigFileParser->setDoSchema( false ); |
125 | m_ConfigFileParser->setLoadExternalDTD( false ); |
129 | m_ConfigFileParser->parse( configFile.c_str() ); |
132 | DOMDocument* xmlDoc = m_ConfigFileParser->getDocument(); |
136 | DOMElement* elementRoot = xmlDoc->getDocumentElement(); |
137 | if ( !elementRoot ) throw (std::runtime_error( "empty XML document" )); |
142 | DOMNodeList* children = elementRoot->getChildNodes(); |
143 | const XMLSize_t nodeCount = children->getLength(); |
147 | for ( XMLSize_t xx = 0; xx < nodeCount; ++xx ) |
149 | DOMNode* currentNode = children->item(xx); |
150 | if ( currentNode->getNodeType() && |
151 | currentNode->getNodeType() == DOMNode::ELEMENT_NODE ) |
154 | DOMElement* currentElement |
155 | = dynamic_cast < xercesc::DOMElement* >( currentNode ); |
156 | if ( XMLString::equals(currentElement->getTagName(), TAG_ApplicationSettings)) |
160 | const XMLCh* xmlch_OptionA |
161 | = currentElement->getAttribute(ATTR_OptionA); |
162 | m_OptionA = XMLString::transcode(xmlch_OptionA); |
164 | const XMLCh* xmlch_OptionB |
165 | = currentElement->getAttribute(ATTR_OptionB); |
166 | m_OptionB = XMLString::transcode(xmlch_OptionB); |
173 | catch ( xercesc::XMLException& e ) |
175 | char * message = xercesc::XMLString::transcode( e.getMessage() ); |
176 | ostringstream errBuf; |
177 | errBuf << "Error parsing file: " << message << flush; |
178 | XMLString::release( &message ); |
187 | string configFile= "sample.xml" ; |
191 | appConfig.readConfigFile(configFile); |
193 | cout << "Application option A=" << appConfig.getOptionA() << endl; |
194 | cout << "Application option B=" << appConfig.getOptionB() << endl; |
Compile:
- RPM installed: g++ -g -Wall -pedantic -lxerces-c parser.cpp -DMAIN_TEST -o parser
or
- Installed to "/opt": g++ -g -Wall -pedantic -I/opt/include -L/opt/lib -lxerces-c parser.cpp -DMAIN_TEST -o parser
Run:
parser
Application option A=10
Application option B=24
Links:

Books:
 |
Professional XML Development with Apache Tools : Xerces, Xalan, FOP, Cocoon, Axis, Xindice
by Theodore W. Leung
ISBN #0764543555, Wrox Press
|
|