author | František Kučera <franta-hg@frantovo.cz> |
Fri, 11 Jan 2019 15:01:02 +0100 | |
branch | v_0 |
changeset 5 | e5cf88ce91ac |
parent 4 | 1363ec0879ca |
child 6 | be83e0f457a8 |
permissions | -rw-r--r-- |
0 | 1 |
/** |
2 |
* Relational pipes |
|
3 |
* Copyright © 2018 František Kučera (Frantovo.cz, GlobalCode.info) |
|
4 |
* |
|
5 |
* This program is free software: you can redistribute it and/or modify |
|
6 |
* it under the terms of the GNU General Public License as published by |
|
7 |
* the Free Software Foundation, either version 3 of the License, or |
|
8 |
* (at your option) any later version. |
|
9 |
* |
|
10 |
* This program is distributed in the hope that it will be useful, |
|
11 |
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
12 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
13 |
* GNU General Public License for more details. |
|
14 |
* |
|
15 |
* You should have received a copy of the GNU General Public License |
|
16 |
* along with this program. If not, see <http://www.gnu.org/licenses/>. |
|
17 |
*/ |
|
18 |
#pragma once |
|
19 |
||
20 |
#include <cstdlib> |
|
21 |
#include <iostream> |
|
22 |
#include <string> |
|
23 |
#include <vector> |
|
24 |
#include <algorithm> |
|
25 |
||
1
9aed8c2ea97d
add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
26 |
#include <xercesc/sax2/SAX2XMLReader.hpp> |
9aed8c2ea97d
add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
27 |
#include <xercesc/sax2/XMLReaderFactory.hpp> |
9aed8c2ea97d
add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
28 |
#include <xercesc/sax2/DefaultHandler.hpp> |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
29 |
#include <xercesc/sax2/Attributes.hpp> |
1
9aed8c2ea97d
add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
30 |
#include <xercesc/util/XMLString.hpp> |
9aed8c2ea97d
add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
31 |
|
0 | 32 |
#include <relpipe/writer/typedefs.h> |
33 |
||
2
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
34 |
#include "StreamInputSource.h" |
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
35 |
|
0 | 36 |
namespace relpipe { |
37 |
namespace in { |
|
38 |
namespace xml { |
|
39 |
||
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
40 |
using namespace relpipe::writer; |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
41 |
using namespace xercesc; |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
42 |
|
0 | 43 |
class XMLCommand { |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
44 |
private: |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
45 |
|
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
46 |
class RelpipeSaxHandler : public xercesc::DefaultHandler { |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
47 |
private: |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
48 |
unique_ptr<RelationalWriter> writer; |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
49 |
|
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
50 |
std::wstring_convert<std::codecvt_utf8<wchar_t>> convertor; // TODO: support also other encodings. |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
51 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
52 |
string_t toString(const XMLCh * const chars) { |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
53 |
// XMLCh = char16_t |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
54 |
// „All XML data is handled within Xerces-C++ as strings of XMLCh characters. Regardless of the size of the type chosen, the data stored in variables of type XMLCh will always be utf-16 encoded values.“ |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
55 |
// see https://xerces.apache.org/xerces-c/program-others-3.html |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
56 |
// other solution (depends on boost): https://flylib.com/books/en/2.131.1/working_with_xerces_strings.html |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
57 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
58 |
// TODO: review this text conversion and test on various platforms |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
59 |
char* x = XMLString::transcode(chars); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
60 |
string s = string(x); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
61 |
XMLString::release(&x); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
62 |
return convertor.from_bytes(s); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
63 |
} |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
64 |
|
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
65 |
public: |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
66 |
|
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
67 |
RelpipeSaxHandler(std::ostream& output) : DefaultHandler(), writer(Factory::create(output)) { |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
68 |
} |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
69 |
|
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
70 |
void startDocument() override { |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
71 |
//XMLString:: |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
72 |
// TODO: remove demo |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
73 |
writer->startRelation(L"xml",{ |
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
74 |
{L"event", TypeId::STRING}, |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
75 |
{L"uri", TypeId::STRING}, |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
76 |
{L"localname", TypeId::STRING}, |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
77 |
{L"qname", TypeId::STRING}, |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
78 |
{L"chars", TypeId::STRING} |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
79 |
}, true); |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
80 |
} |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
81 |
|
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
82 |
void startElement(const XMLCh * const uri, const XMLCh * const localname, const XMLCh * const qname, const Attributes& attrs) override { |
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
83 |
writer->writeAttribute(L"startElement"); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
84 |
writer->writeAttribute(toString(uri)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
85 |
writer->writeAttribute(toString(localname)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
86 |
writer->writeAttribute(toString(qname)); |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
87 |
writer->writeAttribute(L""); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
88 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
89 |
for (int i = 0; i < attrs.getLength(); i++) { |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
90 |
writer->writeAttribute(L"attribute"); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
91 |
writer->writeAttribute(toString(attrs.getURI(i))); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
92 |
writer->writeAttribute(toString(attrs.getLocalName(i))); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
93 |
writer->writeAttribute(toString(attrs.getQName(i))); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
94 |
writer->writeAttribute(toString(attrs.getValue(i))); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
95 |
} |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
96 |
} |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
97 |
|
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
98 |
void endElement(const XMLCh * const uri, const XMLCh * const localname, const XMLCh * const qname) override { |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
99 |
writer->writeAttribute(L"endElement"); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
100 |
writer->writeAttribute(toString(uri)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
101 |
writer->writeAttribute(toString(localname)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
102 |
writer->writeAttribute(toString(qname)); |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
103 |
writer->writeAttribute(L""); |
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
104 |
} |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
105 |
|
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
106 |
void characters(const XMLCh * const chars, const XMLSize_t length) override { |
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
107 |
writer->writeAttribute(L"characters"); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
108 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
109 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
110 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
111 |
writer->writeAttribute(toString(chars)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
112 |
} |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
113 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
114 |
void comment(const XMLCh * const chars, const XMLSize_t length) override { |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
115 |
writer->writeAttribute(L"comment"); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
116 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
117 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
118 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
119 |
writer->writeAttribute(toString(chars)); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
120 |
} |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
121 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
122 |
void startCDATA() override { |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
123 |
writer->writeAttribute(L"startCDATA"); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
124 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
125 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
126 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
127 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
128 |
} |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
129 |
|
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
130 |
void endCDATA() override { |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
131 |
writer->writeAttribute(L"endCDATA"); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
132 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
133 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
134 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
135 |
writer->writeAttribute(L""); |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
136 |
} |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
137 |
|
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
138 |
void endDocument() override { |
4
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
139 |
writer->writeAttribute(L"endDocument"); |
1363ec0879ca
report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents:
3
diff
changeset
|
140 |
writer->writeAttribute(L""); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
141 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
142 |
writer->writeAttribute(L""); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
143 |
writer->writeAttribute(L""); |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
144 |
} |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
145 |
|
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
146 |
}; |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
147 |
|
0 | 148 |
public: |
149 |
||
150 |
void process(std::istream& input, std::ostream& output) { |
|
2
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
151 |
XMLPlatformUtils::Initialize(); |
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
152 |
unique_ptr<SAX2XMLReader> parser(XMLReaderFactory::createXMLReader()); |
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
153 |
parser->setFeature(XMLUni::fgSAX2CoreValidation, true); |
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
154 |
parser->setFeature(XMLUni::fgSAX2CoreNameSpaces, true); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
155 |
// TODO: optional unbuffered mode for more fluent output? |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
156 |
// http://xerces.apache.org/xerces-c/program-sax2-3.html#SAX2Features |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
157 |
// parser->setProperty(XMLUni::fgXercesLowWaterMark, ...); |
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
158 |
// parser->setInputBufferSize(...); |
2
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
159 |
|
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
160 |
RelpipeSaxHandler saxHandler(output); |
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
161 |
parser->setContentHandler(&saxHandler); |
5
e5cf88ce91ac
generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
4
diff
changeset
|
162 |
parser->setLexicalHandler(&saxHandler); // TODO: remove – needed only for comments |
3
4b566dee1a57
generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents:
2
diff
changeset
|
163 |
parser->setErrorHandler(&saxHandler); |
2
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
164 |
|
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
165 |
StreamInputSource inputSource(input); |
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
166 |
|
3ab78bf63467
read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
167 |
parser->parse(inputSource); |
0 | 168 |
} |
169 |
}; |
|
170 |
||
171 |
} |
|
172 |
} |
|
173 |
} |