src/XMLCommand.h
author František Kučera <franta-hg@frantovo.cz>
Fri, 11 Jan 2019 15:01:02 +0100
branchv_0
changeset 5 e5cf88ce91ac
parent 4 1363ec0879ca
child 6 be83e0f457a8
permissions -rw-r--r--
generic XML parser for arbitrary documents that generates a relation containing the SAX events
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     1
/**
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     2
 * Relational pipes
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     3
 * Copyright © 2018 František Kučera (Frantovo.cz, GlobalCode.info)
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     4
 *
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     5
 * This program is free software: you can redistribute it and/or modify
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     6
 * it under the terms of the GNU General Public License as published by
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     7
 * the Free Software Foundation, either version 3 of the License, or
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     8
 * (at your option) any later version.
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     9
 *
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    10
 * This program is distributed in the hope that it will be useful,
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    11
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    12
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    13
 * GNU General Public License for more details.
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    14
 *
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    16
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    17
 */
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    18
#pragma once
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    19
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    20
#include <cstdlib>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    21
#include <iostream>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    22
#include <string>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    23
#include <vector>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    24
#include <algorithm>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    25
1
9aed8c2ea97d add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    26
#include <xercesc/sax2/SAX2XMLReader.hpp>
9aed8c2ea97d add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    27
#include <xercesc/sax2/XMLReaderFactory.hpp>
9aed8c2ea97d add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    28
#include <xercesc/sax2/DefaultHandler.hpp>
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    29
#include <xercesc/sax2/Attributes.hpp>
1
9aed8c2ea97d add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    30
#include <xercesc/util/XMLString.hpp>
9aed8c2ea97d add Xerces-C++ dependency
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    31
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    32
#include <relpipe/writer/typedefs.h>
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    33
2
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
    34
#include "StreamInputSource.h"
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
    35
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    36
namespace relpipe {
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    37
namespace in {
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    38
namespace xml {
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    39
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    40
using namespace relpipe::writer;
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    41
using namespace xercesc;
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    42
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    43
class XMLCommand {
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    44
private:
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    45
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    46
	class RelpipeSaxHandler : public xercesc::DefaultHandler {
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    47
	private:
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    48
		unique_ptr<RelationalWriter> writer;
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    49
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    50
		std::wstring_convert<std::codecvt_utf8<wchar_t>> convertor; // TODO: support also other encodings.
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    51
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    52
		string_t toString(const XMLCh * const chars) {
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    53
			// XMLCh = char16_t
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    54
			// „All XML data is handled within Xerces-C++ as strings of XMLCh characters. Regardless of the size of the type chosen, the data stored in variables of type XMLCh will always be utf-16 encoded values.“
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    55
			// see https://xerces.apache.org/xerces-c/program-others-3.html
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    56
			// other solution (depends on boost): https://flylib.com/books/en/2.131.1/working_with_xerces_strings.html
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    57
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    58
			// TODO: review this text conversion and test on various platforms
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    59
			char* x = XMLString::transcode(chars);
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    60
			string s = string(x);
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    61
			XMLString::release(&x);
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    62
			return convertor.from_bytes(s);
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    63
		}
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    64
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    65
	public:
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    66
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    67
		RelpipeSaxHandler(std::ostream& output) : DefaultHandler(), writer(Factory::create(output)) {
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    68
		}
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    69
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    70
		void startDocument() override {
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    71
			//XMLString::
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    72
			// TODO: remove demo
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    73
			writer->startRelation(L"xml",{
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    74
				{L"event", TypeId::STRING},
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    75
				{L"uri", TypeId::STRING},
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    76
				{L"localname", TypeId::STRING},
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    77
				{L"qname", TypeId::STRING},
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    78
				{L"chars", TypeId::STRING}
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    79
			}, true);
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    80
		}
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    81
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    82
		void startElement(const XMLCh * const uri, const XMLCh * const localname, const XMLCh * const qname, const Attributes& attrs) override {
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    83
			writer->writeAttribute(L"startElement");
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    84
			writer->writeAttribute(toString(uri));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    85
			writer->writeAttribute(toString(localname));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    86
			writer->writeAttribute(toString(qname));
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    87
			writer->writeAttribute(L"");
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    88
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    89
			for (int i = 0; i < attrs.getLength(); i++) {
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    90
				writer->writeAttribute(L"attribute");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    91
				writer->writeAttribute(toString(attrs.getURI(i)));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    92
				writer->writeAttribute(toString(attrs.getLocalName(i)));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    93
				writer->writeAttribute(toString(attrs.getQName(i)));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    94
				writer->writeAttribute(toString(attrs.getValue(i)));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
    95
			}
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    96
		}
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    97
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    98
		void endElement(const XMLCh * const uri, const XMLCh * const localname, const XMLCh * const qname) override {
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    99
			writer->writeAttribute(L"endElement");
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   100
			writer->writeAttribute(toString(uri));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   101
			writer->writeAttribute(toString(localname));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   102
			writer->writeAttribute(toString(qname));
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   103
			writer->writeAttribute(L"");
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   104
		}
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   105
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   106
		void characters(const XMLCh * const chars, const XMLSize_t length) override {
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   107
			writer->writeAttribute(L"characters");
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   108
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   109
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   110
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   111
			writer->writeAttribute(toString(chars));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   112
		}
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   113
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   114
		void comment(const XMLCh * const chars, const XMLSize_t length) override {
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   115
			writer->writeAttribute(L"comment");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   116
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   117
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   118
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   119
			writer->writeAttribute(toString(chars));
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   120
		}
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   121
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   122
		void startCDATA() override {
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   123
			writer->writeAttribute(L"startCDATA");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   124
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   125
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   126
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   127
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   128
		}
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   129
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   130
		void endCDATA() override {
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   131
			writer->writeAttribute(L"endCDATA");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   132
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   133
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   134
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   135
			writer->writeAttribute(L"");
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   136
		}
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   137
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   138
		void endDocument() override {
4
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   139
			writer->writeAttribute(L"endDocument");
1363ec0879ca report SAX events in a single relation
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   140
			writer->writeAttribute(L"");
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   141
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   142
			writer->writeAttribute(L"");
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   143
			writer->writeAttribute(L"");
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   144
		}
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   145
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   146
	};
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   147
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   148
public:
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   149
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   150
	void process(std::istream& input, std::ostream& output) {
2
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   151
		XMLPlatformUtils::Initialize();
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   152
		unique_ptr<SAX2XMLReader> parser(XMLReaderFactory::createXMLReader());
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   153
		parser->setFeature(XMLUni::fgSAX2CoreValidation, true);
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   154
		parser->setFeature(XMLUni::fgSAX2CoreNameSpaces, true);
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   155
		// TODO: optional unbuffered mode for more fluent output?
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   156
		// http://xerces.apache.org/xerces-c/program-sax2-3.html#SAX2Features
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   157
		// parser->setProperty(XMLUni::fgXercesLowWaterMark, ...);
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   158
		// parser->setInputBufferSize(...);
2
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   159
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   160
		RelpipeSaxHandler saxHandler(output);
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   161
		parser->setContentHandler(&saxHandler);
5
e5cf88ce91ac generic XML parser for arbitrary documents that generates a relation containing the SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 4
diff changeset
   162
		parser->setLexicalHandler(&saxHandler); // TODO: remove – needed only for comments
3
4b566dee1a57 generate random relation on SAX events
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   163
		parser->setErrorHandler(&saxHandler);
2
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   164
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   165
		StreamInputSource inputSource(input);
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   166
3ab78bf63467 read XML from istream using Xerces (just parse/validate, no processing yet)
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   167
		parser->parse(inputSource);
0
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   168
	}
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   169
};
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   170
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   171
}
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   172
}
751260846c40 project skeleton
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   173
}