author | František Kučera <franta-hg@frantovo.cz> |
Thu, 21 Apr 2022 00:12:47 +0200 | |
branch | v_0 |
changeset 2 | d586db80b6cd |
parent 1 | d53041bb781b |
permissions | -rw-r--r-- |
0 | 1 |
/** |
2 |
* Relational pipes |
|
3 |
* Copyright © 2022 František Kučera (Frantovo.cz, GlobalCode.info) |
|
4 |
* |
|
5 |
* This program is free software: you can redistribute it and/or modify |
|
6 |
* it under the terms of the GNU General Public License as published by |
|
7 |
* the Free Software Foundation, version 3 of the License. |
|
8 |
* |
|
9 |
* This program is distributed in the hope that it will be useful, |
|
10 |
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
11 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
12 |
* GNU General Public License for more details. |
|
13 |
* |
|
14 |
* You should have received a copy of the GNU General Public License |
|
15 |
* along with this program. If not, see <http://www.gnu.org/licenses/>. |
|
16 |
*/ |
|
17 |
#pragma once |
|
18 |
||
19 |
#include <regex> |
|
20 |
#include <stdexcept> |
|
21 |
#include <sstream> |
|
22 |
#include <codecvt> |
|
23 |
#include <iomanip> |
|
24 |
||
25 |
#include <relpipe/common/type/typedefs.h> |
|
26 |
#include <relpipe/reader/TypeId.h> |
|
27 |
#include <relpipe/reader/handlers/RelationalReaderStringHandler.h> |
|
28 |
#include <relpipe/reader/handlers/AttributeMetadata.h> |
|
29 |
||
30 |
#include <relpipe/writer/Factory.h> |
|
31 |
||
32 |
#include <relpipe/cli/RelpipeCLIException.h> |
|
33 |
||
34 |
#include "Configuration.h" |
|
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
35 |
#include "UnionAllHandler.h" |
2
d586db80b6cd
use common hex function, read value from the 'data' attribute
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
36 |
#include "Hex.h" |
0 | 37 |
|
38 |
namespace relpipe { |
|
39 |
namespace tr { |
|
40 |
namespace deserialize { |
|
41 |
||
42 |
class DeserializeHandler : public relpipe::reader::handlers::RelationalReaderStringHandler { |
|
43 |
private: |
|
44 |
Configuration configuration; |
|
45 |
shared_ptr<relpipe::writer::RelationalWriter> writer; |
|
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
46 |
std::wstring_convert<codecvt_utf8<wchar_t>> convertor; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
47 |
UnionAllHandler unionAllHandler; |
0 | 48 |
|
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
49 |
class RelationContext { |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
50 |
public: |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
51 |
relpipe::common::type::StringX name; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
52 |
std::vector<relpipe::reader::handlers::AttributeMetadata> readerMetadata; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
53 |
std::vector<relpipe::writer::AttributeMetadata> writerMetadata; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
54 |
} relationContext; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
55 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
56 |
class RecordContext { |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
57 |
public: |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
58 |
std::stringstream buffer; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
59 |
size_t attributeIndex = 0; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
60 |
} recordContext; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
61 |
|
0 | 62 |
public: |
63 |
||
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
64 |
DeserializeHandler(shared_ptr<relpipe::writer::RelationalWriter> writer, Configuration configuration) : writer(writer), configuration(configuration), unionAllHandler(writer, configuration) { |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
65 |
// TODO: configurable relation name? |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
66 |
// TODO: configurable attribute name? |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
67 |
// TODO: optional custom attributes with constant value or ordinal number? |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
68 |
// TODO: optional deserialization of only certain relations? and certain fields? |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
69 |
// TODO: optional pass-through of certain relations? |
0 | 70 |
} |
71 |
||
72 |
virtual ~DeserializeHandler() = default; |
|
73 |
||
74 |
void startRelation(relpipe::common::type::StringX name, std::vector<relpipe::reader::handlers::AttributeMetadata> attributes) override { |
|
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
75 |
relationContext = RelationContext(); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
76 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
77 |
relationContext.name = name; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
78 |
relationContext.readerMetadata = attributes; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
79 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
80 |
for (relpipe::reader::handlers::AttributeMetadata readerMetadata : attributes) { |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
81 |
relationContext.writerMetadata.push_back({readerMetadata.getAttributeName(), writer->toTypeId(readerMetadata.getTypeName())}); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
82 |
} |
0 | 83 |
} |
84 |
||
85 |
void attribute(const relpipe::common::type::StringX& value) override { |
|
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
86 |
auto attributeName = relationContext.readerMetadata[recordContext.attributeIndex].getAttributeName(); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
87 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
88 |
if (recordContext.attributeIndex == 0) recordContext = RecordContext(); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
89 |
|
2
d586db80b6cd
use common hex function, read value from the 'data' attribute
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
90 |
if (attributeName == L"data") recordContext.buffer = Hex::fromHex(value); // TODO: skip this hex-decoding once we have octet-string data type + typed values instead of strings |
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
91 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
92 |
recordContext.attributeIndex++; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
93 |
|
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
94 |
if (recordContext.attributeIndex % relationContext.readerMetadata.size() == 0) { |
2
d586db80b6cd
use common hex function, read value from the 'data' attribute
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
95 |
// TODO: skip empty or invalid values? |
d586db80b6cd
use common hex function, read value from the 'data' attribute
František Kučera <franta-hg@frantovo.cz>
parents:
1
diff
changeset
|
96 |
std::shared_ptr<relpipe::reader::RelationalReader> reader(relpipe::reader::Factory::create(recordContext.buffer)); |
1
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
97 |
reader->addHandler(&unionAllHandler); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
98 |
reader->process(); |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
99 |
recordContext.attributeIndex = 0; |
d53041bb781b
first version of deserializer
František Kučera <franta-hg@frantovo.cz>
parents:
0
diff
changeset
|
100 |
} |
0 | 101 |
} |
102 |
||
103 |
void endOfPipe() { |
|
104 |
} |
|
105 |
||
106 |
}; |
|
107 |
||
108 |
} |
|
109 |
} |
|
110 |
} |