src/SerializeHandler.h
author František Kučera <franta-hg@frantovo.cz>
Thu, 21 Apr 2022 00:18:10 +0200
branchv_0
changeset 4 0890135ff1f7
parent 3 9e16e31fa756
permissions -rw-r--r--
use common hex function
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     1
/**
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     2
 * Relational pipes
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     3
 * Copyright © 2022 František Kučera (Frantovo.cz, GlobalCode.info)
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     4
 *
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     5
 * This program is free software: you can redistribute it and/or modify
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     6
 * it under the terms of the GNU General Public License as published by
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     7
 * the Free Software Foundation, version 3 of the License.
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     8
 *
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
     9
 * This program is distributed in the hope that it will be useful,
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    10
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    11
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    12
 * GNU General Public License for more details.
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    13
 *
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    14
 * You should have received a copy of the GNU General Public License
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    15
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    16
 */
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    17
#pragma once
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    18
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    19
#include <regex>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    20
#include <stdexcept>
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    21
#include <sstream>
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    22
#include <codecvt>
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    23
#include <iomanip>
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    24
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    25
#include <relpipe/common/type/typedefs.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    26
#include <relpipe/reader/TypeId.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    27
#include <relpipe/reader/handlers/RelationalReaderStringHandler.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    28
#include <relpipe/reader/handlers/AttributeMetadata.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    29
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    30
#include <relpipe/writer/Factory.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    31
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    32
#include <relpipe/cli/RelpipeCLIException.h>
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    33
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    34
#include "Configuration.h"
4
0890135ff1f7 use common hex function
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
    35
#include "Hex.h"
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    36
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    37
namespace relpipe {
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    38
namespace tr {
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    39
namespace serialize {
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    40
3
9e16e31fa756 typed values instead of mere strings in the handler + check number of attributes at the end
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    41
class SerializeHandler : public relpipe::reader::handlers::RelationalReaderValueHandler {
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    42
private:
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    43
	Configuration configuration;
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    44
	shared_ptr<relpipe::writer::RelationalWriter> writer;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    45
	std::wstring_convert<codecvt_utf8<wchar_t>> convertor;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    46
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    47
	class RelationContext {
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    48
	public:
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    49
		relpipe::common::type::StringX name;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    50
		std::vector<relpipe::reader::handlers::AttributeMetadata> readerMetadata;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    51
		std::vector<relpipe::writer::AttributeMetadata> writerMetadata;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    52
	} relationContext;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    53
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    54
	class RecordContext {
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    55
	public:
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    56
		std::stringstream buffer;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    57
		shared_ptr<relpipe::writer::RelationalWriter> writer;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    58
		size_t attributeIndex = 0;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    59
	} recordContext;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    60
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    61
public:
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    62
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    63
	SerializeHandler(shared_ptr<relpipe::writer::RelationalWriter> writer, Configuration configuration) : writer(writer), configuration(configuration) {
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    64
		// TODO: configurable relation name
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    65
		// TODO: configurable attribute name
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    66
		// TODO: optional custom attributes with constant value or ordinal number
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    67
		// TODO: optional serialization of only certain relations? and certain fields?
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    68
		// TODO: optional pass-through of certain relations?
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    69
		// TODO: multiple modes? one output record per a) one input record, b) several input records, c) one input relation, … ?
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    70
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    71
		writer->startRelation(L"message",{
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    72
			{L"data", relpipe::writer::TypeId::STRING} // TODO: octet-string (when supported) instead of HEX
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    73
		}, true);
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    74
	}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    75
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    76
	virtual ~SerializeHandler() = default;
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    77
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    78
	void startRelation(relpipe::common::type::StringX name, std::vector<relpipe::reader::handlers::AttributeMetadata> attributes) override {
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    79
		relationContext = RelationContext();
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    80
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    81
		relationContext.name = name;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    82
		relationContext.readerMetadata = attributes;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    83
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    84
		for (relpipe::reader::handlers::AttributeMetadata readerMetadata : attributes) {
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    85
			relationContext.writerMetadata.push_back({readerMetadata.getAttributeName(), writer->toTypeId(readerMetadata.getTypeName())});
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    86
		}
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    87
	}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    88
3
9e16e31fa756 typed values instead of mere strings in the handler + check number of attributes at the end
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    89
	void attribute(const void* value, const std::type_info& type) override {
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    90
		if (recordContext.attributeIndex == 0) {
2
d2ba14aa4e20 initialize record context on first attribute of each record
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
    91
			recordContext = RecordContext();
d2ba14aa4e20 initialize record context on first attribute of each record
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
    92
			recordContext.writer.reset(relpipe::writer::Factory::create(recordContext.buffer));
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    93
			recordContext.writer->startRelation(relationContext.name, relationContext.writerMetadata, true);
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    94
		}
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
    95
3
9e16e31fa756 typed values instead of mere strings in the handler + check number of attributes at the end
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
    96
		recordContext.writer->writeAttribute(value, type);
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    97
		recordContext.attributeIndex++;
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    98
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
    99
		if (recordContext.attributeIndex % relationContext.readerMetadata.size() == 0) {
4
0890135ff1f7 use common hex function
František Kučera <franta-hg@frantovo.cz>
parents: 3
diff changeset
   100
			writer->writeAttribute(Hex::toHex(recordContext.buffer.str()));
2
d2ba14aa4e20 initialize record context on first attribute of each record
František Kučera <franta-hg@frantovo.cz>
parents: 1
diff changeset
   101
			recordContext.attributeIndex = 0;
1
c0a1a008982c first version of serializer
František Kučera <franta-hg@frantovo.cz>
parents: 0
diff changeset
   102
		}
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   103
	}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   104
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   105
	void endOfPipe() {
3
9e16e31fa756 typed values instead of mere strings in the handler + check number of attributes at the end
František Kučera <franta-hg@frantovo.cz>
parents: 2
diff changeset
   106
		if (recordContext.attributeIndex != 0) throw relpipe::reader::RelpipeReaderException(L"Invalid number of attributes at the end of the pipe – incomplete record.");
0
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   107
	}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   108
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   109
};
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   110
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   111
}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   112
}
47ab821dd9ca establish project
František Kučera <franta-hg@frantovo.cz>
parents:
diff changeset
   113
}