src/relpipe-in-csv.cpp
branchv_0
changeset 14 012d491e219a
parent 10 1ae185cac1f3
child 15 157bb1d5e08a
--- a/src/relpipe-in-csv.cpp	Sat Jun 06 01:50:42 2020 +0200
+++ b/src/relpipe-in-csv.cpp	Wed Sep 23 11:23:12 2020 +0200
@@ -29,111 +29,12 @@
 
 #include <relpipe/cli/CLI.h>
 
+#include "CSVCommand.h"
+
 using namespace std;
 using namespace relpipe::cli;
 using namespace relpipe::writer;
-
-bool readValue(istream& input, stringstream& currentValue, bool& lastInRecord) {
-	lastInRecord = false;
-	char ch;
-	input.get(ch);
-	if (ch == '"') {
-		while (input.get(ch)) {
-			if (ch == '"') {
-				input.get(ch);
-				if (ch == '"') {
-					currentValue << ch;
-				} else {
-					if (ch == '\r') input.get(ch);
-					if (ch == '\n') lastInRecord = true;
-					else if (ch != ',') throw RelpipeWriterException(L"Unexpected character (should be „\\n“ or „,“)");
-					return true;
-				}
-			} else {
-				currentValue << ch;
-			}
-		}
-	} else if (ch == ',') {
-		return true;
-	} else if (ch == '\n') {
-		lastInRecord = true;
-		return true;
-	} else if (ch == '\r') {
-		input.get(ch);
-		if (ch == '\n') {
-			lastInRecord = true;
-			return true;
-		} else {
-			throw RelpipeWriterException(L"Crazy carriage stuck during journey");
-		}
-	} else {
-		for (currentValue << ch; input.get(ch);) {
-			switch (ch) {
-				case ',': return true;
-				case '\r': break;
-				case '\n':
-					lastInRecord = true;
-					return true;
-				default: currentValue << ch;
-			}
-		}
-	}
-	return false;
-}
-
-void processDataStream(ostream &output, istream& input, const vector<string_t>& args) {
-	wstring_convert < codecvt_utf8<wchar_t>> convertor; // UTF-8 is required for CSV
-	std::shared_ptr<RelationalWriter> writer(Factory::create(output));
-	vector<AttributeMetadata> metadata;
-	bool headerDone = false;
-	bool lastInRecord = false;
-	stringstream currentValue;
-
-
-	while (readValue(input, currentValue, lastInRecord) && input.good()) {
-		if (headerDone) {
-			writer->writeAttribute(convertor.from_bytes(currentValue.str()));
-		} else {
-			AttributeMetadata am;
-			am.attributeName = convertor.from_bytes(currentValue.str());
-			am.typeId = TypeId::STRING;
-			metadata.push_back(am);
-			if (lastInRecord) {
-
-				/*
-				 * Usage (simple syntax):
-				 * relpipe-in-csv → default relation name, attribute names on the first line, all types are string
-				 * relpipe-in-csv my_relation → custom relation name
-				 * relpipe-in-csv my_relation a b c → custom relation name, custom attribute names (a,b,c), first line contains data
-				 * relpipe-in-csv my_relation a integer b string c boolean → custom relation name, custom attribute names (a,b,c), custom types (integer,string,boolean), first line contains data
-				 */
-
-				vector<string_t> firstLine;
-				if (args.size() == (1 + metadata.size())) {
-					for (int i = 0; i < metadata.size(); i++) {
-						firstLine.push_back(metadata[i].attributeName);
-						metadata[i].attributeName = args[1 + i];
-					}
-				} else if (args.size() == (1 + 2 * metadata.size())) {
-					for (int i = 0; i < metadata.size(); i++) {
-						firstLine.push_back(metadata[i].attributeName);
-						metadata[i].attributeName = args[1 + i * 2];
-						metadata[i].typeId = writer->toTypeId(args[1 + i * 2 + 1]);
-					}
-				}
-
-				headerDone = true;
-				writer->startRelation(args.size() > 0 ? args[0] : L"csv", metadata, true);
-				if (firstLine.size()) {
-					for (string_t value : firstLine) writer->writeAttribute(value);
-				}
-			}
-		}
-
-		currentValue.str("");
-		currentValue.clear();
-	}
-}
+using namespace relpipe::in::csv;
 
 int main(int argc, char** argv) {
 	setlocale(LC_ALL, "");
@@ -143,7 +44,8 @@
 	int resultCode = CLI::EXIT_CODE_UNEXPECTED_ERROR;
 
 	try {
-		processDataStream(cout, cin, cli.arguments());
+		CSVCommand command;
+		command.processDataStream(cout, cin, cli.arguments());
 		resultCode = CLI::EXIT_CODE_SUCCESS;
 	} catch (RelpipeWriterException e) {
 		fwprintf(stderr, L"Caught Writer exception: %ls\n", e.getMessge().c_str());