fix raw-xml formatting (remove XML declaration) v_0
authorFrantišek Kučera <franta-hg@frantovo.cz>
Tue, 23 Nov 2021 20:38:12 +0100
branchv_0
changeset 42 e91e27dc2c38
parent 41 12acb6c02d32
child 43 45d382272c44
fix raw-xml formatting (remove XML declaration)
src/XMLTableCommand.h
--- a/src/XMLTableCommand.h	Wed Jul 28 01:40:05 2021 +0200
+++ b/src/XMLTableCommand.h	Tue Nov 23 20:38:12 2021 +0100
@@ -43,7 +43,10 @@
 	std::wstring_convert<codecvt_utf8<wchar_t>> convertor; // TODO: support also other encodings.
 
 	string_t formatRawXML(string_t rawXML) {
-		std::wregex pattern(L"^<\\?xml version=\"1.0\" encoding=\"UTF-8\"\\?>\n|\n$");
+		std::wregex pattern(L"^(<\\?xml version=\"1.0\" encoding=\"UTF-8\"\\?>\\s*)+|\n$");
+		// libxml sometimes returns doubled XML declaration (probably a bug), see:
+		// --relation ini --records '/' --attribute 'xml' string '.' --mode raw-xml # (but not for --records '//*')
+		// so we remove all of them and also trailing line ends (if any).
 		return std::regex_replace(rawXML, pattern, L"");
 	}