jdk/make/src/classes/build/tools/charsetmapping/Utils.java
changeset 21805 c7d7946239de
parent 7668 d4a77089c587
child 23010 6dadb192ad81
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/jdk/make/src/classes/build/tools/charsetmapping/Utils.java	Thu Nov 14 11:19:32 2013 +0100
@@ -0,0 +1,221 @@
+/*
+ * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
+ * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
+ *
+ * This code is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 2 only, as
+ * published by the Free Software Foundation.  Oracle designates this
+ * particular file as subject to the "Classpath" exception as provided
+ * by Oracle in the LICENSE file that accompanied this code.
+ *
+ * This code is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
+ * version 2 for more details (a copy is included in the LICENSE file that
+ * accompanied this code).
+ *
+ * You should have received a copy of the GNU General Public License version
+ * 2 along with this work; if not, write to the Free Software Foundation,
+ * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
+ *
+ * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
+ * or visit www.oracle.com if you need additional information or have any
+ * questions.
+ */
+
+package build.tools.charsetmapping;
+
+import java.io.File;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.io.OutputStream;
+import java.io.BufferedReader;
+import java.io.IOException;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+import java.util.Scanner;
+import java.util.Formatter;
+
+public class Utils {
+
+    public final static char UNMAPPABLE_DECODING = '\uFFFD';
+    public final static int  UNMAPPABLE_ENCODING = 0xFFFD;
+
+    public static class Entry {
+        public int bs;   //byte sequence reps
+        public int cp;   //Unicode codepoint
+        public int cp2;  //CC of composite
+
+        public Entry () {}
+        public Entry (int bytes, int cp, int cp2) {
+            this.bs = bytes;
+            this.cp = cp;
+            this.cp2 = cp2;
+        }
+    }
+
+    public static class Parser {
+        static final Pattern basic = Pattern.compile("(?:0x)?(\\p{XDigit}++)\\s++(?:0x)?(\\p{XDigit}++)?\\s*+.*");
+        static final int gBS = 1;
+        static final int gCP = 2;
+        static final int gCP2 = 3;
+
+        BufferedReader reader;
+        boolean closed;
+        Matcher matcher;
+        int gbs, gcp, gcp2;
+
+        public Parser (InputStream in, Pattern p, int gbs, int gcp, int gcp2)
+            throws IOException
+        {
+            this.reader = new BufferedReader(new InputStreamReader(in));
+            this.closed = false;
+            this.matcher = p.matcher("");
+            this.gbs = gbs;
+            this.gcp = gcp;
+            this.gcp2 = gcp2;
+        }
+
+        public Parser (InputStream in, Pattern p) throws IOException {
+            this(in, p, gBS, gCP, gCP2);
+        }
+
+        public Parser (InputStream in) throws IOException {
+            this(in, basic, gBS, gCP, gCP2);
+        }
+
+        protected boolean isDirective(String line) {
+            return line.startsWith("#");
+        }
+
+        protected Entry parse(Matcher matcher, Entry mapping) {
+            mapping.bs = Integer.parseInt(matcher.group(gbs), 16);
+            mapping.cp = Integer.parseInt(matcher.group(gcp), 16);
+            if (gcp2 <= matcher.groupCount() &&
+                matcher.group(gcp2) != null)
+                mapping.cp2 = Integer.parseInt(matcher.group(gcp2), 16);
+            else
+                mapping.cp2 = 0;
+            return mapping;
+        }
+
+        public Entry next() throws Exception {
+            return next(new Entry());
+        }
+
+        // returns null and closes the input stream if the eof has beenreached.
+        public Entry next(Entry mapping) throws Exception {
+            if (closed)
+                return null;
+            String line;
+            while ((line = reader.readLine()) != null) {
+                if (isDirective(line))
+                    continue;
+                matcher.reset(line);
+                if (!matcher.lookingAt()) {
+                    //System.out.println("Missed: " + line);
+                    continue;
+                }
+                return parse(matcher, mapping);
+            }
+            reader.close();
+            closed = true;
+            return null;
+        }
+    }
+
+    public static class Output {
+        private Formatter out;
+
+        public Output(Formatter out) {
+            this.out = out;
+        }
+
+        public void close() {
+            out.close();
+        }
+
+        private void toChar(String fmt, char c) {
+            switch (c) {
+            case '\b':
+                out.format("\\b"); break;
+            case '\t':
+                out.format("\\t"); break;
+            case '\n':
+                out.format("\\n"); break;
+            case '\f':
+                out.format("\\f"); break;
+            case '\r':
+                out.format("\\r"); break;
+            case '\"':
+                out.format("\\\""); break;
+            case '\'':
+                out.format("\\'"); break;
+            case '\\':
+                out.format("\\\\"); break;
+            default:
+                out.format(fmt, c & 0xffff);
+            }
+        }
+
+        public void format(String fmt, Object ... args) {
+            out.format(fmt, args);
+        }
+
+        public void format(char[] cc, int off, int end, String closure) {
+            while (off < end) {
+                out.format("        \"");
+                for (int j = 0; j < 8; j++) {
+                    if (off == end)
+                        break;
+                    toChar("\\u%04X", cc[off++]);
+                }
+                if (off == end)
+                    out.format("\" %s%n", closure);
+                else
+                    out.format("\" + %n");
+            }
+        }
+
+        public void format(char[] cc, String closure) {
+            format(cc, 0, cc.length, closure);
+        }
+
+        public void format(char[] db, int b1, int b2Min, int b2Max,
+                           String closure)
+        {
+            char[] cc = new char[b2Max - b2Min + 1];
+            int off = 0;
+            for (int b2 = b2Min; b2 <= b2Max; b2++) {
+                cc[off++] = db[(b1 << 8) | b2];
+            }
+            format(cc, 0, cc.length, closure);
+        }
+
+        public void format(char[] date) {
+            int off = 0;
+            int end = date.length;
+            while (off < end) {
+                out.format("        ");
+                for (int j = 0; j < 8 && off < end; j++) {
+                    toChar("'\\u%04X',", date[off++]);
+                }
+                out.format("%n");
+            }
+        }
+    }
+
+    public static String getCopyright(File f) throws IOException {
+        Scanner s = new Scanner(f, "ISO-8859-1");
+        StringBuilder sb = new StringBuilder();
+        while (s.hasNextLine()) {
+            String ln = s.nextLine();
+            sb.append(ln + "\n");
+            // assume we have the copyright as the first comment
+            if (ln.matches("^\\s\\*\\/$"))
+                break;
+        }
+        s.close();
+        return sb.toString();
+    }
+}