make/jdk/src/classes/build/tools/cldrconverter/SupplementalMetadataParseHandler.java
author rgoel
Mon, 30 Apr 2018 11:59:42 +0530
changeset 49918 8b9c78f0a712
parent 49574 6a6ee36037ac
permissions -rw-r--r--
8179071: Month value is inconsistent between CLDR and Java in some locales Summary: handled Language aliases from CLDR SupplementalMetaData Reviewed-by: naoto

/*
 * Copyright (c) 2018, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

package build.tools.cldrconverter;

import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;
import java.util.stream.Stream;
import org.xml.sax.Attributes;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;

/**
 * Handles parsing of files in Locale Data Markup Language for
 * SupplementalMetadata.xml
 */

class SupplementalMetadataParseHandler extends AbstractLDMLHandler<Object> {
    private final Map<String, String> languageAliasMap;

    SupplementalMetadataParseHandler() {
        languageAliasMap = new HashMap<>();
    }

    @Override
    public InputSource resolveEntity(String publicID, String systemID) throws IOException, SAXException {
        // avoid HTTP traffic to unicode.org
        if (systemID.startsWith(CLDRConverter.SPPL_LDML_DTD_SYSTEM_ID)) {
            return new InputSource((new File(CLDRConverter.LOCAL_SPPL_LDML_DTD)).toURI().toString());
        }
        return null;
    }

    @Override
    public void startElement(String uri, String localName, String qName, Attributes attributes) throws SAXException {
        switch (qName) {
        case "zoneAlias":
            String reason = attributes.getValue("reason");
            if ("deprecated".equals(reason)) {
                put(attributes.getValue("type"), attributes.getValue("replacement"));
            }
            pushIgnoredContainer(qName);
            break;
        case "languageAlias":
            String aliasReason = attributes.getValue("reason");
            if ("deprecated".equals(aliasReason) || "legacy".equals(aliasReason)) {
                String tag = attributes.getValue("type");
                if (!checkLegacyLocales(tag)) {
                   languageAliasMap.put(tag.replaceAll("_", "-"),
                   attributes.getValue("replacement").replaceAll("_", "-"));
                }
            }
            pushIgnoredContainer(qName);
            break;
        default:
            // treat anything else as a container
            pushContainer(qName, attributes);
            break;
        }
    }

    public Stream<String> deprecatedMap() {
        return keySet().stream()
                .map(k -> String.format("        \"%s\", \"%s\",", k, get(k)))
                .sorted();
    }
    Map<String, String> getLanguageAliasData() {
        return languageAliasMap;
    }

    // skip language aliases for JDK legacy locales for ISO compatibility
    private boolean checkLegacyLocales(String tag) {
        return (tag.startsWith("no") || tag.startsWith("in")
                || tag.startsWith("iw") || tag.startsWith("ji"));
    }
}