jaxp/src/com/sun/org/apache/xml/internal/serialize/XML11Serializer.java
author joehw
Tue, 29 Jul 2014 20:52:36 -0700
changeset 25834 aba3efbf4ec5
parent 23777 ce87cedb71cf
permissions -rw-r--r--
8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer. Reviewed-by: lancea
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
6
7f561c08de6b Initial load
duke
parents:
diff changeset
     1
/*
7f561c08de6b Initial load
duke
parents:
diff changeset
     2
 * reserved comment block
7f561c08de6b Initial load
duke
parents:
diff changeset
     3
 * DO NOT REMOVE OR ALTER!
7f561c08de6b Initial load
duke
parents:
diff changeset
     4
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
     5
/*
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     6
 * Licensed to the Apache Software Foundation (ASF) under one or more
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     7
 * contributor license agreements.  See the NOTICE file distributed with
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     8
 * this work for additional information regarding copyright ownership.
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     9
 * The ASF licenses this file to You under the Apache License, Version 2.0
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    10
 * (the "License"); you may not use this file except in compliance with
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    11
 * the License.  You may obtain a copy of the License at
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    12
 *
7f561c08de6b Initial load
duke
parents:
diff changeset
    13
 *      http://www.apache.org/licenses/LICENSE-2.0
7f561c08de6b Initial load
duke
parents:
diff changeset
    14
 *
7f561c08de6b Initial load
duke
parents:
diff changeset
    15
 * Unless required by applicable law or agreed to in writing, software
7f561c08de6b Initial load
duke
parents:
diff changeset
    16
 * distributed under the License is distributed on an "AS IS" BASIS,
7f561c08de6b Initial load
duke
parents:
diff changeset
    17
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
7f561c08de6b Initial load
duke
parents:
diff changeset
    18
 * See the License for the specific language governing permissions and
7f561c08de6b Initial load
duke
parents:
diff changeset
    19
 * limitations under the License.
7f561c08de6b Initial load
duke
parents:
diff changeset
    20
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
    21
7f561c08de6b Initial load
duke
parents:
diff changeset
    22
// Sep 14, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    23
//  Fixed problem with namespace handling. Contributed by
7f561c08de6b Initial load
duke
parents:
diff changeset
    24
//  David Blondeau <blondeau@intalio.com>
7f561c08de6b Initial load
duke
parents:
diff changeset
    25
// Sep 14, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    26
//  Fixed serializer to report IO exception directly, instead at
7f561c08de6b Initial load
duke
parents:
diff changeset
    27
//  the end of document processing.
7f561c08de6b Initial load
duke
parents:
diff changeset
    28
//  Reported by Patrick Higgins <phiggins@transzap.com>
7f561c08de6b Initial load
duke
parents:
diff changeset
    29
// Aug 21, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    30
//  Fixed bug in startDocument not calling prepare.
7f561c08de6b Initial load
duke
parents:
diff changeset
    31
//  Reported by Mikael Staldal <d96-mst-ingen-reklam@d.kth.se>
7f561c08de6b Initial load
duke
parents:
diff changeset
    32
// Aug 21, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    33
//  Added ability to omit DOCTYPE declaration.
7f561c08de6b Initial load
duke
parents:
diff changeset
    34
7f561c08de6b Initial load
duke
parents:
diff changeset
    35
package com.sun.org.apache.xml.internal.serialize;
7f561c08de6b Initial load
duke
parents:
diff changeset
    36
7f561c08de6b Initial load
duke
parents:
diff changeset
    37
import java.io.IOException;
7f561c08de6b Initial load
duke
parents:
diff changeset
    38
import java.io.OutputStream;
7f561c08de6b Initial load
duke
parents:
diff changeset
    39
import java.io.Writer;
7f561c08de6b Initial load
duke
parents:
diff changeset
    40
7f561c08de6b Initial load
duke
parents:
diff changeset
    41
import com.sun.org.apache.xerces.internal.dom.DOMMessageFormatter;
7f561c08de6b Initial load
duke
parents:
diff changeset
    42
import com.sun.org.apache.xerces.internal.util.NamespaceSupport;
7f561c08de6b Initial load
duke
parents:
diff changeset
    43
import com.sun.org.apache.xerces.internal.util.SymbolTable;
7f561c08de6b Initial load
duke
parents:
diff changeset
    44
import com.sun.org.apache.xerces.internal.util.XML11Char;
7f561c08de6b Initial load
duke
parents:
diff changeset
    45
import com.sun.org.apache.xerces.internal.util.XMLChar;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    46
import org.w3c.dom.DOMError;
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    47
import org.w3c.dom.Document;
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    48
import org.xml.sax.SAXException;
7f561c08de6b Initial load
duke
parents:
diff changeset
    49
7f561c08de6b Initial load
duke
parents:
diff changeset
    50
/**
7f561c08de6b Initial load
duke
parents:
diff changeset
    51
 * Implements an XML serializer supporting both DOM and SAX pretty
7f561c08de6b Initial load
duke
parents:
diff changeset
    52
 * serializing. For usage instructions see {@link Serializer}.
7f561c08de6b Initial load
duke
parents:
diff changeset
    53
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    54
 * If an output stream is used, the encoding is taken from the
7f561c08de6b Initial load
duke
parents:
diff changeset
    55
 * output format (defaults to <tt>UTF-8</tt>). If a writer is
7f561c08de6b Initial load
duke
parents:
diff changeset
    56
 * used, make sure the writer uses the same encoding (if applies)
7f561c08de6b Initial load
duke
parents:
diff changeset
    57
 * as specified in the output format.
7f561c08de6b Initial load
duke
parents:
diff changeset
    58
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    59
 * The serializer supports both DOM and SAX. SAX serializing is done by firing
7f561c08de6b Initial load
duke
parents:
diff changeset
    60
 * SAX events and using the serializer as a document handler. DOM serializing is done
7f561c08de6b Initial load
duke
parents:
diff changeset
    61
 * by calling {@link #serialize(Document)} or by using DOM Level 3
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    62
 * {@link org.w3c.dom.ls.LSSerializer} and
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    63
 * serializing with {@link org.w3c.dom.ls.LSSerializer#write},
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    64
 * {@link org.w3c.dom.ls.LSSerializer#writeToString}.
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    65
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    66
 * If an I/O exception occurs while serializing, the serializer
7f561c08de6b Initial load
duke
parents:
diff changeset
    67
 * will not throw an exception directly, but only throw it
7f561c08de6b Initial load
duke
parents:
diff changeset
    68
 * at the end of serializing (either DOM or SAX's {@link
7f561c08de6b Initial load
duke
parents:
diff changeset
    69
 * org.xml.sax.DocumentHandler#endDocument}).
7f561c08de6b Initial load
duke
parents:
diff changeset
    70
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    71
 * For elements that are not specified as whitespace preserving,
7f561c08de6b Initial load
duke
parents:
diff changeset
    72
 * the serializer will potentially break long text lines at space
7f561c08de6b Initial load
duke
parents:
diff changeset
    73
 * boundaries, indent lines, and serialize elements on separate
7f561c08de6b Initial load
duke
parents:
diff changeset
    74
 * lines. Line terminators will be regarded as spaces, and
7f561c08de6b Initial load
duke
parents:
diff changeset
    75
 * spaces at beginning of line will be stripped.
25834
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    76
 *
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    77
 * @author <a href="mailto:arkin@intalio.com">Assaf Arkin</a>
7f561c08de6b Initial load
duke
parents:
diff changeset
    78
 * @author <a href="mailto:rahul.srivastava@sun.com">Rahul Srivastava</a>
7f561c08de6b Initial load
duke
parents:
diff changeset
    79
 * @author Elena Litani IBM
7f561c08de6b Initial load
duke
parents:
diff changeset
    80
 * @see Serializer
25834
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    81
 *
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    82
 * @deprecated As of JDK 1.9, Xerces 2.9.0, Xerces DOM L3 Serializer implementation
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    83
 * is replaced by that of Xalan. Main class
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    84
 * {@link com.sun.org.apache.xml.internal.serialize.DOMSerializerImpl} is replaced
aba3efbf4ec5 8035467: Xerces Update: Move to Xalan based DOM L3 serializer. Deprecate Xerces' native serializer.
joehw
parents: 23777
diff changeset
    85
 * by {@link com.sun.org.apache.xml.internal.serializer.dom3.LSSerializerImpl}.
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    86
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
    87
public class XML11Serializer
7f561c08de6b Initial load
duke
parents:
diff changeset
    88
extends XMLSerializer {
7f561c08de6b Initial load
duke
parents:
diff changeset
    89
7f561c08de6b Initial load
duke
parents:
diff changeset
    90
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    91
    // constants
7f561c08de6b Initial load
duke
parents:
diff changeset
    92
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    93
7f561c08de6b Initial load
duke
parents:
diff changeset
    94
    protected static final boolean DEBUG = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
    95
7f561c08de6b Initial load
duke
parents:
diff changeset
    96
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    97
    // data
7f561c08de6b Initial load
duke
parents:
diff changeset
    98
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    99
7f561c08de6b Initial load
duke
parents:
diff changeset
   100
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   101
    // DOM Level 3 implementation: variables initialized in DOMSerializerImpl
7f561c08de6b Initial load
duke
parents:
diff changeset
   102
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   103
7f561c08de6b Initial load
duke
parents:
diff changeset
   104
    /** stores namespaces in scope */
7f561c08de6b Initial load
duke
parents:
diff changeset
   105
    protected NamespaceSupport fNSBinder;
7f561c08de6b Initial load
duke
parents:
diff changeset
   106
7f561c08de6b Initial load
duke
parents:
diff changeset
   107
    /** stores all namespace bindings on the current element */
7f561c08de6b Initial load
duke
parents:
diff changeset
   108
    protected NamespaceSupport fLocalNSBinder;
7f561c08de6b Initial load
duke
parents:
diff changeset
   109
7f561c08de6b Initial load
duke
parents:
diff changeset
   110
    /** symbol table for serialization */
7f561c08de6b Initial load
duke
parents:
diff changeset
   111
    protected SymbolTable fSymbolTable;
7f561c08de6b Initial load
duke
parents:
diff changeset
   112
7f561c08de6b Initial load
duke
parents:
diff changeset
   113
    // is node dom level 1 node?
7f561c08de6b Initial load
duke
parents:
diff changeset
   114
    protected boolean fDOML1 = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
   115
    // counter for new prefix names
7f561c08de6b Initial load
duke
parents:
diff changeset
   116
    protected int fNamespaceCounter = 1;
7f561c08de6b Initial load
duke
parents:
diff changeset
   117
    protected final static String PREFIX = "NS";
7f561c08de6b Initial load
duke
parents:
diff changeset
   118
7f561c08de6b Initial load
duke
parents:
diff changeset
   119
    /**
7f561c08de6b Initial load
duke
parents:
diff changeset
   120
     * Controls whether namespace fixup should be performed during
7f561c08de6b Initial load
duke
parents:
diff changeset
   121
     * the serialization.
7f561c08de6b Initial load
duke
parents:
diff changeset
   122
     * NOTE: if this field is set to true the following
7f561c08de6b Initial load
duke
parents:
diff changeset
   123
     * fields need to be initialized: fNSBinder, fLocalNSBinder, fSymbolTable,
7f561c08de6b Initial load
duke
parents:
diff changeset
   124
     * XMLSymbols.EMPTY_STRING, fXmlSymbol, fXmlnsSymbol, fNamespaceCounter.
7f561c08de6b Initial load
duke
parents:
diff changeset
   125
     */
7f561c08de6b Initial load
duke
parents:
diff changeset
   126
    protected boolean fNamespaces = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
   127
7f561c08de6b Initial load
duke
parents:
diff changeset
   128
    /**
     * Creates an XML 1.1 serializer that has no output target yet.
     * <p>
     * The no-argument superclass constructor runs first; afterwards the
     * serializer's output format is stamped with version <tt>"1.1"</tt>.
     * Before the serializer can be used, an output must be supplied via
     * {@link #setOutputCharStream} or {@link #setOutputByteStream}.
     */
    public XML11Serializer() {
        super();
        // Everything this class writes is declared as XML 1.1.
        _format.setVersion( "1.1" );
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   137
7f561c08de6b Initial load
duke
parents:
diff changeset
   138
7f561c08de6b Initial load
duke
parents:
diff changeset
   139
    /**
     * Creates an XML 1.1 serializer configured with the given output
     * format but without an output target.
     * <p>
     * The format is handed to the superclass constructor unchanged; the
     * serializer's output format is then stamped with version
     * <tt>"1.1"</tt>. Before the serializer can be used, an output must
     * be supplied via {@link #setOutputCharStream} or
     * {@link #setOutputByteStream}.
     *
     * @param format The output format to use
     */
    public XML11Serializer( OutputFormat format ) {
        super( format );
        // Everything this class writes is declared as XML 1.1.
        _format.setVersion( "1.1" );
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   148
7f561c08de6b Initial load
duke
parents:
diff changeset
   149
7f561c08de6b Initial load
duke
parents:
diff changeset
   150
    /**
     * Creates an XML 1.1 serializer that sends its output to a character
     * writer, formatted according to the supplied output format. A
     * <tt>null</tt> format selects a default output format.
     * <p>
     * Once the superclass constructor has run, the serializer's output
     * format is stamped with version <tt>"1.1"</tt>.
     *
     * @param writer The writer to use
     * @param format The output format to use, null for the default
     */
    public XML11Serializer( Writer writer, OutputFormat format ) {
        super( writer, format );
        // Everything this class writes is declared as XML 1.1.
        _format.setVersion( "1.1" );
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   162
7f561c08de6b Initial load
duke
parents:
diff changeset
   163
7f561c08de6b Initial load
duke
parents:
diff changeset
   164
    /**
     * Creates an XML 1.1 serializer that sends its output to a byte
     * stream, formatted according to the supplied output format.
     * <p>
     * When <tt>format</tt> is <tt>null</tt>, a fresh
     * <tt>OutputFormat( Method.XML, null, false )</tt> is passed to the
     * superclass instead. Once the superclass constructor has run, the
     * serializer's output format is stamped with version <tt>"1.1"</tt>.
     *
     * @param output The output stream to use
     * @param format The output format to use, null for the default
     */
    public XML11Serializer( OutputStream output, OutputFormat format ) {
        super( output,
               format == null ? new OutputFormat( Method.XML, null, false )
                              : format );
        // Everything this class writes is declared as XML 1.1.
        _format.setVersion( "1.1" );
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   176
7f561c08de6b Initial load
duke
parents:
diff changeset
   177
    //-----------------------------------------//
7f561c08de6b Initial load
duke
parents:
diff changeset
   178
    // SAX content handler serializing methods //
7f561c08de6b Initial load
duke
parents:
diff changeset
   179
    //-----------------------------------------//
7f561c08de6b Initial load
duke
parents:
diff changeset
   180
7f561c08de6b Initial load
duke
parents:
diff changeset
   181
7f561c08de6b Initial load
duke
parents:
diff changeset
   182
    public void characters( char[] chars, int start, int length )
7f561c08de6b Initial load
duke
parents:
diff changeset
   183
        throws SAXException
7f561c08de6b Initial load
duke
parents:
diff changeset
   184
    {
7f561c08de6b Initial load
duke
parents:
diff changeset
   185
        ElementState state;
7f561c08de6b Initial load
duke
parents:
diff changeset
   186
7f561c08de6b Initial load
duke
parents:
diff changeset
   187
        try {
7f561c08de6b Initial load
duke
parents:
diff changeset
   188
            state = content();
7f561c08de6b Initial load
duke
parents:
diff changeset
   189
7f561c08de6b Initial load
duke
parents:
diff changeset
   190
            // Check if text should be print as CDATA section or unescaped
7f561c08de6b Initial load
duke
parents:
diff changeset
   191
            // based on elements listed in the output format (the element
7f561c08de6b Initial load
duke
parents:
diff changeset
   192
            // state) or whether we are inside a CDATA section or entity.
7f561c08de6b Initial load
duke
parents:
diff changeset
   193
7f561c08de6b Initial load
duke
parents:
diff changeset
   194
            if ( state.inCData || state.doCData ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   195
                int          saveIndent;
7f561c08de6b Initial load
duke
parents:
diff changeset
   196
7f561c08de6b Initial load
duke
parents:
diff changeset
   197
                // Print a CDATA section. The text is not escaped, but ']]>'
7f561c08de6b Initial load
duke
parents:
diff changeset
   198
                // appearing in the code must be identified and dealt with.
7f561c08de6b Initial load
duke
parents:
diff changeset
   199
                // The contents of a text node is considered space preserving.
7f561c08de6b Initial load
duke
parents:
diff changeset
   200
                if ( ! state.inCData ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   201
                    _printer.printText( "<![CDATA[" );
7f561c08de6b Initial load
duke
parents:
diff changeset
   202
                    state.inCData = true;
7f561c08de6b Initial load
duke
parents:
diff changeset
   203
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   204
                saveIndent = _printer.getNextIndent();
7f561c08de6b Initial load
duke
parents:
diff changeset
   205
                _printer.setNextIndent( 0 );
7f561c08de6b Initial load
duke
parents:
diff changeset
   206
                char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   207
                final int end = start + length;
7f561c08de6b Initial load
duke
parents:
diff changeset
   208
                for ( int index = start; index < end; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   209
                    ch = chars[index];
7f561c08de6b Initial load
duke
parents:
diff changeset
   210
                    if ( ch == ']' && index + 2 < end &&
7f561c08de6b Initial load
duke
parents:
diff changeset
   211
                        chars[ index + 1 ] == ']' && chars[ index + 2 ] == '>' ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   212
                        _printer.printText("]]]]><![CDATA[>");
7f561c08de6b Initial load
duke
parents:
diff changeset
   213
                        index +=2;
7f561c08de6b Initial load
duke
parents:
diff changeset
   214
                        continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   215
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   216
                    if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   217
                        // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   218
                        if (++index < end) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   219
                            surrogates(ch, chars[index], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   220
                        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   221
                        else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   222
                            fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   223
                        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   224
                        continue;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   225
                    }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   226
                    if ( _encodingInfo.isPrintable(ch) && XML11Char.isXML11ValidLiteral(ch)) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   227
                        _printer.printText(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   228
                    }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   229
                    else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   230
                        // The character is not printable -- split CDATA section
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   231
                        _printer.printText("]]>&#x");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   232
                        _printer.printText(Integer.toHexString(ch));
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   233
                        _printer.printText(";<![CDATA[");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   234
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   235
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   236
                _printer.setNextIndent( saveIndent );
7f561c08de6b Initial load
duke
parents:
diff changeset
   237
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   238
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   239
            else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   240
7f561c08de6b Initial load
duke
parents:
diff changeset
   241
                int saveIndent;
7f561c08de6b Initial load
duke
parents:
diff changeset
   242
7f561c08de6b Initial load
duke
parents:
diff changeset
   243
                if ( state.preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   244
                    // If preserving space then hold of indentation so no
7f561c08de6b Initial load
duke
parents:
diff changeset
   245
                    // excessive spaces are printed at line breaks, escape
7f561c08de6b Initial load
duke
parents:
diff changeset
   246
                    // the text content without replacing spaces and print
7f561c08de6b Initial load
duke
parents:
diff changeset
   247
                    // the text breaking only at line breaks.
7f561c08de6b Initial load
duke
parents:
diff changeset
   248
                    saveIndent = _printer.getNextIndent();
7f561c08de6b Initial load
duke
parents:
diff changeset
   249
                    _printer.setNextIndent( 0 );
7f561c08de6b Initial load
duke
parents:
diff changeset
   250
                    printText( chars, start, length, true, state.unescaped );
7f561c08de6b Initial load
duke
parents:
diff changeset
   251
                    _printer.setNextIndent( saveIndent );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   252
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   253
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   254
                    printText( chars, start, length, false, state.unescaped );
7f561c08de6b Initial load
duke
parents:
diff changeset
   255
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   256
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   257
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   258
        catch ( IOException except ) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   259
            throw new SAXException( except );
7f561c08de6b Initial load
duke
parents:
diff changeset
   260
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   261
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   262
7f561c08de6b Initial load
duke
parents:
diff changeset
   263
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   264
    // overwrite printing functions to make sure serializer prints out valid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   265
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   266
    protected void printEscaped( String source ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   267
        int length = source.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   268
        for ( int i = 0 ; i < length ; ++i ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   269
            int ch = source.charAt(i);
7f561c08de6b Initial load
duke
parents:
diff changeset
   270
            if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   271
                if (++i <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   272
                    surrogates(ch, source.charAt(i), false);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   273
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   274
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   275
                    fatalError("The character '"+(char)ch+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   276
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   277
                continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   278
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   279
            if (ch == '\n' || ch == '\r' || ch == '\t' || ch == 0x0085 || ch == 0x2028) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   280
                printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   281
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   282
            else if (ch == '<') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   283
                _printer.printText("&lt;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   284
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   285
            else if (ch == '&') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   286
                _printer.printText("&amp;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   287
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   288
            else if (ch == '"') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   289
                _printer.printText("&quot;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   290
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   291
            else if ((ch >= ' ' && _encodingInfo.isPrintable((char) ch))) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   292
                _printer.printText((char) ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   293
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   294
            else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   295
                printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   296
            }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   297
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   298
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   299
7f561c08de6b Initial load
duke
parents:
diff changeset
   300
    protected final void printCDATAText(String text) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   301
        int length = text.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   302
        char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   303
7f561c08de6b Initial load
duke
parents:
diff changeset
   304
        for (int index = 0; index < length; ++index) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   305
            ch = text.charAt(index);
7f561c08de6b Initial load
duke
parents:
diff changeset
   306
7f561c08de6b Initial load
duke
parents:
diff changeset
   307
            if (ch == ']'
7f561c08de6b Initial load
duke
parents:
diff changeset
   308
                && index + 2 < length
7f561c08de6b Initial load
duke
parents:
diff changeset
   309
                && text.charAt(index + 1) == ']'
7f561c08de6b Initial load
duke
parents:
diff changeset
   310
                && text.charAt(index + 2) == '>') { // check for ']]>'
7f561c08de6b Initial load
duke
parents:
diff changeset
   311
                if (fDOMErrorHandler != null){
7f561c08de6b Initial load
duke
parents:
diff changeset
   312
                    // REVISIT: this means that if DOM Error handler is not registered we don't report any
7f561c08de6b Initial load
duke
parents:
diff changeset
   313
                    // fatal errors and might serialize not wellformed document
7f561c08de6b Initial load
duke
parents:
diff changeset
   314
                if ((features & DOMSerializerImpl.SPLITCDATA) == 0
7f561c08de6b Initial load
duke
parents:
diff changeset
   315
                    && (features & DOMSerializerImpl.WELLFORMED) == 0) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   316
                    // issue fatal error
7f561c08de6b Initial load
duke
parents:
diff changeset
   317
                    String msg =
7f561c08de6b Initial load
duke
parents:
diff changeset
   318
                        DOMMessageFormatter.formatMessage(
7f561c08de6b Initial load
duke
parents:
diff changeset
   319
                            DOMMessageFormatter.SERIALIZER_DOMAIN,
7f561c08de6b Initial load
duke
parents:
diff changeset
   320
                            "EndingCDATA",
7f561c08de6b Initial load
duke
parents:
diff changeset
   321
                            null);
7f561c08de6b Initial load
duke
parents:
diff changeset
   322
                    modifyDOMError(
7f561c08de6b Initial load
duke
parents:
diff changeset
   323
                        msg,
7f561c08de6b Initial load
duke
parents:
diff changeset
   324
                        DOMError.SEVERITY_FATAL_ERROR,
7f561c08de6b Initial load
duke
parents:
diff changeset
   325
                        null, fCurrentNode);
7f561c08de6b Initial load
duke
parents:
diff changeset
   326
                    boolean continueProcess =
7f561c08de6b Initial load
duke
parents:
diff changeset
   327
                        fDOMErrorHandler.handleError(fDOMError);
7f561c08de6b Initial load
duke
parents:
diff changeset
   328
                    if (!continueProcess) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   329
                        throw new IOException();
7f561c08de6b Initial load
duke
parents:
diff changeset
   330
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   331
                } else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   332
                    // issue warning
7f561c08de6b Initial load
duke
parents:
diff changeset
   333
                    String msg =
7f561c08de6b Initial load
duke
parents:
diff changeset
   334
                        DOMMessageFormatter.formatMessage(
7f561c08de6b Initial load
duke
parents:
diff changeset
   335
                            DOMMessageFormatter.SERIALIZER_DOMAIN,
7f561c08de6b Initial load
duke
parents:
diff changeset
   336
                            "SplittingCDATA",
7f561c08de6b Initial load
duke
parents:
diff changeset
   337
                            null);
7f561c08de6b Initial load
duke
parents:
diff changeset
   338
                    modifyDOMError(
7f561c08de6b Initial load
duke
parents:
diff changeset
   339
                        msg,
7f561c08de6b Initial load
duke
parents:
diff changeset
   340
                        DOMError.SEVERITY_WARNING,
7f561c08de6b Initial load
duke
parents:
diff changeset
   341
                        null, fCurrentNode);
7f561c08de6b Initial load
duke
parents:
diff changeset
   342
                    fDOMErrorHandler.handleError(fDOMError);
7f561c08de6b Initial load
duke
parents:
diff changeset
   343
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   344
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   345
                // split CDATA section
7f561c08de6b Initial load
duke
parents:
diff changeset
   346
                _printer.printText("]]]]><![CDATA[>");
7f561c08de6b Initial load
duke
parents:
diff changeset
   347
                index += 2;
7f561c08de6b Initial load
duke
parents:
diff changeset
   348
                continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   349
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   350
7f561c08de6b Initial load
duke
parents:
diff changeset
   351
            if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   352
                // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   353
                if (++index < length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   354
                    surrogates(ch, text.charAt(index), true);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   355
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   356
                else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   357
                    fatalError("The character '" + ch + "' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   358
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   359
                continue;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   360
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   361
            if (_encodingInfo.isPrintable(ch)
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   362
                && XML11Char.isXML11ValidLiteral(ch)) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   363
                _printer.printText(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   364
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   365
            else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   366
                // The character is not printable -- split CDATA section
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   367
                _printer.printText("]]>&#x");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   368
                _printer.printText(Integer.toHexString(ch));
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   369
                _printer.printText(";<![CDATA[");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   370
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   371
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   372
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   373
7f561c08de6b Initial load
duke
parents:
diff changeset
   374
    // note that this "int" should, in all cases, be a char.
7f561c08de6b Initial load
duke
parents:
diff changeset
   375
    // REVISIT:  make it a char...
7f561c08de6b Initial load
duke
parents:
diff changeset
   376
    protected final void printXMLChar( int ch ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   377
7f561c08de6b Initial load
duke
parents:
diff changeset
   378
        if (ch == '\r' || ch == 0x0085 || ch == 0x2028) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   379
            printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   380
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   381
        else if ( ch == '<') {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   382
            _printer.printText("&lt;");
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   383
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   384
        else if (ch == '&') {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   385
            _printer.printText("&amp;");
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   386
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   387
        else if (ch == '>'){
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   388
            // character sequence "]]>" can't appear in content, therefore
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   389
            // we should escape '>'
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   390
            _printer.printText("&gt;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   391
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   392
        else if ( _encodingInfo.isPrintable((char)ch) && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   393
            _printer.printText((char)ch);
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   394
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   395
        else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   396
            printHex(ch);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   397
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   398
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   399
7f561c08de6b Initial load
duke
parents:
diff changeset
   400
7f561c08de6b Initial load
duke
parents:
diff changeset
   401
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   402
    protected final void surrogates(int high, int low, boolean inContent) throws IOException{
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   403
        if (XMLChar.isHighSurrogate(high)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   404
            if (!XMLChar.isLowSurrogate(low)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   405
                //Invalid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   406
                fatalError("The character '"+(char)low+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   407
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   408
            else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   409
                int supplemental = XMLChar.supplemental((char)high, (char)low);
7f561c08de6b Initial load
duke
parents:
diff changeset
   410
                if (!XML11Char.isXML11Valid(supplemental)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   411
                    //Invalid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   412
                    fatalError("The character '"+(char)supplemental+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   413
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   414
                else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   415
                    if (inContent && content().inCData) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   416
                        _printer.printText("]]>&#x");
7f561c08de6b Initial load
duke
parents:
diff changeset
   417
                        _printer.printText(Integer.toHexString(supplemental));
7f561c08de6b Initial load
duke
parents:
diff changeset
   418
                        _printer.printText(";<![CDATA[");
7f561c08de6b Initial load
duke
parents:
diff changeset
   419
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   420
                    else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   421
                                                printHex(supplemental);
7f561c08de6b Initial load
duke
parents:
diff changeset
   422
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   423
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   424
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   425
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   426
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   427
            fatalError("The character '"+(char)high+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   428
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   429
7f561c08de6b Initial load
duke
parents:
diff changeset
   430
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   431
7f561c08de6b Initial load
duke
parents:
diff changeset
   432
7f561c08de6b Initial load
duke
parents:
diff changeset
   433
    protected void printText( String text, boolean preserveSpace, boolean unescaped )
7f561c08de6b Initial load
duke
parents:
diff changeset
   434
    throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   435
        int index;
7f561c08de6b Initial load
duke
parents:
diff changeset
   436
        char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   437
        int length = text.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   438
        if ( preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   439
            // Preserving spaces: the text must print exactly as it is,
7f561c08de6b Initial load
duke
parents:
diff changeset
   440
            // without breaking when spaces appear in the text and without
7f561c08de6b Initial load
duke
parents:
diff changeset
   441
            // consolidating spaces. If a line terminator is used, a line
7f561c08de6b Initial load
duke
parents:
diff changeset
   442
            // break will occur.
7f561c08de6b Initial load
duke
parents:
diff changeset
   443
            for ( index = 0 ; index < length ; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   444
                ch = text.charAt( index );
7f561c08de6b Initial load
duke
parents:
diff changeset
   445
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   446
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   447
                    if (++index <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   448
                        surrogates(ch, text.charAt(index), true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   449
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   450
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   451
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   452
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   453
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   454
                if ( unescaped  && XML11Char.isXML11ValidLiteral(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   455
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   456
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   457
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   458
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   459
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   460
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   461
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   462
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   463
            // Not preserving spaces: print one part at a time, and
7f561c08de6b Initial load
duke
parents:
diff changeset
   464
            // use spaces between parts to break them into different
7f561c08de6b Initial load
duke
parents:
diff changeset
   465
            // lines. Spaces at beginning of line will be stripped
7f561c08de6b Initial load
duke
parents:
diff changeset
   466
            // by printing mechanism. Line terminator is treated
7f561c08de6b Initial load
duke
parents:
diff changeset
   467
            // no different than other text part.
7f561c08de6b Initial load
duke
parents:
diff changeset
   468
            for ( index = 0 ; index < length ; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   469
                ch = text.charAt( index );
7f561c08de6b Initial load
duke
parents:
diff changeset
   470
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   471
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   472
                    if (++index <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   473
                        surrogates(ch, text.charAt(index), true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   474
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   475
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   476
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   477
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   478
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   479
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   480
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch) ) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   481
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   482
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   483
                else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   484
                    printXMLChar( ch );
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   485
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   486
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   487
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   488
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   489
7f561c08de6b Initial load
duke
parents:
diff changeset
   490
    protected void printText( char[] chars, int start, int length,
7f561c08de6b Initial load
duke
parents:
diff changeset
   491
                              boolean preserveSpace, boolean unescaped ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   492
7f561c08de6b Initial load
duke
parents:
diff changeset
   493
        if ( preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   494
            // Preserving spaces: the text must print exactly as it is,
7f561c08de6b Initial load
duke
parents:
diff changeset
   495
            // without breaking when spaces appear in the text and without
7f561c08de6b Initial load
duke
parents:
diff changeset
   496
            // consolidating spaces. If a line terminator is used, a line
7f561c08de6b Initial load
duke
parents:
diff changeset
   497
            // break will occur.
7f561c08de6b Initial load
duke
parents:
diff changeset
   498
            while ( length-- > 0 ) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   499
                char ch = chars[start++];
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   500
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   501
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   502
                    if ( length-- > 0) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   503
                        surrogates(ch, chars[start++], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   504
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   505
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   506
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   507
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   508
                }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   509
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   510
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   511
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   512
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   513
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   514
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   515
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   516
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   517
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   518
            // Not preserving spaces: print one part at a time, and
7f561c08de6b Initial load
duke
parents:
diff changeset
   519
            // use spaces between parts to break them into different
7f561c08de6b Initial load
duke
parents:
diff changeset
   520
            // lines. Spaces at beginning of line will be stripped
7f561c08de6b Initial load
duke
parents:
diff changeset
   521
            // by printing mechanism. Line terminator is treated
7f561c08de6b Initial load
duke
parents:
diff changeset
   522
            // no different than other text part.
7f561c08de6b Initial load
duke
parents:
diff changeset
   523
            while ( length-- > 0 ) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   524
                char ch = chars[start++];
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   525
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   526
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   527
                    if ( length-- > 0) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   528
                        surrogates(ch, chars[start++], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   529
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   530
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   531
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   532
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   533
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   534
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   535
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   536
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   537
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   538
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   539
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   540
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   541
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   542
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   543
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   544
7f561c08de6b Initial load
duke
parents:
diff changeset
   545
    public boolean reset() {
7f561c08de6b Initial load
duke
parents:
diff changeset
   546
        super.reset();
7f561c08de6b Initial load
duke
parents:
diff changeset
   547
        return true;
7f561c08de6b Initial load
duke
parents:
diff changeset
   548
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   549
7f561c08de6b Initial load
duke
parents:
diff changeset
   550
}