jaxp/src/com/sun/org/apache/xml/internal/serialize/XML11Serializer.java
author aefimov
Mon, 31 Mar 2014 19:03:41 +0400
changeset 23777 ce87cedb71cf
parent 12457 c348e06f0e82
child 25834 aba3efbf4ec5
permissions -rw-r--r--
8035437: Xerces Update: xml/serialize/DOMSerializerImpl Reviewed-by: lancea
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
6
7f561c08de6b Initial load
duke
parents:
diff changeset
     1
/*
7f561c08de6b Initial load
duke
parents:
diff changeset
     2
 * reserved comment block
7f561c08de6b Initial load
duke
parents:
diff changeset
     3
 * DO NOT REMOVE OR ALTER!
7f561c08de6b Initial load
duke
parents:
diff changeset
     4
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
     5
/*
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     6
 * Licensed to the Apache Software Foundation (ASF) under one or more
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     7
 * contributor license agreements.  See the NOTICE file distributed with
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     8
 * this work for additional information regarding copyright ownership.
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
     9
 * The ASF licenses this file to You under the Apache License, Version 2.0
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    10
 * (the "License"); you may not use this file except in compliance with
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    11
 * the License.  You may obtain a copy of the License at
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    12
 *
7f561c08de6b Initial load
duke
parents:
diff changeset
    13
 *      http://www.apache.org/licenses/LICENSE-2.0
7f561c08de6b Initial load
duke
parents:
diff changeset
    14
 *
7f561c08de6b Initial load
duke
parents:
diff changeset
    15
 * Unless required by applicable law or agreed to in writing, software
7f561c08de6b Initial load
duke
parents:
diff changeset
    16
 * distributed under the License is distributed on an "AS IS" BASIS,
7f561c08de6b Initial load
duke
parents:
diff changeset
    17
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
7f561c08de6b Initial load
duke
parents:
diff changeset
    18
 * See the License for the specific language governing permissions and
7f561c08de6b Initial load
duke
parents:
diff changeset
    19
 * limitations under the License.
7f561c08de6b Initial load
duke
parents:
diff changeset
    20
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
    21
7f561c08de6b Initial load
duke
parents:
diff changeset
    22
// Sep 14, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    23
//  Fixed problem with namespace handling. Contributed by
7f561c08de6b Initial load
duke
parents:
diff changeset
    24
//  David Blondeau <blondeau@intalio.com>
7f561c08de6b Initial load
duke
parents:
diff changeset
    25
// Sep 14, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    26
//  Fixed serializer to report IO exception directly, instead of at
7f561c08de6b Initial load
duke
parents:
diff changeset
    27
//  the end of document processing.
7f561c08de6b Initial load
duke
parents:
diff changeset
    28
//  Reported by Patrick Higgins <phiggins@transzap.com>
7f561c08de6b Initial load
duke
parents:
diff changeset
    29
// Aug 21, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    30
//  Fixed bug in startDocument not calling prepare.
7f561c08de6b Initial load
duke
parents:
diff changeset
    31
//  Reported by Mikael Staldal <d96-mst-ingen-reklam@d.kth.se>
7f561c08de6b Initial load
duke
parents:
diff changeset
    32
// Aug 21, 2000:
7f561c08de6b Initial load
duke
parents:
diff changeset
    33
//  Added ability to omit DOCTYPE declaration.
7f561c08de6b Initial load
duke
parents:
diff changeset
    34
7f561c08de6b Initial load
duke
parents:
diff changeset
    35
package com.sun.org.apache.xml.internal.serialize;
7f561c08de6b Initial load
duke
parents:
diff changeset
    36
7f561c08de6b Initial load
duke
parents:
diff changeset
    37
import java.io.IOException;
7f561c08de6b Initial load
duke
parents:
diff changeset
    38
import java.io.OutputStream;
7f561c08de6b Initial load
duke
parents:
diff changeset
    39
import java.io.Writer;
7f561c08de6b Initial load
duke
parents:
diff changeset
    40
7f561c08de6b Initial load
duke
parents:
diff changeset
    41
import com.sun.org.apache.xerces.internal.dom.DOMMessageFormatter;
7f561c08de6b Initial load
duke
parents:
diff changeset
    42
import com.sun.org.apache.xerces.internal.util.NamespaceSupport;
7f561c08de6b Initial load
duke
parents:
diff changeset
    43
import com.sun.org.apache.xerces.internal.util.SymbolTable;
7f561c08de6b Initial load
duke
parents:
diff changeset
    44
import com.sun.org.apache.xerces.internal.util.XML11Char;
7f561c08de6b Initial load
duke
parents:
diff changeset
    45
import com.sun.org.apache.xerces.internal.util.XMLChar;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    46
import org.w3c.dom.DOMError;
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    47
import org.w3c.dom.Document;
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    48
import org.xml.sax.SAXException;
7f561c08de6b Initial load
duke
parents:
diff changeset
    49
7f561c08de6b Initial load
duke
parents:
diff changeset
    50
/**
7f561c08de6b Initial load
duke
parents:
diff changeset
    51
 * Implements an XML serializer supporting both DOM and SAX pretty
7f561c08de6b Initial load
duke
parents:
diff changeset
    52
 * serializing. For usage instructions see {@link Serializer}.
7f561c08de6b Initial load
duke
parents:
diff changeset
    53
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    54
 * If an output stream is used, the encoding is taken from the
7f561c08de6b Initial load
duke
parents:
diff changeset
    55
 * output format (defaults to <tt>UTF-8</tt>). If a writer is
7f561c08de6b Initial load
duke
parents:
diff changeset
    56
 * used, make sure the writer uses the same encoding (if applies)
7f561c08de6b Initial load
duke
parents:
diff changeset
    57
 * as specified in the output format.
7f561c08de6b Initial load
duke
parents:
diff changeset
    58
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    59
 * The serializer supports both DOM and SAX. SAX serializing is done by firing
7f561c08de6b Initial load
duke
parents:
diff changeset
    60
 * SAX events and using the serializer as a document handler. DOM serializing is done
7f561c08de6b Initial load
duke
parents:
diff changeset
    61
 * by calling {@link #serialize(Document)} or by using DOM Level 3
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    62
 * {@link org.w3c.dom.ls.LSSerializer} and
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    63
 * serializing with {@link org.w3c.dom.ls.LSSerializer#write},
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
    64
 * {@link org.w3c.dom.ls.LSSerializer#writeToString}.
6
7f561c08de6b Initial load
duke
parents:
diff changeset
    65
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    66
 * If an I/O exception occurs while serializing, the serializer
7f561c08de6b Initial load
duke
parents:
diff changeset
    67
 * will not throw an exception directly, but only throw it
7f561c08de6b Initial load
duke
parents:
diff changeset
    68
 * at the end of serializing (either DOM or SAX's {@link
7f561c08de6b Initial load
duke
parents:
diff changeset
    69
 * org.xml.sax.DocumentHandler#endDocument}).
7f561c08de6b Initial load
duke
parents:
diff changeset
    70
 * <p>
7f561c08de6b Initial load
duke
parents:
diff changeset
    71
 * For elements that are not specified as whitespace preserving,
7f561c08de6b Initial load
duke
parents:
diff changeset
    72
 * the serializer will potentially break long text lines at space
7f561c08de6b Initial load
duke
parents:
diff changeset
    73
 * boundaries, indent lines, and serialize elements on separate
7f561c08de6b Initial load
duke
parents:
diff changeset
    74
 * lines. Line terminators will be regarded as spaces, and
7f561c08de6b Initial load
duke
parents:
diff changeset
    75
 * spaces at beginning of line will be stripped.
7f561c08de6b Initial load
duke
parents:
diff changeset
    76
 * @author <a href="mailto:arkin@intalio.com">Assaf Arkin</a>
7f561c08de6b Initial load
duke
parents:
diff changeset
    77
 * @author <a href="mailto:rahul.srivastava@sun.com">Rahul Srivastava</a>
7f561c08de6b Initial load
duke
parents:
diff changeset
    78
 * @author Elena Litani IBM
7f561c08de6b Initial load
duke
parents:
diff changeset
    79
 * @see Serializer
7f561c08de6b Initial load
duke
parents:
diff changeset
    80
 */
7f561c08de6b Initial load
duke
parents:
diff changeset
    81
public class XML11Serializer
7f561c08de6b Initial load
duke
parents:
diff changeset
    82
extends XMLSerializer {
7f561c08de6b Initial load
duke
parents:
diff changeset
    83
7f561c08de6b Initial load
duke
parents:
diff changeset
    84
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    85
    // constants
7f561c08de6b Initial load
duke
parents:
diff changeset
    86
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    87
7f561c08de6b Initial load
duke
parents:
diff changeset
    88
    protected static final boolean DEBUG = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
    89
7f561c08de6b Initial load
duke
parents:
diff changeset
    90
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    91
    // data
7f561c08de6b Initial load
duke
parents:
diff changeset
    92
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    93
7f561c08de6b Initial load
duke
parents:
diff changeset
    94
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    95
    // DOM Level 3 implementation: variables intialized in DOMSerializerImpl
7f561c08de6b Initial load
duke
parents:
diff changeset
    96
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
    97
7f561c08de6b Initial load
duke
parents:
diff changeset
    98
    /** stores namespaces in scope */
7f561c08de6b Initial load
duke
parents:
diff changeset
    99
    protected NamespaceSupport fNSBinder;
7f561c08de6b Initial load
duke
parents:
diff changeset
   100
7f561c08de6b Initial load
duke
parents:
diff changeset
   101
    /** stores all namespace bindings on the current element */
7f561c08de6b Initial load
duke
parents:
diff changeset
   102
    protected NamespaceSupport fLocalNSBinder;
7f561c08de6b Initial load
duke
parents:
diff changeset
   103
7f561c08de6b Initial load
duke
parents:
diff changeset
   104
    /** symbol table for serialization */
7f561c08de6b Initial load
duke
parents:
diff changeset
   105
    protected SymbolTable fSymbolTable;
7f561c08de6b Initial load
duke
parents:
diff changeset
   106
7f561c08de6b Initial load
duke
parents:
diff changeset
   107
    // is node dom level 1 node?
7f561c08de6b Initial load
duke
parents:
diff changeset
   108
    protected boolean fDOML1 = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
   109
    // counter for new prefix names
7f561c08de6b Initial load
duke
parents:
diff changeset
   110
    protected int fNamespaceCounter = 1;
7f561c08de6b Initial load
duke
parents:
diff changeset
   111
    protected final static String PREFIX = "NS";
7f561c08de6b Initial load
duke
parents:
diff changeset
   112
7f561c08de6b Initial load
duke
parents:
diff changeset
   113
    /**
7f561c08de6b Initial load
duke
parents:
diff changeset
   114
     * Controls whether namespace fixup should be performed during
7f561c08de6b Initial load
duke
parents:
diff changeset
   115
     * the serialization.
7f561c08de6b Initial load
duke
parents:
diff changeset
   116
     * NOTE: if this field is set to true the following
7f561c08de6b Initial load
duke
parents:
diff changeset
   117
     * fields need to be initialized: fNSBinder, fLocalNSBinder, fSymbolTable,
7f561c08de6b Initial load
duke
parents:
diff changeset
   118
     * XMLSymbols.EMPTY_STRING, fXmlSymbol, fXmlnsSymbol, fNamespaceCounter.
7f561c08de6b Initial load
duke
parents:
diff changeset
   119
     */
7f561c08de6b Initial load
duke
parents:
diff changeset
   120
    protected boolean fNamespaces = false;
7f561c08de6b Initial load
duke
parents:
diff changeset
   121
7f561c08de6b Initial load
duke
parents:
diff changeset
   122
    /**
     * Creates a serializer that has no output target yet. Before it can
     * be used, {@link #setOutputCharStream} or {@link #setOutputByteStream}
     * has to be called. The version of the output format is set to "1.1".
     */
    public XML11Serializer() {
        super();
        // This serializer always declares XML version 1.1.
        _format.setVersion("1.1");
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   131
7f561c08de6b Initial load
duke
parents:
diff changeset
   132
7f561c08de6b Initial load
duke
parents:
diff changeset
   133
    /**
     * Creates a serializer that has no output target yet. Before it can
     * be used, {@link #setOutputCharStream} or {@link #setOutputByteStream}
     * has to be called. The version of the output format is set to "1.1".
     *
     * @param format The output format to use
     */
    public XML11Serializer(OutputFormat format) {
        super(format);
        // This serializer always declares XML version 1.1.
        _format.setVersion("1.1");
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   142
7f561c08de6b Initial load
duke
parents:
diff changeset
   143
7f561c08de6b Initial load
duke
parents:
diff changeset
   144
    /**
     * Creates a serializer that writes to the given writer with the
     * given output format. When <tt>format</tt> is null a default
     * output format is used. The version of the output format is set
     * to "1.1".
     *
     * @param writer The writer to use
     * @param format The output format to use, null for the default
     */
    public XML11Serializer(Writer writer, OutputFormat format) {
        super(writer, format);
        // This serializer always declares XML version 1.1.
        _format.setVersion("1.1");
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   156
7f561c08de6b Initial load
duke
parents:
diff changeset
   157
7f561c08de6b Initial load
duke
parents:
diff changeset
   158
    /**
     * Creates a serializer that writes to the given output stream with
     * the given output format. When <tt>format</tt> is null, a new
     * {@code OutputFormat(Method.XML, null, false)} is used instead.
     * The version of the output format is set to "1.1".
     *
     * @param output The output stream to use
     * @param format The output format to use, null for the default
     */
    public XML11Serializer(OutputStream output, OutputFormat format) {
        super(output,
              format == null ? new OutputFormat(Method.XML, null, false) : format);
        // This serializer always declares XML version 1.1.
        _format.setVersion("1.1");
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   170
7f561c08de6b Initial load
duke
parents:
diff changeset
   171
    //-----------------------------------------//
7f561c08de6b Initial load
duke
parents:
diff changeset
   172
    // SAX content handler serializing methods //
7f561c08de6b Initial load
duke
parents:
diff changeset
   173
    //-----------------------------------------//
7f561c08de6b Initial load
duke
parents:
diff changeset
   174
7f561c08de6b Initial load
duke
parents:
diff changeset
   175
7f561c08de6b Initial load
duke
parents:
diff changeset
   176
    public void characters( char[] chars, int start, int length )
7f561c08de6b Initial load
duke
parents:
diff changeset
   177
        throws SAXException
7f561c08de6b Initial load
duke
parents:
diff changeset
   178
    {
7f561c08de6b Initial load
duke
parents:
diff changeset
   179
        ElementState state;
7f561c08de6b Initial load
duke
parents:
diff changeset
   180
7f561c08de6b Initial load
duke
parents:
diff changeset
   181
        try {
7f561c08de6b Initial load
duke
parents:
diff changeset
   182
            state = content();
7f561c08de6b Initial load
duke
parents:
diff changeset
   183
7f561c08de6b Initial load
duke
parents:
diff changeset
   184
            // Check if text should be print as CDATA section or unescaped
7f561c08de6b Initial load
duke
parents:
diff changeset
   185
            // based on elements listed in the output format (the element
7f561c08de6b Initial load
duke
parents:
diff changeset
   186
            // state) or whether we are inside a CDATA section or entity.
7f561c08de6b Initial load
duke
parents:
diff changeset
   187
7f561c08de6b Initial load
duke
parents:
diff changeset
   188
            if ( state.inCData || state.doCData ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   189
                int          saveIndent;
7f561c08de6b Initial load
duke
parents:
diff changeset
   190
7f561c08de6b Initial load
duke
parents:
diff changeset
   191
                // Print a CDATA section. The text is not escaped, but ']]>'
7f561c08de6b Initial load
duke
parents:
diff changeset
   192
                // appearing in the code must be identified and dealt with.
7f561c08de6b Initial load
duke
parents:
diff changeset
   193
                // The contents of a text node is considered space preserving.
7f561c08de6b Initial load
duke
parents:
diff changeset
   194
                if ( ! state.inCData ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   195
                    _printer.printText( "<![CDATA[" );
7f561c08de6b Initial load
duke
parents:
diff changeset
   196
                    state.inCData = true;
7f561c08de6b Initial load
duke
parents:
diff changeset
   197
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   198
                saveIndent = _printer.getNextIndent();
7f561c08de6b Initial load
duke
parents:
diff changeset
   199
                _printer.setNextIndent( 0 );
7f561c08de6b Initial load
duke
parents:
diff changeset
   200
                char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   201
                final int end = start + length;
7f561c08de6b Initial load
duke
parents:
diff changeset
   202
                for ( int index = start; index < end; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   203
                    ch = chars[index];
7f561c08de6b Initial load
duke
parents:
diff changeset
   204
                    if ( ch == ']' && index + 2 < end &&
7f561c08de6b Initial load
duke
parents:
diff changeset
   205
                        chars[ index + 1 ] == ']' && chars[ index + 2 ] == '>' ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   206
                        _printer.printText("]]]]><![CDATA[>");
7f561c08de6b Initial load
duke
parents:
diff changeset
   207
                        index +=2;
7f561c08de6b Initial load
duke
parents:
diff changeset
   208
                        continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   209
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   210
                    if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   211
                        // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   212
                        if (++index < end) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   213
                            surrogates(ch, chars[index], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   214
                        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   215
                        else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   216
                            fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   217
                        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   218
                        continue;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   219
                    }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   220
                    if ( _encodingInfo.isPrintable(ch) && XML11Char.isXML11ValidLiteral(ch)) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   221
                        _printer.printText(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   222
                    }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   223
                    else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   224
                        // The character is not printable -- split CDATA section
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   225
                        _printer.printText("]]>&#x");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   226
                        _printer.printText(Integer.toHexString(ch));
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   227
                        _printer.printText(";<![CDATA[");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   228
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   229
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   230
                _printer.setNextIndent( saveIndent );
7f561c08de6b Initial load
duke
parents:
diff changeset
   231
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   232
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   233
            else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   234
7f561c08de6b Initial load
duke
parents:
diff changeset
   235
                int saveIndent;
7f561c08de6b Initial load
duke
parents:
diff changeset
   236
7f561c08de6b Initial load
duke
parents:
diff changeset
   237
                if ( state.preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   238
                    // If preserving space then hold of indentation so no
7f561c08de6b Initial load
duke
parents:
diff changeset
   239
                    // excessive spaces are printed at line breaks, escape
7f561c08de6b Initial load
duke
parents:
diff changeset
   240
                    // the text content without replacing spaces and print
7f561c08de6b Initial load
duke
parents:
diff changeset
   241
                    // the text breaking only at line breaks.
7f561c08de6b Initial load
duke
parents:
diff changeset
   242
                    saveIndent = _printer.getNextIndent();
7f561c08de6b Initial load
duke
parents:
diff changeset
   243
                    _printer.setNextIndent( 0 );
7f561c08de6b Initial load
duke
parents:
diff changeset
   244
                    printText( chars, start, length, true, state.unescaped );
7f561c08de6b Initial load
duke
parents:
diff changeset
   245
                    _printer.setNextIndent( saveIndent );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   246
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   247
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   248
                    printText( chars, start, length, false, state.unescaped );
7f561c08de6b Initial load
duke
parents:
diff changeset
   249
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   250
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   251
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   252
        catch ( IOException except ) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   253
            throw new SAXException( except );
7f561c08de6b Initial load
duke
parents:
diff changeset
   254
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   255
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   256
7f561c08de6b Initial load
duke
parents:
diff changeset
   257
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   258
    // overwrite printing functions to make sure serializer prints out valid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   259
    //
7f561c08de6b Initial load
duke
parents:
diff changeset
   260
    protected void printEscaped( String source ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   261
        int length = source.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   262
        for ( int i = 0 ; i < length ; ++i ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   263
            int ch = source.charAt(i);
7f561c08de6b Initial load
duke
parents:
diff changeset
   264
            if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   265
                if (++i <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   266
                    surrogates(ch, source.charAt(i), false);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   267
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   268
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   269
                    fatalError("The character '"+(char)ch+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   270
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   271
                continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   272
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   273
            if (ch == '\n' || ch == '\r' || ch == '\t' || ch == 0x0085 || ch == 0x2028) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   274
                printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   275
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   276
            else if (ch == '<') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   277
                _printer.printText("&lt;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   278
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   279
            else if (ch == '&') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   280
                _printer.printText("&amp;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   281
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   282
            else if (ch == '"') {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   283
                _printer.printText("&quot;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   284
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   285
            else if ((ch >= ' ' && _encodingInfo.isPrintable((char) ch))) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   286
                _printer.printText((char) ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   287
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   288
            else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   289
                printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   290
            }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   291
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   292
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   293
7f561c08de6b Initial load
duke
parents:
diff changeset
   294
    protected final void printCDATAText(String text) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   295
        int length = text.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   296
        char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   297
7f561c08de6b Initial load
duke
parents:
diff changeset
   298
        for (int index = 0; index < length; ++index) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   299
            ch = text.charAt(index);
7f561c08de6b Initial load
duke
parents:
diff changeset
   300
7f561c08de6b Initial load
duke
parents:
diff changeset
   301
            if (ch == ']'
7f561c08de6b Initial load
duke
parents:
diff changeset
   302
                && index + 2 < length
7f561c08de6b Initial load
duke
parents:
diff changeset
   303
                && text.charAt(index + 1) == ']'
7f561c08de6b Initial load
duke
parents:
diff changeset
   304
                && text.charAt(index + 2) == '>') { // check for ']]>'
7f561c08de6b Initial load
duke
parents:
diff changeset
   305
                if (fDOMErrorHandler != null){
7f561c08de6b Initial load
duke
parents:
diff changeset
   306
                    // REVISIT: this means that if DOM Error handler is not registered we don't report any
7f561c08de6b Initial load
duke
parents:
diff changeset
   307
                    // fatal errors and might serialize not wellformed document
7f561c08de6b Initial load
duke
parents:
diff changeset
   308
                if ((features & DOMSerializerImpl.SPLITCDATA) == 0
7f561c08de6b Initial load
duke
parents:
diff changeset
   309
                    && (features & DOMSerializerImpl.WELLFORMED) == 0) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   310
                    // issue fatal error
7f561c08de6b Initial load
duke
parents:
diff changeset
   311
                    String msg =
7f561c08de6b Initial load
duke
parents:
diff changeset
   312
                        DOMMessageFormatter.formatMessage(
7f561c08de6b Initial load
duke
parents:
diff changeset
   313
                            DOMMessageFormatter.SERIALIZER_DOMAIN,
7f561c08de6b Initial load
duke
parents:
diff changeset
   314
                            "EndingCDATA",
7f561c08de6b Initial load
duke
parents:
diff changeset
   315
                            null);
7f561c08de6b Initial load
duke
parents:
diff changeset
   316
                    modifyDOMError(
7f561c08de6b Initial load
duke
parents:
diff changeset
   317
                        msg,
7f561c08de6b Initial load
duke
parents:
diff changeset
   318
                        DOMError.SEVERITY_FATAL_ERROR,
7f561c08de6b Initial load
duke
parents:
diff changeset
   319
                        null, fCurrentNode);
7f561c08de6b Initial load
duke
parents:
diff changeset
   320
                    boolean continueProcess =
7f561c08de6b Initial load
duke
parents:
diff changeset
   321
                        fDOMErrorHandler.handleError(fDOMError);
7f561c08de6b Initial load
duke
parents:
diff changeset
   322
                    if (!continueProcess) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   323
                        throw new IOException();
7f561c08de6b Initial load
duke
parents:
diff changeset
   324
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   325
                } else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   326
                    // issue warning
7f561c08de6b Initial load
duke
parents:
diff changeset
   327
                    String msg =
7f561c08de6b Initial load
duke
parents:
diff changeset
   328
                        DOMMessageFormatter.formatMessage(
7f561c08de6b Initial load
duke
parents:
diff changeset
   329
                            DOMMessageFormatter.SERIALIZER_DOMAIN,
7f561c08de6b Initial load
duke
parents:
diff changeset
   330
                            "SplittingCDATA",
7f561c08de6b Initial load
duke
parents:
diff changeset
   331
                            null);
7f561c08de6b Initial load
duke
parents:
diff changeset
   332
                    modifyDOMError(
7f561c08de6b Initial load
duke
parents:
diff changeset
   333
                        msg,
7f561c08de6b Initial load
duke
parents:
diff changeset
   334
                        DOMError.SEVERITY_WARNING,
7f561c08de6b Initial load
duke
parents:
diff changeset
   335
                        null, fCurrentNode);
7f561c08de6b Initial load
duke
parents:
diff changeset
   336
                    fDOMErrorHandler.handleError(fDOMError);
7f561c08de6b Initial load
duke
parents:
diff changeset
   337
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   338
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   339
                // split CDATA section
7f561c08de6b Initial load
duke
parents:
diff changeset
   340
                _printer.printText("]]]]><![CDATA[>");
7f561c08de6b Initial load
duke
parents:
diff changeset
   341
                index += 2;
7f561c08de6b Initial load
duke
parents:
diff changeset
   342
                continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   343
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   344
7f561c08de6b Initial load
duke
parents:
diff changeset
   345
            if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   346
                // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   347
                if (++index < length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   348
                    surrogates(ch, text.charAt(index), true);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   349
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   350
                else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   351
                    fatalError("The character '" + ch + "' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   352
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   353
                continue;
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   354
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   355
            if (_encodingInfo.isPrintable(ch)
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   356
                && XML11Char.isXML11ValidLiteral(ch)) {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   357
                _printer.printText(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   358
            }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   359
            else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   360
                // The character is not printable -- split CDATA section
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   361
                _printer.printText("]]>&#x");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   362
                _printer.printText(Integer.toHexString(ch));
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   363
                _printer.printText(";<![CDATA[");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   364
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   365
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   366
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   367
7f561c08de6b Initial load
duke
parents:
diff changeset
   368
    // note that this "int" should, in all cases, be a char.
7f561c08de6b Initial load
duke
parents:
diff changeset
   369
    // REVISIT:  make it a char...
7f561c08de6b Initial load
duke
parents:
diff changeset
   370
    protected final void printXMLChar( int ch ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   371
7f561c08de6b Initial load
duke
parents:
diff changeset
   372
        if (ch == '\r' || ch == 0x0085 || ch == 0x2028) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   373
            printHex(ch);
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   374
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   375
        else if ( ch == '<') {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   376
            _printer.printText("&lt;");
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   377
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   378
        else if (ch == '&') {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   379
            _printer.printText("&amp;");
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   380
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   381
        else if (ch == '>'){
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   382
            // character sequence "]]>" can't appear in content, therefore
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   383
            // we should escape '>'
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   384
            _printer.printText("&gt;");
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   385
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   386
        else if ( _encodingInfo.isPrintable((char)ch) && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   387
            _printer.printText((char)ch);
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   388
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   389
        else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   390
            printHex(ch);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   391
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   392
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   393
7f561c08de6b Initial load
duke
parents:
diff changeset
   394
7f561c08de6b Initial load
duke
parents:
diff changeset
   395
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   396
    protected final void surrogates(int high, int low, boolean inContent) throws IOException{
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   397
        if (XMLChar.isHighSurrogate(high)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   398
            if (!XMLChar.isLowSurrogate(low)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   399
                //Invalid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   400
                fatalError("The character '"+(char)low+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   401
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   402
            else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   403
                int supplemental = XMLChar.supplemental((char)high, (char)low);
7f561c08de6b Initial load
duke
parents:
diff changeset
   404
                if (!XML11Char.isXML11Valid(supplemental)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   405
                    //Invalid XML
7f561c08de6b Initial load
duke
parents:
diff changeset
   406
                    fatalError("The character '"+(char)supplemental+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   407
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   408
                else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   409
                    if (inContent && content().inCData) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   410
                        _printer.printText("]]>&#x");
7f561c08de6b Initial load
duke
parents:
diff changeset
   411
                        _printer.printText(Integer.toHexString(supplemental));
7f561c08de6b Initial load
duke
parents:
diff changeset
   412
                        _printer.printText(";<![CDATA[");
7f561c08de6b Initial load
duke
parents:
diff changeset
   413
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   414
                    else {
7f561c08de6b Initial load
duke
parents:
diff changeset
   415
                                                printHex(supplemental);
7f561c08de6b Initial load
duke
parents:
diff changeset
   416
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   417
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   418
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   419
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   420
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   421
            fatalError("The character '"+(char)high+"' is an invalid XML character");
7f561c08de6b Initial load
duke
parents:
diff changeset
   422
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   423
7f561c08de6b Initial load
duke
parents:
diff changeset
   424
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   425
7f561c08de6b Initial load
duke
parents:
diff changeset
   426
7f561c08de6b Initial load
duke
parents:
diff changeset
   427
    protected void printText( String text, boolean preserveSpace, boolean unescaped )
7f561c08de6b Initial load
duke
parents:
diff changeset
   428
    throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   429
        int index;
7f561c08de6b Initial load
duke
parents:
diff changeset
   430
        char ch;
7f561c08de6b Initial load
duke
parents:
diff changeset
   431
        int length = text.length();
7f561c08de6b Initial load
duke
parents:
diff changeset
   432
        if ( preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   433
            // Preserving spaces: the text must print exactly as it is,
7f561c08de6b Initial load
duke
parents:
diff changeset
   434
            // without breaking when spaces appear in the text and without
7f561c08de6b Initial load
duke
parents:
diff changeset
   435
            // consolidating spaces. If a line terminator is used, a line
7f561c08de6b Initial load
duke
parents:
diff changeset
   436
            // break will occur.
7f561c08de6b Initial load
duke
parents:
diff changeset
   437
            for ( index = 0 ; index < length ; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   438
                ch = text.charAt( index );
7f561c08de6b Initial load
duke
parents:
diff changeset
   439
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   440
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   441
                    if (++index <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   442
                        surrogates(ch, text.charAt(index), true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   443
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   444
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   445
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   446
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   447
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   448
                if ( unescaped  && XML11Char.isXML11ValidLiteral(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   449
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   450
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   451
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   452
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   453
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   454
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   455
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   456
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   457
            // Not preserving spaces: print one part at a time, and
7f561c08de6b Initial load
duke
parents:
diff changeset
   458
            // use spaces between parts to break them into different
7f561c08de6b Initial load
duke
parents:
diff changeset
   459
            // lines. Spaces at beginning of line will be stripped
7f561c08de6b Initial load
duke
parents:
diff changeset
   460
            // by printing mechanism. Line terminator is treated
7f561c08de6b Initial load
duke
parents:
diff changeset
   461
            // no different than other text part.
7f561c08de6b Initial load
duke
parents:
diff changeset
   462
            for ( index = 0 ; index < length ; ++index ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   463
                ch = text.charAt( index );
7f561c08de6b Initial load
duke
parents:
diff changeset
   464
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   465
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   466
                    if (++index <length) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   467
                        surrogates(ch, text.charAt(index), true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   468
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   469
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   470
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   471
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   472
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   473
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   474
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch) ) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   475
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   476
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   477
                else {
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   478
                    printXMLChar( ch );
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   479
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   480
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   481
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   482
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   483
7f561c08de6b Initial load
duke
parents:
diff changeset
   484
    protected void printText( char[] chars, int start, int length,
7f561c08de6b Initial load
duke
parents:
diff changeset
   485
                              boolean preserveSpace, boolean unescaped ) throws IOException {
7f561c08de6b Initial load
duke
parents:
diff changeset
   486
7f561c08de6b Initial load
duke
parents:
diff changeset
   487
        if ( preserveSpace ) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   488
            // Preserving spaces: the text must print exactly as it is,
7f561c08de6b Initial load
duke
parents:
diff changeset
   489
            // without breaking when spaces appear in the text and without
7f561c08de6b Initial load
duke
parents:
diff changeset
   490
            // consolidating spaces. If a line terminator is used, a line
7f561c08de6b Initial load
duke
parents:
diff changeset
   491
            // break will occur.
7f561c08de6b Initial load
duke
parents:
diff changeset
   492
            while ( length-- > 0 ) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   493
                char ch = chars[start++];
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   494
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   495
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   496
                    if ( length-- > 0) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   497
                        surrogates(ch, chars[start++], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   498
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   499
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   500
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   501
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   502
                }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   503
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   504
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   505
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   506
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   507
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   508
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   509
            }
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   510
        }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   511
        else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   512
            // Not preserving spaces: print one part at a time, and
7f561c08de6b Initial load
duke
parents:
diff changeset
   513
            // use spaces between parts to break them into different
7f561c08de6b Initial load
duke
parents:
diff changeset
   514
            // lines. Spaces at beginning of line will be stripped
7f561c08de6b Initial load
duke
parents:
diff changeset
   515
            // by printing mechanism. Line terminator is treated
7f561c08de6b Initial load
duke
parents:
diff changeset
   516
            // no different than other text part.
7f561c08de6b Initial load
duke
parents:
diff changeset
   517
            while ( length-- > 0 ) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   518
                char ch = chars[start++];
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   519
                if (!XML11Char.isXML11Valid(ch)) {
7f561c08de6b Initial load
duke
parents:
diff changeset
   520
                    // check if it is surrogate
7f561c08de6b Initial load
duke
parents:
diff changeset
   521
                    if ( length-- > 0) {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   522
                        surrogates(ch, chars[start++], true);
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   523
                    } else {
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   524
                        fatalError("The character '"+ch+"' is an invalid XML character");
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   525
                    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   526
                    continue;
7f561c08de6b Initial load
duke
parents:
diff changeset
   527
                }
7f561c08de6b Initial load
duke
parents:
diff changeset
   528
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   529
                if ( unescaped && XML11Char.isXML11ValidLiteral(ch)) {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   530
                    _printer.printText( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   531
                }
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   532
                else {
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   533
                    printXMLChar( ch );
23777
ce87cedb71cf 8035437: Xerces Update: xml/serialize/DOMSerializerImpl
aefimov
parents: 12457
diff changeset
   534
                }
6
7f561c08de6b Initial load
duke
parents:
diff changeset
   535
            }
7f561c08de6b Initial load
duke
parents:
diff changeset
   536
        }
7f561c08de6b Initial load
duke
parents:
diff changeset
   537
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   538
7f561c08de6b Initial load
duke
parents:
diff changeset
   539
    public boolean reset() {
7f561c08de6b Initial load
duke
parents:
diff changeset
   540
        super.reset();
7f561c08de6b Initial load
duke
parents:
diff changeset
   541
        return true;
7f561c08de6b Initial load
duke
parents:
diff changeset
   542
    }
7f561c08de6b Initial load
duke
parents:
diff changeset
   543
7f561c08de6b Initial load
duke
parents:
diff changeset
   544
}