KickJava   Java API By Example, From Geeks To Geeks.

Java > Open Source Codes > org > enhydra > apache > xerces > readers > EBCDICRecognizer


1 /*
2  * The Apache Software License, Version 1.1
3  *
4  *
5  * Copyright (c) 1999 The Apache Software Foundation. All rights
6  * reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  *
12  * 1. Redistributions of source code must retain the above copyright
13  * notice, this list of conditions and the following disclaimer.
14  *
15  * 2. Redistributions in binary form must reproduce the above copyright
16  * notice, this list of conditions and the following disclaimer in
17  * the documentation and/or other materials provided with the
18  * distribution.
19  *
20  * 3. The end-user documentation included with the redistribution,
21  * if any, must include the following acknowledgment:
22  * "This product includes software developed by the
23  * Apache Software Foundation (http://www.apache.org/)."
24  * Alternately, this acknowledgment may appear in the software itself,
25  * if and wherever such third-party acknowledgments normally appear.
26  *
27  * 4. The names "Xerces" and "Apache Software Foundation" must
28  * not be used to endorse or promote products derived from this
29  * software without prior written permission. For written
30  * permission, please contact apache@apache.org.
31  *
32  * 5. Products derived from this software may not be called "Apache",
33  * nor may "Apache" appear in their name, without prior written
34  * permission of the Apache Software Foundation.
35  *
36  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
37  * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
38  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
39  * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
40  * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
41  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
42  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
43  * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
44  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
45  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
46  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
47  * SUCH DAMAGE.
48  * ====================================================================
49  *
50  * This software consists of voluntary contributions made by many
51  * individuals on behalf of the Apache Software Foundation and was
52  * originally based on software copyright (c) 1999, International
53  * Business Machines, Inc., http://www.apache.org. For more
54  * information on the Apache Software Foundation, please see
55  * <http://www.apache.org/>.
56  */

57
58 package org.enhydra.apache.xerces.readers;
59
60 import java.io.InputStreamReader JavaDoc;
61 import java.io.UnsupportedEncodingException JavaDoc;
62
63 import org.enhydra.apache.xerces.framework.XMLErrorReporter;
64 import org.enhydra.apache.xerces.utils.ChunkyByteArray;
65 import org.enhydra.apache.xerces.utils.StringPool;
66
67 /**
68  *
69  * @version
70  */

71 final class EBCDICRecognizer extends XMLDeclRecognizer {
72     //
73
//
74
//
75
public XMLEntityHandler.EntityReader recognize(XMLEntityReaderFactory readerFactory,
76                                                    XMLEntityHandler entityHandler,
77                                                    XMLErrorReporter errorReporter,
78                                                    boolean sendCharDataAsCharArray,
79                                                    StringPool stringPool,
80                                                    ChunkyByteArray data,
81                                                    boolean xmlDecl,
82                                                    boolean allowJavaEncodingName) throws Exception JavaDoc
83     {
84         XMLEntityHandler.EntityReader reader = null;
85         byte b0 = data.byteAt(0);
86         byte b1 = data.byteAt(1);
87         byte b2 = data.byteAt(2);
88         byte b3 = data.byteAt(3);
89         boolean debug = false;
90
91         if (b0 != 0x4c || b1 != 0x6f || b2 != (byte)0xa7 || b3 != (byte)0x94)
92             return reader;
93         XMLEntityHandler.EntityReader declReader = readerFactory.createCharReader(entityHandler, errorReporter, sendCharDataAsCharArray, new InputStreamReader JavaDoc(data, "CP037"), stringPool);
94         int encoding = prescanXMLDeclOrTextDecl(declReader, xmlDecl);
95         if (encoding == -1) {
96             data.rewind();
97             // REVISIT - The document is not well-formed. There is no encoding, yet the file is
98
// clearly not UTF8.
99
throw new UnsupportedEncodingException JavaDoc(null);
100         }
101         String JavaDoc enc = stringPool.orphanString(encoding).toUpperCase();
102         if ("ISO-10646-UCS-2".equals(enc)) throw new UnsupportedEncodingException JavaDoc(enc);
103         if ("ISO-10646-UCS-4".equals(enc)) throw new UnsupportedEncodingException JavaDoc(enc);
104         if ("UTF-16".equals(enc)) throw new UnsupportedEncodingException JavaDoc(enc);
105         String JavaDoc javaencname = MIME2Java.convert(enc);
106         if (null == javaencname) {
107             if (allowJavaEncodingName) {
108                 javaencname = enc;
109             } else {
110                 throw new UnsupportedEncodingException JavaDoc(enc);
111             }
112         }
113         try {
114             data.rewind();
115             reader = readerFactory.createCharReader(entityHandler, errorReporter, sendCharDataAsCharArray, new InputStreamReader JavaDoc(data, javaencname), stringPool);
116         } catch (UnsupportedEncodingException JavaDoc e) {
117             throw e;
118         } catch (Exception JavaDoc e) {
119             if( debug == true )
120                 e.printStackTrace(); // Internal Error
121
}
122         return reader;
123     }
124 }
125
Popular Tags