jackrabbit-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From tri...@apache.org
Subject svn commit: r1512568 [27/39] - in /jackrabbit/commons/filevault/trunk: ./ parent/ vault-cli/ vault-cli/src/ vault-cli/src/main/ vault-cli/src/main/appassembler/ vault-cli/src/main/assembly/ vault-cli/src/main/java/ vault-cli/src/main/java/org/ vault-cl...
Date Sat, 10 Aug 2013 05:53:54 GMT
Added: jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/EncodingMap.java
URL: http://svn.apache.org/viewvc/jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/EncodingMap.java?rev=1512568&view=auto
==============================================================================
--- jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/EncodingMap.java (added)
+++ jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/EncodingMap.java Sat Aug 10 05:53:42 2013
@@ -0,0 +1,1018 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.jackrabbit.vault.util.xml.xerces.util;
+
+import java.util.Hashtable;
+
+/**
+ * EncodingMap is a convenience class which handles conversions between
+ * IANA encoding names and Java encoding names, and vice versa. The
+ * encoding names used in XML instance documents <strong>must</strong>
+ * be the IANA encoding names specified or one of the aliases for those names
+ * which IANA defines.
+ * <p/>
+ * <TABLE BORDER="0" WIDTH="100%">
+ * <TR>
+ * <TD WIDTH="33%">
+ * <P ALIGN="CENTER"><B>Common Name</B>
+ * </TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER"><B>Use this name in XML files</B>
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER"><B>Name Type</B>
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER"><B>Xerces converts to this Java Encoder Name</B>
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">8 bit Unicode</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">UTF-8
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">UTF8
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin 1</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-1
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-1
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin 2</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-2
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-2
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin 3</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-3
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-3
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin 4</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-4
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-4
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin Cyrillic</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-5
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-5
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin Arabic</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-6
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-6
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin Greek</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-7
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-7
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin Hebrew</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-8
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-8
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">ISO Latin 5</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ISO-8859-9
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">ISO-8859-9
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: US</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-us
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp037
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Canada</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-ca
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp037
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Netherlands</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-nl
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp037
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Denmark</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-dk
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp277
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Norway</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-no
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp277
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Finland</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-fi
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp278
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Sweden</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-se
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp278
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Italy</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-it
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp280
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Spain, Latin America</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-es
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp284
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Great Britain</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-gb
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp285
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: France</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-fr
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp297
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Arabic</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-ar1
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp420
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Hebrew</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-he
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp424
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Switzerland</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-ch
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp500
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Roece</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-roece
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp870
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Yugoslavia</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-yu
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp870
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Iceland</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-is
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp871
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">EBCDIC: Urdu</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">ebcdic-cp-ar2
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">IANA
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">cp918
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Chinese for PRC, mixed 1/2 byte</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">gb2312
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">GB2312
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Extended Unix Code, packed for Japanese</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">euc-jp
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">eucjis
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Japanese: iso-2022-jp</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">iso-2020-jp
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">JIS
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Japanese: Shift JIS</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">Shift_JIS
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">SJIS
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Chinese: Big5</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">Big5
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">Big5
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Extended Unix Code, packed for Korean</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">euc-kr
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">iso2022kr
+ * </TD>
+ * </TR>
+ * <TR>
+ * <TD WIDTH="33%">Cyrillic</TD>
+ * <TD WIDTH="15%">
+ * <P ALIGN="CENTER">koi8-r
+ * </TD>
+ * <TD WIDTH="12%">
+ * <P ALIGN="CENTER">MIME
+ * </TD>
+ * <TD WIDTH="31%">
+ * <P ALIGN="CENTER">koi8-r
+ * </TD>
+ * </TR>
+ * </TABLE>
+ *
+ * @author TAMURA Kent, IBM
+ * @author Andy Clark, IBM
+ * @version $Id$
+ */
+public class EncodingMap {
+
+    //
+    // Data
+    //
+
+    /**
+     * fIANA2JavaMap
+     */
+    protected final static Hashtable fIANA2JavaMap = new Hashtable();
+
+    /**
+     * fJava2IANAMap
+     */
+    protected final static Hashtable fJava2IANAMap = new Hashtable();
+
+    //
+    // Static initialization
+    //
+
+    static {
+
+        // add IANA to Java encoding mappings.
+        fIANA2JavaMap.put("BIG5", "Big5");
+        fIANA2JavaMap.put("CSBIG5", "Big5");
+        fIANA2JavaMap.put("CP037", "CP037");
+        fIANA2JavaMap.put("IBM037", "CP037");
+        fIANA2JavaMap.put("CSIBM037", "CP037");
+        fIANA2JavaMap.put("EBCDIC-CP-US", "CP037");
+        fIANA2JavaMap.put("EBCDIC-CP-CA", "CP037");
+        fIANA2JavaMap.put("EBCDIC-CP-NL", "CP037");
+        fIANA2JavaMap.put("EBCDIC-CP-WT", "CP037");
+        fIANA2JavaMap.put("IBM273", "CP273");
+        fIANA2JavaMap.put("CP273", "CP273");
+        fIANA2JavaMap.put("CSIBM273", "CP273");
+        fIANA2JavaMap.put("IBM277", "CP277");
+        fIANA2JavaMap.put("CP277", "CP277");
+        fIANA2JavaMap.put("CSIBM277", "CP277");
+        fIANA2JavaMap.put("EBCDIC-CP-DK", "CP277");
+        fIANA2JavaMap.put("EBCDIC-CP-NO", "CP277");
+        fIANA2JavaMap.put("IBM278", "CP278");
+        fIANA2JavaMap.put("CP278", "CP278");
+        fIANA2JavaMap.put("CSIBM278", "CP278");
+        fIANA2JavaMap.put("EBCDIC-CP-FI", "CP278");
+        fIANA2JavaMap.put("EBCDIC-CP-SE", "CP278");
+        fIANA2JavaMap.put("IBM280", "CP280");
+        fIANA2JavaMap.put("CP280", "CP280");
+        fIANA2JavaMap.put("CSIBM280", "CP280");
+        fIANA2JavaMap.put("EBCDIC-CP-IT", "CP280");
+        fIANA2JavaMap.put("IBM284", "CP284");
+        fIANA2JavaMap.put("CP284", "CP284");
+        fIANA2JavaMap.put("CSIBM284", "CP284");
+        fIANA2JavaMap.put("EBCDIC-CP-ES", "CP284");
+        fIANA2JavaMap.put("EBCDIC-CP-GB", "CP285");
+        fIANA2JavaMap.put("IBM285", "CP285");
+        fIANA2JavaMap.put("CP285", "CP285");
+        fIANA2JavaMap.put("CSIBM285", "CP285");
+        fIANA2JavaMap.put("EBCDIC-JP-KANA", "CP290");
+        fIANA2JavaMap.put("IBM290", "CP290");
+        fIANA2JavaMap.put("CP290", "CP290");
+        fIANA2JavaMap.put("CSIBM290", "CP290");
+        fIANA2JavaMap.put("EBCDIC-CP-FR", "CP297");
+        fIANA2JavaMap.put("IBM297", "CP297");
+        fIANA2JavaMap.put("CP297", "CP297");
+        fIANA2JavaMap.put("CSIBM297", "CP297");
+        fIANA2JavaMap.put("EBCDIC-CP-AR1", "CP420");
+        fIANA2JavaMap.put("IBM420", "CP420");
+        fIANA2JavaMap.put("CP420", "CP420");
+        fIANA2JavaMap.put("CSIBM420", "CP420");
+        fIANA2JavaMap.put("EBCDIC-CP-HE", "CP424");
+        fIANA2JavaMap.put("IBM424", "CP424");
+        fIANA2JavaMap.put("CP424", "CP424");
+        fIANA2JavaMap.put("CSIBM424", "CP424");
+        fIANA2JavaMap.put("IBM437", "CP437");
+        fIANA2JavaMap.put("437", "CP437");
+        fIANA2JavaMap.put("CP437", "CP437");
+        fIANA2JavaMap.put("CSPC8CODEPAGE437", "CP437");
+        fIANA2JavaMap.put("EBCDIC-CP-CH", "CP500");
+        fIANA2JavaMap.put("IBM500", "CP500");
+        fIANA2JavaMap.put("CP500", "CP500");
+        fIANA2JavaMap.put("CSIBM500", "CP500");
+        fIANA2JavaMap.put("EBCDIC-CP-CH", "CP500");
+        fIANA2JavaMap.put("EBCDIC-CP-BE", "CP500");
+        fIANA2JavaMap.put("IBM775", "CP775");
+        fIANA2JavaMap.put("CP775", "CP775");
+        fIANA2JavaMap.put("CSPC775BALTIC", "CP775");
+        fIANA2JavaMap.put("IBM850", "CP850");
+        fIANA2JavaMap.put("850", "CP850");
+        fIANA2JavaMap.put("CP850", "CP850");
+        fIANA2JavaMap.put("CSPC850MULTILINGUAL", "CP850");
+        fIANA2JavaMap.put("IBM852", "CP852");
+        fIANA2JavaMap.put("852", "CP852");
+        fIANA2JavaMap.put("CP852", "CP852");
+        fIANA2JavaMap.put("CSPCP852", "CP852");
+        fIANA2JavaMap.put("IBM855", "CP855");
+        fIANA2JavaMap.put("855", "CP855");
+        fIANA2JavaMap.put("CP855", "CP855");
+        fIANA2JavaMap.put("CSIBM855", "CP855");
+        fIANA2JavaMap.put("IBM857", "CP857");
+        fIANA2JavaMap.put("857", "CP857");
+        fIANA2JavaMap.put("CP857", "CP857");
+        fIANA2JavaMap.put("CSIBM857", "CP857");
+        fIANA2JavaMap.put("IBM00858", "CP858");
+        fIANA2JavaMap.put("CP00858", "CP858");
+        fIANA2JavaMap.put("CCSID00858", "CP858");
+        fIANA2JavaMap.put("IBM860", "CP860");
+        fIANA2JavaMap.put("860", "CP860");
+        fIANA2JavaMap.put("CP860", "CP860");
+        fIANA2JavaMap.put("CSIBM860", "CP860");
+        fIANA2JavaMap.put("IBM861", "CP861");
+        fIANA2JavaMap.put("861", "CP861");
+        fIANA2JavaMap.put("CP861", "CP861");
+        fIANA2JavaMap.put("CP-IS", "CP861");
+        fIANA2JavaMap.put("CSIBM861", "CP861");
+        fIANA2JavaMap.put("IBM862", "CP862");
+        fIANA2JavaMap.put("862", "CP862");
+        fIANA2JavaMap.put("CP862", "CP862");
+        fIANA2JavaMap.put("CSPC862LATINHEBREW", "CP862");
+        fIANA2JavaMap.put("IBM863", "CP863");
+        fIANA2JavaMap.put("863", "CP863");
+        fIANA2JavaMap.put("CP863", "CP863");
+        fIANA2JavaMap.put("CSIBM863", "CP863");
+        fIANA2JavaMap.put("IBM864", "CP864");
+        fIANA2JavaMap.put("CP864", "CP864");
+        fIANA2JavaMap.put("CSIBM864", "CP864");
+        fIANA2JavaMap.put("IBM865", "CP865");
+        fIANA2JavaMap.put("865", "CP865");
+        fIANA2JavaMap.put("CP865", "CP865");
+        fIANA2JavaMap.put("CSIBM865", "CP865");
+        fIANA2JavaMap.put("IBM866", "CP866");
+        fIANA2JavaMap.put("866", "CP866");
+        fIANA2JavaMap.put("CP866", "CP866");
+        fIANA2JavaMap.put("CSIBM866", "CP866");
+        fIANA2JavaMap.put("IBM868", "CP868");
+        fIANA2JavaMap.put("CP868", "CP868");
+        fIANA2JavaMap.put("CSIBM868", "CP868");
+        fIANA2JavaMap.put("CP-AR", "CP868");
+        fIANA2JavaMap.put("IBM869", "CP869");
+        fIANA2JavaMap.put("CP869", "CP869");
+        fIANA2JavaMap.put("CSIBM869", "CP869");
+        fIANA2JavaMap.put("CP-GR", "CP869");
+        fIANA2JavaMap.put("IBM870", "CP870");
+        fIANA2JavaMap.put("CP870", "CP870");
+        fIANA2JavaMap.put("CSIBM870", "CP870");
+        fIANA2JavaMap.put("EBCDIC-CP-ROECE", "CP870");
+        fIANA2JavaMap.put("EBCDIC-CP-YU", "CP870");
+        fIANA2JavaMap.put("IBM871", "CP871");
+        fIANA2JavaMap.put("CP871", "CP871");
+        fIANA2JavaMap.put("CSIBM871", "CP871");
+        fIANA2JavaMap.put("EBCDIC-CP-IS", "CP871");
+        fIANA2JavaMap.put("IBM918", "CP918");
+        fIANA2JavaMap.put("CP918", "CP918");
+        fIANA2JavaMap.put("CSIBM918", "CP918");
+        fIANA2JavaMap.put("EBCDIC-CP-AR2", "CP918");
+        fIANA2JavaMap.put("IBM00924", "CP924");
+        fIANA2JavaMap.put("CP00924", "CP924");
+        fIANA2JavaMap.put("CCSID00924", "CP924");
+        // is this an error???
+        fIANA2JavaMap.put("EBCDIC-LATIN9--EURO", "CP924");
+        fIANA2JavaMap.put("IBM1026", "CP1026");
+        fIANA2JavaMap.put("CP1026", "CP1026");
+        fIANA2JavaMap.put("CSIBM1026", "CP1026");
+        fIANA2JavaMap.put("IBM01140", "Cp1140");
+        fIANA2JavaMap.put("CP01140", "Cp1140");
+        fIANA2JavaMap.put("CCSID01140", "Cp1140");
+        fIANA2JavaMap.put("IBM01141", "Cp1141");
+        fIANA2JavaMap.put("CP01141", "Cp1141");
+        fIANA2JavaMap.put("CCSID01141", "Cp1141");
+        fIANA2JavaMap.put("IBM01142", "Cp1142");
+        fIANA2JavaMap.put("CP01142", "Cp1142");
+        fIANA2JavaMap.put("CCSID01142", "Cp1142");
+        fIANA2JavaMap.put("IBM01143", "Cp1143");
+        fIANA2JavaMap.put("CP01143", "Cp1143");
+        fIANA2JavaMap.put("CCSID01143", "Cp1143");
+        fIANA2JavaMap.put("IBM01144", "Cp1144");
+        fIANA2JavaMap.put("CP01144", "Cp1144");
+        fIANA2JavaMap.put("CCSID01144", "Cp1144");
+        fIANA2JavaMap.put("IBM01145", "Cp1145");
+        fIANA2JavaMap.put("CP01145", "Cp1145");
+        fIANA2JavaMap.put("CCSID01145", "Cp1145");
+        fIANA2JavaMap.put("IBM01146", "Cp1146");
+        fIANA2JavaMap.put("CP01146", "Cp1146");
+        fIANA2JavaMap.put("CCSID01146", "Cp1146");
+        fIANA2JavaMap.put("IBM01147", "Cp1147");
+        fIANA2JavaMap.put("CP01147", "Cp1147");
+        fIANA2JavaMap.put("CCSID01147", "Cp1147");
+        fIANA2JavaMap.put("IBM01148", "Cp1148");
+        fIANA2JavaMap.put("CP01148", "Cp1148");
+        fIANA2JavaMap.put("CCSID01148", "Cp1148");
+        fIANA2JavaMap.put("IBM01149", "Cp1149");
+        fIANA2JavaMap.put("CP01149", "Cp1149");
+        fIANA2JavaMap.put("CCSID01149", "Cp1149");
+        fIANA2JavaMap.put("EUC-JP", "EUCJIS");
+        fIANA2JavaMap.put("CSEUCPKDFMTJAPANESE", "EUCJIS");
+        fIANA2JavaMap.put("EXTENDED_UNIX_CODE_PACKED_FORMAT_FOR_JAPANESE", "EUCJIS");
+        fIANA2JavaMap.put("EUC-KR", "KSC5601");
+        fIANA2JavaMap.put("CSEUCKR", "KSC5601");
+        fIANA2JavaMap.put("KS_C_5601-1987", "KS_C_5601-1987");
+        fIANA2JavaMap.put("ISO-IR-149", "KS_C_5601-1987");
+        fIANA2JavaMap.put("KS_C_5601-1989", "KS_C_5601-1987");
+        fIANA2JavaMap.put("KSC_5601", "KS_C_5601-1987");
+        fIANA2JavaMap.put("KOREAN", "KS_C_5601-1987");
+        fIANA2JavaMap.put("CSKSC56011987", "KS_C_5601-1987");
+        fIANA2JavaMap.put("GB2312", "GB2312");
+        fIANA2JavaMap.put("CSGB2312", "GB2312");
+        fIANA2JavaMap.put("ISO-2022-JP", "JIS");
+        fIANA2JavaMap.put("CSISO2022JP", "JIS");
+        fIANA2JavaMap.put("ISO-2022-KR", "ISO2022KR");
+        fIANA2JavaMap.put("CSISO2022KR", "ISO2022KR");
+        fIANA2JavaMap.put("ISO-2022-CN", "ISO2022CN");
+
+        fIANA2JavaMap.put("X0201", "JIS0201");
+        fIANA2JavaMap.put("CSISO13JISC6220JP", "JIS0201");
+        fIANA2JavaMap.put("X0208", "JIS0208");
+        fIANA2JavaMap.put("ISO-IR-87", "JIS0208");
+        fIANA2JavaMap.put("X0208dbiJIS_X0208-1983", "JIS0208");
+        fIANA2JavaMap.put("CSISO87JISX0208", "JIS0208");
+        fIANA2JavaMap.put("X0212", "JIS0212");
+        fIANA2JavaMap.put("ISO-IR-159", "JIS0212");
+        fIANA2JavaMap.put("CSISO159JISX02121990", "JIS0212");
+        fIANA2JavaMap.put("GB18030", "GB18030");
+        fIANA2JavaMap.put("GBK", "GBK");
+        fIANA2JavaMap.put("CP936", "GBK");
+        fIANA2JavaMap.put("MS936", "GBK");
+        fIANA2JavaMap.put("WINDOWS-936", "GBK");
+        fIANA2JavaMap.put("SHIFT_JIS", "SJIS");
+        fIANA2JavaMap.put("CSSHIFTJIS", "SJIS");
+        fIANA2JavaMap.put("MS_KANJI", "SJIS");
+        fIANA2JavaMap.put("WINDOWS-31J", "MS932");
+        fIANA2JavaMap.put("CSWINDOWS31J", "MS932");
+
+        // Add support for Cp1252 and its friends
+        fIANA2JavaMap.put("WINDOWS-1250", "Cp1250");
+        fIANA2JavaMap.put("WINDOWS-1251", "Cp1251");
+        fIANA2JavaMap.put("WINDOWS-1252", "Cp1252");
+        fIANA2JavaMap.put("WINDOWS-1253", "Cp1253");
+        fIANA2JavaMap.put("WINDOWS-1254", "Cp1254");
+        fIANA2JavaMap.put("WINDOWS-1255", "Cp1255");
+        fIANA2JavaMap.put("WINDOWS-1256", "Cp1256");
+        fIANA2JavaMap.put("WINDOWS-1257", "Cp1257");
+        fIANA2JavaMap.put("WINDOWS-1258", "Cp1258");
+        fIANA2JavaMap.put("TIS-620", "TIS620");
+
+        fIANA2JavaMap.put("ISO-8859-1", "ISO8859_1");
+        fIANA2JavaMap.put("ISO-IR-100", "ISO8859_1");
+        fIANA2JavaMap.put("ISO_8859-1", "ISO8859_1");
+        fIANA2JavaMap.put("LATIN1", "ISO8859_1");
+        fIANA2JavaMap.put("CSISOLATIN1", "ISO8859_1");
+        fIANA2JavaMap.put("L1", "ISO8859_1");
+        fIANA2JavaMap.put("IBM819", "ISO8859_1");
+        fIANA2JavaMap.put("CP819", "ISO8859_1");
+
+        fIANA2JavaMap.put("ISO-8859-2", "ISO8859_2");
+        fIANA2JavaMap.put("ISO-IR-101", "ISO8859_2");
+        fIANA2JavaMap.put("ISO_8859-2", "ISO8859_2");
+        fIANA2JavaMap.put("LATIN2", "ISO8859_2");
+        fIANA2JavaMap.put("CSISOLATIN2", "ISO8859_2");
+        fIANA2JavaMap.put("L2", "ISO8859_2");
+
+        fIANA2JavaMap.put("ISO-8859-3", "ISO8859_3");
+        fIANA2JavaMap.put("ISO-IR-109", "ISO8859_3");
+        fIANA2JavaMap.put("ISO_8859-3", "ISO8859_3");
+        fIANA2JavaMap.put("LATIN3", "ISO8859_3");
+        fIANA2JavaMap.put("CSISOLATIN3", "ISO8859_3");
+        fIANA2JavaMap.put("L3", "ISO8859_3");
+
+        fIANA2JavaMap.put("ISO-8859-4", "ISO8859_4");
+        fIANA2JavaMap.put("ISO-IR-110", "ISO8859_4");
+        fIANA2JavaMap.put("ISO_8859-4", "ISO8859_4");
+        fIANA2JavaMap.put("LATIN4", "ISO8859_4");
+        fIANA2JavaMap.put("CSISOLATIN4", "ISO8859_4");
+        fIANA2JavaMap.put("L4", "ISO8859_4");
+
+        fIANA2JavaMap.put("ISO-8859-5", "ISO8859_5");
+        fIANA2JavaMap.put("ISO-IR-144", "ISO8859_5");
+        fIANA2JavaMap.put("ISO_8859-5", "ISO8859_5");
+        fIANA2JavaMap.put("CYRILLIC", "ISO8859_5");
+        fIANA2JavaMap.put("CSISOLATINCYRILLIC", "ISO8859_5");
+
+        fIANA2JavaMap.put("ISO-8859-6", "ISO8859_6");
+        fIANA2JavaMap.put("ISO-IR-127", "ISO8859_6");
+        fIANA2JavaMap.put("ISO_8859-6", "ISO8859_6");
+        fIANA2JavaMap.put("ECMA-114", "ISO8859_6");
+        fIANA2JavaMap.put("ASMO-708", "ISO8859_6");
+        fIANA2JavaMap.put("ARABIC", "ISO8859_6");
+        fIANA2JavaMap.put("CSISOLATINARABIC", "ISO8859_6");
+
+        fIANA2JavaMap.put("ISO-8859-7", "ISO8859_7");
+        fIANA2JavaMap.put("ISO-IR-126", "ISO8859_7");
+        fIANA2JavaMap.put("ISO_8859-7", "ISO8859_7");
+        fIANA2JavaMap.put("ELOT_928", "ISO8859_7");
+        fIANA2JavaMap.put("ECMA-118", "ISO8859_7");
+        fIANA2JavaMap.put("GREEK", "ISO8859_7");
+        fIANA2JavaMap.put("CSISOLATINGREEK", "ISO8859_7");
+        fIANA2JavaMap.put("GREEK8", "ISO8859_7");
+
+        fIANA2JavaMap.put("ISO-8859-8", "ISO8859_8");
+        fIANA2JavaMap.put("ISO-8859-8-I", "ISO8859_8"); // added since this encoding only differs w.r.t. presentation
+        fIANA2JavaMap.put("ISO-IR-138", "ISO8859_8");
+        fIANA2JavaMap.put("ISO_8859-8", "ISO8859_8");
+        fIANA2JavaMap.put("HEBREW", "ISO8859_8");
+        fIANA2JavaMap.put("CSISOLATINHEBREW", "ISO8859_8");
+
+        fIANA2JavaMap.put("ISO-8859-9", "ISO8859_9");
+        fIANA2JavaMap.put("ISO-IR-148", "ISO8859_9");
+        fIANA2JavaMap.put("ISO_8859-9", "ISO8859_9");
+        fIANA2JavaMap.put("LATIN5", "ISO8859_9");
+        fIANA2JavaMap.put("CSISOLATIN5", "ISO8859_9");
+        fIANA2JavaMap.put("L5", "ISO8859_9");
+
+        fIANA2JavaMap.put("ISO-8859-13", "ISO8859_13");
+
+        fIANA2JavaMap.put("ISO-8859-15", "ISO8859_15_FDIS");
+        fIANA2JavaMap.put("ISO_8859-15", "ISO8859_15_FDIS");
+        fIANA2JavaMap.put("LATIN-9", "ISO8859_15_FDIS");
+
+        fIANA2JavaMap.put("KOI8-R", "KOI8_R");
+        fIANA2JavaMap.put("CSKOI8R", "KOI8_R");
+        fIANA2JavaMap.put("US-ASCII", "ASCII");
+        fIANA2JavaMap.put("ISO-IR-6", "ASCII");
+        fIANA2JavaMap.put("ANSI_X3.4-1968", "ASCII");
+        fIANA2JavaMap.put("ANSI_X3.4-1986", "ASCII");
+        fIANA2JavaMap.put("ISO_646.IRV:1991", "ASCII");
+        fIANA2JavaMap.put("ASCII", "ASCII");
+        fIANA2JavaMap.put("CSASCII", "ASCII");
+        fIANA2JavaMap.put("ISO646-US", "ASCII");
+        fIANA2JavaMap.put("US", "ASCII");
+        fIANA2JavaMap.put("IBM367", "ASCII");
+        fIANA2JavaMap.put("CP367", "ASCII");
+        fIANA2JavaMap.put("UTF-8", "UTF8");
+        fIANA2JavaMap.put("UTF-16", "UTF-16");
+        fIANA2JavaMap.put("UTF-16BE", "UnicodeBig");
+        fIANA2JavaMap.put("UTF-16LE", "UnicodeLittle");
+
+        // support for 1047, as proposed to be added to the 
+        // IANA registry in 
+        // http://lists.w3.org/Archives/Public/ietf-charset/2002JulSep/0049.html
+        fIANA2JavaMap.put("IBM-1047", "Cp1047");
+        fIANA2JavaMap.put("IBM1047", "Cp1047");
+        fIANA2JavaMap.put("CP1047", "Cp1047");
+
+        // Adding new aliases as proposed in
+        // http://lists.w3.org/Archives/Public/ietf-charset/2002JulSep/0058.html
+        fIANA2JavaMap.put("IBM-37", "CP037");
+        fIANA2JavaMap.put("IBM-273", "CP273");
+        fIANA2JavaMap.put("IBM-277", "CP277");
+        fIANA2JavaMap.put("IBM-278", "CP278");
+        fIANA2JavaMap.put("IBM-280", "CP280");
+        fIANA2JavaMap.put("IBM-284", "CP284");
+        fIANA2JavaMap.put("IBM-285", "CP285");
+        fIANA2JavaMap.put("IBM-290", "CP290");
+        fIANA2JavaMap.put("IBM-297", "CP297");
+        fIANA2JavaMap.put("IBM-420", "CP420");
+        fIANA2JavaMap.put("IBM-424", "CP424");
+        fIANA2JavaMap.put("IBM-437", "CP437");
+        fIANA2JavaMap.put("IBM-500", "CP500");
+        fIANA2JavaMap.put("IBM-775", "CP775");
+        fIANA2JavaMap.put("IBM-850", "CP850");
+        fIANA2JavaMap.put("IBM-852", "CP852");
+        fIANA2JavaMap.put("IBM-855", "CP855");
+        fIANA2JavaMap.put("IBM-857", "CP857");
+        fIANA2JavaMap.put("IBM-858", "CP858");
+        fIANA2JavaMap.put("IBM-860", "CP860");
+        fIANA2JavaMap.put("IBM-861", "CP861");
+        fIANA2JavaMap.put("IBM-862", "CP862");
+        fIANA2JavaMap.put("IBM-863", "CP863");
+        fIANA2JavaMap.put("IBM-864", "CP864");
+        fIANA2JavaMap.put("IBM-865", "CP865");
+        fIANA2JavaMap.put("IBM-866", "CP866");
+        fIANA2JavaMap.put("IBM-868", "CP868");
+        fIANA2JavaMap.put("IBM-869", "CP869");
+        fIANA2JavaMap.put("IBM-870", "CP870");
+        fIANA2JavaMap.put("IBM-871", "CP871");
+        fIANA2JavaMap.put("IBM-918", "CP918");
+        fIANA2JavaMap.put("IBM-924", "CP924");
+        fIANA2JavaMap.put("IBM-1026", "CP1026");
+        fIANA2JavaMap.put("IBM-1140", "Cp1140");
+        fIANA2JavaMap.put("IBM-1141", "Cp1141");
+        fIANA2JavaMap.put("IBM-1142", "Cp1142");
+        fIANA2JavaMap.put("IBM-1143", "Cp1143");
+        fIANA2JavaMap.put("IBM-1144", "Cp1144");
+        fIANA2JavaMap.put("IBM-1145", "Cp1145");
+        fIANA2JavaMap.put("IBM-1146", "Cp1146");
+        fIANA2JavaMap.put("IBM-1147", "Cp1147");
+        fIANA2JavaMap.put("IBM-1148", "Cp1148");
+        fIANA2JavaMap.put("IBM-1149", "Cp1149");
+        fIANA2JavaMap.put("IBM-819", "ISO8859_1");
+        fIANA2JavaMap.put("IBM-367", "ASCII");
+
+        // REVISIT:
+        //   j:CNS11643 -> EUC-TW?
+        //   ISO-2022-CN? ISO-2022-CN-EXT?
+
+        // add Java to IANA encoding mappings
+        //fJava2IANAMap.put("8859_1",    "US-ASCII"); // ?
+        fJava2IANAMap.put("ISO8859_1", "ISO-8859-1");
+        fJava2IANAMap.put("ISO8859_2", "ISO-8859-2");
+        fJava2IANAMap.put("ISO8859_3", "ISO-8859-3");
+        fJava2IANAMap.put("ISO8859_4", "ISO-8859-4");
+        fJava2IANAMap.put("ISO8859_5", "ISO-8859-5");
+        fJava2IANAMap.put("ISO8859_6", "ISO-8859-6");
+        fJava2IANAMap.put("ISO8859_7", "ISO-8859-7");
+        fJava2IANAMap.put("ISO8859_8", "ISO-8859-8");
+        fJava2IANAMap.put("ISO8859_9", "ISO-8859-9");
+        fJava2IANAMap.put("ISO8859_13", "ISO-8859-13");
+        fJava2IANAMap.put("ISO8859_15", "ISO-8859-15");
+        fJava2IANAMap.put("ISO8859_15_FDIS", "ISO-8859-15");
+        fJava2IANAMap.put("Big5", "BIG5");
+        fJava2IANAMap.put("CP037", "EBCDIC-CP-US");
+        fJava2IANAMap.put("CP273", "IBM273");
+        fJava2IANAMap.put("CP277", "EBCDIC-CP-DK");
+        fJava2IANAMap.put("CP278", "EBCDIC-CP-FI");
+        fJava2IANAMap.put("CP280", "EBCDIC-CP-IT");
+        fJava2IANAMap.put("CP284", "EBCDIC-CP-ES");
+        fJava2IANAMap.put("CP285", "EBCDIC-CP-GB");
+        fJava2IANAMap.put("CP290", "EBCDIC-JP-KANA");
+        fJava2IANAMap.put("CP297", "EBCDIC-CP-FR");
+        fJava2IANAMap.put("CP420", "EBCDIC-CP-AR1");
+        fJava2IANAMap.put("CP424", "EBCDIC-CP-HE");
+        fJava2IANAMap.put("CP437", "IBM437");
+        fJava2IANAMap.put("CP500", "EBCDIC-CP-CH");
+        fJava2IANAMap.put("CP775", "IBM775");
+        fJava2IANAMap.put("CP850", "IBM850");
+        fJava2IANAMap.put("CP852", "IBM852");
+        fJava2IANAMap.put("CP855", "IBM855");
+        fJava2IANAMap.put("CP857", "IBM857");
+        fJava2IANAMap.put("CP858", "IBM00858");
+        fJava2IANAMap.put("CP860", "IBM860");
+        fJava2IANAMap.put("CP861", "IBM861");
+        fJava2IANAMap.put("CP862", "IBM862");
+        fJava2IANAMap.put("CP863", "IBM863");
+        fJava2IANAMap.put("CP864", "IBM864");
+        fJava2IANAMap.put("CP865", "IBM865");
+        fJava2IANAMap.put("CP866", "IBM866");
+        fJava2IANAMap.put("CP868", "IBM868");
+        fJava2IANAMap.put("CP869", "IBM869");
+        fJava2IANAMap.put("CP870", "EBCDIC-CP-ROECE");
+        fJava2IANAMap.put("CP871", "EBCDIC-CP-IS");
+        fJava2IANAMap.put("CP918", "EBCDIC-CP-AR2");
+        fJava2IANAMap.put("CP924", "IBM00924");
+        fJava2IANAMap.put("CP1026", "IBM1026");
+        fJava2IANAMap.put("Cp01140", "IBM01140");
+        fJava2IANAMap.put("Cp01141", "IBM01141");
+        fJava2IANAMap.put("Cp01142", "IBM01142");
+        fJava2IANAMap.put("Cp01143", "IBM01143");
+        fJava2IANAMap.put("Cp01144", "IBM01144");
+        fJava2IANAMap.put("Cp01145", "IBM01145");
+        fJava2IANAMap.put("Cp01146", "IBM01146");
+        fJava2IANAMap.put("Cp01147", "IBM01147");
+        fJava2IANAMap.put("Cp01148", "IBM01148");
+        fJava2IANAMap.put("Cp01149", "IBM01149");
+        fJava2IANAMap.put("EUCJIS", "EUC-JP");
+        fJava2IANAMap.put("KS_C_5601-1987", "KS_C_5601-1987");
+        fJava2IANAMap.put("GB2312", "GB2312");
+        fJava2IANAMap.put("ISO2022KR", "ISO-2022-KR");
+        fJava2IANAMap.put("ISO2022CN", "ISO-2022-CN");
+        fJava2IANAMap.put("JIS", "ISO-2022-JP");
+        fJava2IANAMap.put("KOI8_R", "KOI8-R");
+        fJava2IANAMap.put("KSC5601", "EUC-KR");
+        fJava2IANAMap.put("GB18030", "GB18030");
+        fJava2IANAMap.put("GBK", "GBK");
+        fJava2IANAMap.put("SJIS", "SHIFT_JIS");
+        fJava2IANAMap.put("MS932", "WINDOWS-31J");
+        fJava2IANAMap.put("UTF8", "UTF-8");
+        fJava2IANAMap.put("Unicode", "UTF-16");
+        fJava2IANAMap.put("UnicodeBig", "UTF-16BE");
+        fJava2IANAMap.put("UnicodeLittle", "UTF-16LE");
+        fJava2IANAMap.put("JIS0201", "X0201");
+        fJava2IANAMap.put("JIS0208", "X0208");
+        fJava2IANAMap.put("JIS0212", "ISO-IR-159");
+
+        // proposed addition (see above for details):
+        fJava2IANAMap.put("CP1047", "IBM1047");
+
+    } // <clinit>()
+
+    //
+    // Constructors
+    //
+
+    /**
+     * Default constructor.
+     */
+    public EncodingMap() {
+    }
+
+    //
+    // Public static methods
+    //
+
+    /**
+     * Adds an IANA to Java encoding name mapping.
+     *
+     * @param ianaEncoding The IANA encoding name.
+     * @param javaEncoding The Java encoding name.
+     */
+    public static void putIANA2JavaMapping(String ianaEncoding,
+                                           String javaEncoding) {
+        fIANA2JavaMap.put(ianaEncoding, javaEncoding);
+    } // putIANA2JavaMapping(String,String)
+
+    /**
+     * Returns the Java encoding name for the specified IANA encoding name.
+     *
+     * @param ianaEncoding The IANA encoding name.
+     */
+    public static String getIANA2JavaMapping(String ianaEncoding) {
+        return (String) fIANA2JavaMap.get(ianaEncoding);
+    } // getIANA2JavaMapping(String):String
+
+    /**
+     * Removes an IANA to Java encoding name mapping.
+     *
+     * @param ianaEncoding The IANA encoding name.
+     */
+    public static String removeIANA2JavaMapping(String ianaEncoding) {
+        return (String) fIANA2JavaMap.remove(ianaEncoding);
+    } // removeIANA2JavaMapping(String):String
+
+    /**
+     * Adds a Java to IANA encoding name mapping.
+     *
+     * @param javaEncoding The Java encoding name.
+     * @param ianaEncoding The IANA encoding name.
+     */
+    public static void putJava2IANAMapping(String javaEncoding,
+                                           String ianaEncoding) {
+        fJava2IANAMap.put(javaEncoding, ianaEncoding);
+    } // putJava2IANAMapping(String,String)
+
+    /**
+     * Returns the IANA encoding name for the specified Java encoding name.
+     *
+     * @param javaEncoding The Java encoding name.
+     */
+    public static String getJava2IANAMapping(String javaEncoding) {
+        return (String) fJava2IANAMap.get(javaEncoding);
+    } // getJava2IANAMapping(String):String
+
+    /**
+     * Removes a Java to IANA encoding name mapping.
+     *
+     * @param javaEncoding The Java encoding name.
+     */
+    public static String removeJava2IANAMapping(String javaEncoding) {
+        return (String) fJava2IANAMap.remove(javaEncoding);
+    } // removeJava2IANAMapping
+
+} // class EncodingMap

Added: jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/NamespaceSupport.java
URL: http://svn.apache.org/viewvc/jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/NamespaceSupport.java?rev=1512568&view=auto
==============================================================================
--- jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/NamespaceSupport.java (added)
+++ jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/NamespaceSupport.java Sat Aug 10 05:53:42 2013
@@ -0,0 +1,311 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.jackrabbit.vault.util.xml.xerces.util;
+
+import java.util.Enumeration;
+import java.util.NoSuchElementException;
+
+import org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext;
+
+/**
+ * Namespace support for XML document handlers. This class doesn't
+ * perform any error checking and assumes that all strings passed
+ * as arguments to methods are unique symbols. The SymbolTable class
+ * can be used for this purpose.
+ *
+ * @author Andy Clark, IBM
+ * @version $Id$
+ */
+public class NamespaceSupport implements NamespaceContext {
+
+    //
+    // Data
+    //
+
+    /**
+     * Namespace binding information. This array is composed of a
+     * series of tuples containing the namespace binding information:
+     * &lt;prefix, uri&gt;. The default size can be set to anything
+     * as long as it is a power of 2 greater than 1.
+     *
+     * @see #fNamespaceSize
+     * @see #fContext
+     */
+    protected String[] fNamespace = new String[16 * 2];
+
+    /**
+     * The top of the namespace information array.
+     */
+    protected int fNamespaceSize;
+
+    // NOTE: The constructor depends on the initial context size 
+    //       being at least 1. -Ac
+
+    /**
+     * Context indexes. This array contains indexes into the namespace
+     * information array. The index at the current context is the start
+     * index of declared namespace bindings and runs to the size of the
+     * namespace information array.
+     *
+     * @see #fNamespaceSize
+     */
+    protected int[] fContext = new int[8];
+
+    /**
+     * The current context.
+     */
+    protected int fCurrentContext;
+
+    protected String[] fPrefixes = new String[16];
+
+    //
+    // Constructors
+    //
+
+    /**
+     * Default constructor.
+     */
+    public NamespaceSupport() {
+    } // <init>()
+
+    /**
+     * Constructs a namespace context object and initializes it with
+     * the prefixes declared in the specified context.
+     */
+    public NamespaceSupport(NamespaceContext context) {
+        pushContext();
+        // copy declaration in the context
+        Enumeration prefixes = context.getAllPrefixes();
+        while (prefixes.hasMoreElements()) {
+            String prefix = (String) prefixes.nextElement();
+            String uri = context.getURI(prefix);
+            declarePrefix(prefix, uri);
+        }
+    } // <init>(NamespaceContext)
+
+
+    //
+    // Public methods
+    //
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#reset()
+     */
+    public void reset() {
+
+        // reset namespace and context info
+        fNamespaceSize = 0;
+        fCurrentContext = 0;
+        fContext[fCurrentContext] = fNamespaceSize;
+
+        // bind "xml" prefix to the XML uri
+        fNamespace[fNamespaceSize++] = XMLSymbols.PREFIX_XML;
+        fNamespace[fNamespaceSize++] = NamespaceContext.XML_URI;
+        // bind "xmlns" prefix to the XMLNS uri
+        fNamespace[fNamespaceSize++] = XMLSymbols.PREFIX_XMLNS;
+        fNamespace[fNamespaceSize++] = NamespaceContext.XMLNS_URI;
+        ++fCurrentContext;
+
+    } // reset(SymbolTable)
+
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#pushContext()
+     */
+    public void pushContext() {
+
+        // extend the array, if necessary
+        if (fCurrentContext + 1 == fContext.length) {
+            int[] contextarray = new int[fContext.length * 2];
+            System.arraycopy(fContext, 0, contextarray, 0, fContext.length);
+            fContext = contextarray;
+        }
+
+        // push context
+        fContext[++fCurrentContext] = fNamespaceSize;
+
+    } // pushContext()
+
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#popContext()
+     */
+    public void popContext() {
+        fNamespaceSize = fContext[fCurrentContext--];
+    } // popContext()
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#declarePrefix(String, String)
+     */
+    public boolean declarePrefix(String prefix, String uri) {
+        // ignore "xml" and "xmlns" prefixes
+        if (prefix == XMLSymbols.PREFIX_XML || prefix == XMLSymbols.PREFIX_XMLNS) {
+            return false;
+        }
+
+        // see if prefix already exists in current context
+        for (int i = fNamespaceSize; i > fContext[fCurrentContext]; i -= 2) {
+            if (fNamespace[i - 2] == prefix) {
+                // REVISIT: [Q] Should the new binding override the
+                //          previously declared binding or should it
+                //          it be ignored? -Ac
+                // NOTE:    The SAX2 "NamespaceSupport" helper allows
+                //          re-bindings with the new binding overwriting
+                //          the previous binding. -Ac
+                fNamespace[i - 1] = uri;
+                return true;
+            }
+        }
+
+        // resize array, if needed
+        if (fNamespaceSize == fNamespace.length) {
+            String[] namespacearray = new String[fNamespaceSize * 2];
+            System.arraycopy(fNamespace, 0, namespacearray, 0, fNamespaceSize);
+            fNamespace = namespacearray;
+        }
+
+        // bind prefix to uri in current context
+        fNamespace[fNamespaceSize++] = prefix;
+        fNamespace[fNamespaceSize++] = uri;
+
+        return true;
+
+    } // declarePrefix(String,String):boolean
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#getURI(String)
+     */
+    public String getURI(String prefix) {
+
+        // find prefix in current context
+        for (int i = fNamespaceSize; i > 0; i -= 2) {
+            if (fNamespace[i - 2] == prefix) {
+                return fNamespace[i - 1];
+            }
+        }
+
+        // prefix not found
+        return null;
+
+    } // getURI(String):String
+
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#getPrefix(String)
+     */
+    public String getPrefix(String uri) {
+
+        // find uri in current context
+        for (int i = fNamespaceSize; i > 0; i -= 2) {
+            if (fNamespace[i - 1] == uri) {
+                if (getURI(fNamespace[i - 2]) == uri)
+                    return fNamespace[i - 2];
+            }
+        }
+
+        // uri not found
+        return null;
+
+    } // getPrefix(String):String
+
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#getDeclaredPrefixCount()
+     */
+    public int getDeclaredPrefixCount() {
+        return (fNamespaceSize - fContext[fCurrentContext]) / 2;
+    } // getDeclaredPrefixCount():int
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#getDeclaredPrefixAt(int)
+     */
+    public String getDeclaredPrefixAt(int index) {
+        return fNamespace[fContext[fCurrentContext] + index * 2];
+    } // getDeclaredPrefixAt(int):String
+
+    /**
+     * @see org.apache.jackrabbit.vault.util.xml.xerces.xni.NamespaceContext#getAllPrefixes()
+     */
+    public Enumeration getAllPrefixes() {
+        int count = 0;
+        if (fPrefixes.length < (fNamespace.length / 2)) {
+            // resize prefix array          
+            String[] prefixes = new String[fNamespaceSize];
+            fPrefixes = prefixes;
+        }
+        String prefix = null;
+        boolean unique = true;
+        for (int i = 2; i < (fNamespaceSize - 2); i += 2) {
+            prefix = fNamespace[i + 2];
+            for (int k = 0; k < count; k++) {
+                if (fPrefixes[k] == prefix) {
+                    unique = false;
+                    break;
+                }
+            }
+            if (unique) {
+                fPrefixes[count++] = prefix;
+            }
+            unique = true;
+        }
+        return new Prefixes(fPrefixes, count);
+    }
+
+    protected final class Prefixes implements Enumeration {
+        private String[] prefixes;
+        private int counter = 0;
+        private int size = 0;
+
+        /**
+         * Constructor for Prefixes.
+         */
+        public Prefixes(String[] prefixes, int size) {
+            this.prefixes = prefixes;
+            this.size = size;
+        }
+
+        /**
+         * @see java.util.Enumeration#hasMoreElements()
+         */
+        public boolean hasMoreElements() {
+            return (counter < size);
+        }
+
+        /**
+         * @see java.util.Enumeration#nextElement()
+         */
+        public Object nextElement() {
+            if (counter < size) {
+                return fPrefixes[counter++];
+            }
+            throw new NoSuchElementException("Illegal access to Namespace prefixes enumeration.");
+        }
+
+        public String toString() {
+            StringBuffer buf = new StringBuffer();
+            for (int i = 0; i < size; i++) {
+                buf.append(prefixes[i]);
+                buf.append(" ");
+            }
+
+            return buf.toString(); 
+        }
+
+}
+
+} // class NamespaceSupport

Added: jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/SymbolTable.java
URL: http://svn.apache.org/viewvc/jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/SymbolTable.java?rev=1512568&view=auto
==============================================================================
--- jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/SymbolTable.java (added)
+++ jackrabbit/commons/filevault/trunk/vault-core/src/main/java/org/apache/jackrabbit/vault/util/xml/xerces/util/SymbolTable.java Sat Aug 10 05:53:42 2013
@@ -0,0 +1,311 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.jackrabbit.vault.util.xml.xerces.util;
+
+/**
+ * This class is a symbol table implementation that guarantees that
+ * strings used as identifiers are unique references. Multiple calls
+ * to <code>addSymbol</code> will always return the same string
+ * reference.
+ * <p/>
+ * The symbol table performs the same task as <code>String.intern()</code>
+ * with the following differences:
+ * <ul>
+ * <li>
+ * A new string object does not need to be created in order to
+ * retrieve a unique reference. Symbols can be added by using
+ * a series of characters in a character array.
+ * </li>
+ * <li>
+ * Users of the symbol table can provide their own symbol hashing
+ * implementation. For example, a simple string hashing algorithm
+ * may fail to produce a balanced set of hashcodes for symbols
+ * that are <em>mostly</em> unique. Strings with similar leading
+ * characters are especially prone to this poor hashing behavior.
+ * </li>
+ * </ul>
+ *
+ * @author Andy Clark
+ * @version $Id$
+ * @see SymbolHash
+ */
+public class SymbolTable {
+
+    //
+    // Constants
+    //
+
+    /**
+     * Default table size.
+     */
+    protected static final int TABLE_SIZE = 101;
+
+    //
+    // Data
+    //
+
+    /**
+     * Buckets.
+     */
+    protected Entry[] fBuckets = null;
+
+    // actual table size
+    protected int fTableSize;
+
+    //
+    // Constructors
+    //
+
+    /**
+     * Constructs a symbol table with a default number of buckets.
+     */
+    public SymbolTable() {
+        this(TABLE_SIZE);
+    }
+
+    /**
+     * Constructs a symbol table with a specified number of buckets.
+     */
+    public SymbolTable(int tableSize) {
+        fTableSize = tableSize;
+        fBuckets = new Entry[fTableSize];
+    }
+
+    //
+    // Public methods
+    //
+
+    /**
+     * Adds the specified symbol to the symbol table and returns a
+     * reference to the unique symbol. If the symbol already exists,
+     * the previous symbol reference is returned instead, in order
+     * guarantee that symbol references remain unique.
+     *
+     * @param symbol The new symbol.
+     */
+    public String addSymbol(String symbol) {
+
+        // search for identical symbol
+        int bucket = hash(symbol) % fTableSize;
+        int length = symbol.length();
+        OUTER:
+        for (Entry entry = fBuckets[bucket]; entry != null; entry = entry.next) {
+            if (length == entry.characters.length) {
+                for (int i = 0; i < length; i++) {
+                    if (symbol.charAt(i) != entry.characters[i]) {
+                        continue OUTER;
+                    }
+                }
+                return entry.symbol;
+            }
+        }
+
+        // create new entry
+        Entry entry = new Entry(symbol, fBuckets[bucket]);
+        fBuckets[bucket] = entry;
+        return entry.symbol;
+
+    } // addSymbol(String):String
+
+    /**
+     * Adds the specified symbol to the symbol table and returns a
+     * reference to the unique symbol. If the symbol already exists,
+     * the previous symbol reference is returned instead, in order
+     * guarantee that symbol references remain unique.
+     *
+     * @param buffer The buffer containing the new symbol.
+     * @param offset The offset into the buffer of the new symbol.
+     * @param length The length of the new symbol in the buffer.
+     */
+    public String addSymbol(char[] buffer, int offset, int length) {
+
+        // search for identical symbol
+        int bucket = hash(buffer, offset, length) % fTableSize;
+        OUTER:
+        for (Entry entry = fBuckets[bucket]; entry != null; entry = entry.next) {
+            if (length == entry.characters.length) {
+                for (int i = 0; i < length; i++) {
+                    if (buffer[offset + i] != entry.characters[i]) {
+                        continue OUTER;
+                    }
+                }
+                return entry.symbol;
+            }
+        }
+
+        // add new entry
+        Entry entry = new Entry(buffer, offset, length, fBuckets[bucket]);
+        fBuckets[bucket] = entry;
+        return entry.symbol;
+
+    } // addSymbol(char[],int,int):String
+
+    /**
+     * Returns a hashcode value for the specified symbol. The value
+     * returned by this method must be identical to the value returned
+     * by the <code>hash(char[],int,int)</code> method when called
+     * with the character array that comprises the symbol string.
+     *
+     * @param symbol The symbol to hash.
+     */
+    public int hash(String symbol) {
+
+        int code = 0;
+        int length = symbol.length();
+        for (int i = 0; i < length; i++) {
+            code = code * 37 + symbol.charAt(i);
+        }
+        return code & 0x7FFFFFF;
+
+    } // hash(String):int
+
+    /**
+     * Returns a hashcode value for the specified symbol information.
+     * The value returned by this method must be identical to the value
+     * returned by the <code>hash(String)</code> method when called
+     * with the string object created from the symbol information.
+     *
+     * @param buffer The character buffer containing the symbol.
+     * @param offset The offset into the character buffer of the start
+     *               of the symbol.
+     * @param length The length of the symbol.
+     */
+    public int hash(char[] buffer, int offset, int length) {
+
+        int code = 0;
+        for (int i = 0; i < length; i++) {
+            code = code * 37 + buffer[offset + i];
+        }
+        return code & 0x7FFFFFF;
+
+    } // hash(char[],int,int):int
+
+    /**
+     * Returns true if the symbol table already contains the specified
+     * symbol.
+     *
+     * @param symbol The symbol to look for.
+     */
+    public boolean containsSymbol(String symbol) {
+
+        // search for identical symbol
+        int bucket = hash(symbol) % fTableSize;
+        int length = symbol.length();
+        OUTER:
+        for (Entry entry = fBuckets[bucket]; entry != null; entry = entry.next) {
+            if (length == entry.characters.length) {
+                for (int i = 0; i < length; i++) {
+                    if (symbol.charAt(i) != entry.characters[i]) {
+                        continue OUTER;
+                    }
+                }
+                return true;
+            }
+        }
+
+        return false;
+
+    } // containsSymbol(String):boolean
+
+    /**
+     * Returns true if the symbol table already contains the specified
+     * symbol.
+     *
+     * @param buffer The buffer containing the symbol to look for.
+     * @param offset The offset into the buffer.
+     * @param length The length of the symbol in the buffer.
+     */
+    public boolean containsSymbol(char[] buffer, int offset, int length) {
+
+        // search for identical symbol
+        int bucket = hash(buffer, offset, length) % fTableSize;
+        OUTER:
+        for (Entry entry = fBuckets[bucket]; entry != null; entry = entry.next) {
+            if (length == entry.characters.length) {
+                for (int i = 0; i < length; i++) {
+                    if (buffer[offset + i] != entry.characters[i]) {
+                        continue OUTER;
+                    }
+                }
+                return true;
+            }
+        }
+
+        return false;
+
+    } // containsSymbol(char[],int,int):boolean
+
+    //
+    // Classes
+    //
+
+    /**
+     * This class is a symbol table entry. Each entry acts as a node
+     * in a linked list.
+     */
+    protected static final class Entry {
+
+        //
+        // Data
+        //
+
+        /**
+         * Symbol.
+         */
+        public String symbol;
+
+        /**
+         * Symbol characters. This information is duplicated here for
+         * comparison performance.
+         */
+        public char[] characters;
+
+        /**
+         * The next entry.
+         */
+        public Entry next;
+
+        //
+        // Constructors
+        //
+
+        /**
+         * Constructs a new entry from the specified symbol and next entry
+         * reference.
+         */
+        public Entry(String symbol, Entry next) {
+            this.symbol = symbol.intern();
+            characters = new char[symbol.length()];
+            symbol.getChars(0, characters.length, characters, 0);
+            this.next = next;
+        }
+
+        /**
+         * Constructs a new entry from the specified symbol information and
+         * next entry reference.
+         */
+        public Entry(char[] ch, int offset, int length, Entry next) {
+            characters = new char[length];
+            System.arraycopy(ch, offset, characters, 0, length);
+            symbol = new String(characters).intern();
+            this.next = next;
+        }
+
+    } // class Entry
+
+} // class SymbolTable



Mime
View raw message