001: /*
002: * Licensed to the Apache Software Foundation (ASF) under one or more
003: * contributor license agreements. See the NOTICE file distributed with
004: * this work for additional information regarding copyright ownership.
005: * The ASF licenses this file to You under the Apache License, Version 2.0
006: * (the "License"); you may not use this file except in compliance with
007: * the License. You may obtain a copy of the License at
008: *
009: * http://www.apache.org/licenses/LICENSE-2.0
010: *
011: * Unless required by applicable law or agreed to in writing, software
012: * distributed under the License is distributed on an "AS IS" BASIS,
013: * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
014: * See the License for the specific language governing permissions and
015: * limitations under the License.
016: */
017:
018: package org.apache.harmony.niochar.charset.additional;
019:
020: import java.nio.charset.Charset;
021: import java.nio.charset.CoderResult;
022: import java.nio.charset.CharsetDecoder;
023: import java.nio.charset.CharsetEncoder;
024: import java.nio.CharBuffer;
025: import java.nio.ByteBuffer;
026:
027: import org.apache.harmony.nio.AddressUtil;
028:
029: public class IBM_Thai extends Charset {
030:
/**
 * Creates the charset by passing the given name and aliases straight to
 * the {@link Charset} constructor.
 *
 * @param csName  canonical name to register this charset under
 * @param aliases alias names for this charset
 */
public IBM_Thai(String csName, String[] aliases) {
    super (csName, aliases);
}
034:
035: public boolean contains(Charset cs) {
036: return cs.name().equalsIgnoreCase("IBM-Thai")
037: || cs.name().equalsIgnoreCase("IBM367")
038: || cs.name().equalsIgnoreCase("US-ASCII");
039: }
040:
041: public CharsetDecoder newDecoder() {
042: return new Decoder(this );
043: }
044:
045: public CharsetEncoder newEncoder() {
046: return new Encoder(this );
047: }
048:
049: private static final class Decoder extends CharsetDecoder {
/**
 * Creates a decoder for the given charset. Both the average and the
 * maximum chars-per-byte ratios handed to {@link CharsetDecoder} are 1,
 * matching the one-char-per-byte loops in {@code decodeLoop}.
 *
 * @param cs the charset this decoder belongs to
 */
private Decoder(Charset cs) {
    super (cs, 1, 1);

}
054:
/**
 * Native decoding routine; its implementation is not visible in this
 * file. {@code decodeLoop} calls it only when the input buffer is direct
 * and the output buffer is array-backed.
 *
 * @param array       backing array of the output char buffer
 * @param arrPosition index into {@code array} of the first char to write
 *                    (array offset plus buffer position at the call site)
 * @param remaining   number of bytes to process; the caller caps it at the
 *                    room left in the output buffer
 * @param outAddr     address obtained from
 *                    {@code AddressUtil.getDirectBufferAddress} for the
 *                    direct input buffer (despite the "out" in the name)
 * @param absolutePos position of the input buffer at the time of the call
 * @return a count that the caller adds to the positions of both buffers
 *         (presumably the number of bytes decoded; confirm against the
 *         native source)
 */
public native int nDecode(char[] array, int arrPosition,
        int remaining, long outAddr, int absolutePos);
057:
058: protected CoderResult decodeLoop(ByteBuffer bb, CharBuffer cb) {
059: int cbRemaining = cb.remaining();
060: if (bb.isDirect() && bb.hasRemaining() && cb.hasArray()) {
061: int toProceed = bb.remaining();
062: int cbPos = cb.position();
063: int bbPos = bb.position();
064: boolean throwOverflow = false;
065: if (cbRemaining < toProceed) {
066: toProceed = cbRemaining;
067: throwOverflow = true;
068: }
069: int res = nDecode(cb.array(), cb.arrayOffset() + cbPos,
070: toProceed, AddressUtil
071: .getDirectBufferAddress(bb), bbPos);
072: bb.position(bbPos + res);
073: cb.position(cbPos + res);
074: if (throwOverflow)
075: return CoderResult.OVERFLOW;
076: } else {
077: if (bb.hasArray() && cb.hasArray()) {
078: int rem = bb.remaining();
079: rem = cbRemaining >= rem ? rem : cbRemaining;
080: byte[] bArr = bb.array();
081: char[] cArr = cb.array();
082: int bStart = bb.position();
083: int cStart = cb.position();
084: int i;
085: for (i = bStart; i < bStart + rem; i++) {
086: char in = (char) (bArr[i] & 0xFF);
087: if (in >= 4) {
088: int index = (int) in - 4;
089: cArr[cStart++] = (char) arr[index];
090: } else {
091: cArr[cStart++] = (char) (in & 0xFF);
092: }
093: }
094: bb.position(i);
095: cb.position(cStart);
096: if (rem == cbRemaining && bb.hasRemaining())
097: return CoderResult.OVERFLOW;
098: } else {
099: while (bb.hasRemaining()) {
100: if (cbRemaining == 0)
101: return CoderResult.OVERFLOW;
102: char in = (char) (bb.get() & 0xFF);
103: if (in >= 4) {
104: int index = (int) in - 4;
105: cb.put(arr[index]);
106: } else {
107: cb.put((char) (in & 0xFF));
108: }
109: cbRemaining--;
110: }
111: }
112: }
113: return CoderResult.UNDERFLOW;
114: }
115:
/**
 * Decode table for unsigned byte values 4 and above: {@code decodeLoop}
 * maps such a byte {@code b} to {@code arr[b - 4]}. Byte values 0..3 are
 * not stored here; they are copied through as the same code point.
 */
final static char[] arr = { 0x009C, 0x0009, 0x0086, 0x007F,
    0x0097, 0x008D, 0x008E, 0x000B, 0x000C, 0x000D, 0x000E,
    0x000F, 0x0010, 0x0011, 0x0012, 0x0013, 0x009D, 0x0085,
    0x0008, 0x0087, 0x0018, 0x0019, 0x0092, 0x008F, 0x001C,
    0x001D, 0x001E, 0x001F, 0x0080, 0x0081, 0x0082, 0x0083,
    0x0084, 0x000A, 0x0017, 0x001B, 0x0088, 0x0089, 0x008A,
    0x008B, 0x008C, 0x0005, 0x0006, 0x0007, 0x0090, 0x0091,
    0x0016, 0x0093, 0x0094, 0x0095, 0x0096, 0x0004, 0x0098,
    0x0099, 0x009A, 0x009B, 0x0014, 0x0015, 0x009E, 0x001A,
    0x0020, 0x00A0, 0x0E01, 0x0E02, 0x0E03, 0x0E04, 0x0E05,
    0x0E06, 0x0E07, 0x005B, 0x00A2, 0x002E, 0x003C, 0x0028,
    0x002B, 0x007C, 0x0026, 0x0E48, 0x0E08, 0x0E09, 0x0E0A,
    0x0E0B, 0x0E0C, 0x0E0D, 0x0E0E, 0x005D, 0x0021, 0x0024,
    0x002A, 0x0029, 0x003B, 0x00AC, 0x002D, 0x002F, 0x0E0F,
    0x0E10, 0x0E11, 0x0E12, 0x0E13, 0x0E14, 0x0E15, 0x005E,
    0x00A6, 0x002C, 0x0025, 0x005F, 0x003E, 0x003F, 0x0E3F,
    0x0E4E, 0x0E16, 0x0E17, 0x0E18, 0x0E19, 0x0E1A, 0x0E1B,
    0x0E1C, 0x0060, 0x003A, 0x0023, 0x0040, 0x0027, 0x003D,
    0x0022, 0x0E4F, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065,
    0x0066, 0x0067, 0x0068, 0x0069, 0x0E1D, 0x0E1E, 0x0E1F,
    0x0E20, 0x0E21, 0x0E22, 0x0E5A, 0x006A, 0x006B, 0x006C,
    0x006D, 0x006E, 0x006F, 0x0070, 0x0071, 0x0072, 0x0E23,
    0x0E24, 0x0E25, 0x0E26, 0x0E27, 0x0E28, 0x0E5B, 0x007E,
    0x0073, 0x0074, 0x0075, 0x0076, 0x0077, 0x0078, 0x0079,
    0x007A, 0x0E29, 0x0E2A, 0x0E2B, 0x0E2C, 0x0E2D, 0x0E2E,
    0x0E50, 0x0E51, 0x0E52, 0x0E53, 0x0E54, 0x0E55, 0x0E56,
    0x0E57, 0x0E58, 0x0E59, 0x0E2F, 0x0E30, 0x0E31, 0x0E32,
    0x0E33, 0x0E34, 0x007B, 0x0041, 0x0042, 0x0043, 0x0044,
    0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x0E49, 0x0E35,
    0x0E36, 0x0E37, 0x0E38, 0x0E39, 0x007D, 0x004A, 0x004B,
    0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052,
    0x0E3A, 0x0E40, 0x0E41, 0x0E42, 0x0E43, 0x0E44, 0x005C,
    0x0E4A, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058,
    0x0059, 0x005A, 0x0E45, 0x0E46, 0x0E47, 0x0E48, 0x0E49,
    0x0E4A, 0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035,
    0x0036, 0x0037, 0x0038, 0x0039, 0x0E4B, 0x0E4C, 0x0E4D,
    0x0E4B, 0x0E4C, 0x009F };
153: }
154:
155: private static final class Encoder extends CharsetEncoder {
/**
 * Creates an encoder for the given charset. Both the average and the
 * maximum bytes-per-char ratios handed to {@link CharsetEncoder} are 1,
 * matching the one-byte-per-char loops in {@code encodeLoop}.
 *
 * @param cs the charset this encoder belongs to
 */
private Encoder(Charset cs) {
    super (cs, 1, 1);
}
159:
/**
 * Native encoding routine; its implementation is not visible in this
 * file. {@code encodeLoop} calls it only when the output buffer is direct
 * and the input buffer is array-backed.
 *
 * @param outAddr     address obtained from
 *                    {@code AddressUtil.getDirectBufferAddress} for the
 *                    direct output buffer
 * @param absolutePos position of the output buffer at the time of the call
 * @param array       backing array of the input char buffer
 * @param arrPosition index into {@code array} of the first char to read
 *                    (array offset plus buffer position at the call site)
 * @param res         two-element in/out array. On entry {@code res[0]} is
 *                    the number of chars to process and {@code res[1]} is
 *                    0. On return the caller reads {@code res[0]} as
 *                    follows: a positive value is added to both buffer
 *                    positions; a value {@code <= 0} is subtracted from
 *                    them (i.e. its magnitude is the advance). In the
 *                    latter case a non-zero {@code res[1]} is reported as
 *                    an error: negative means malformed input of length
 *                    {@code -res[1]}, positive means unmappable input of
 *                    length {@code res[1]}.
 */
private native void nEncode(long outAddr, int absolutePos,
        char[] array, int arrPosition, int[] res);
162:
163: protected CoderResult encodeLoop(CharBuffer cb, ByteBuffer bb) {
164: int bbRemaining = bb.remaining();
165: if (bb.isDirect() && cb.hasRemaining() && cb.hasArray()) {
166: int toProceed = cb.remaining();
167: int cbPos = cb.position();
168: int bbPos = bb.position();
169: boolean throwOverflow = false;
170: if (bbRemaining < toProceed) {
171: toProceed = bbRemaining;
172: throwOverflow = true;
173: }
174: int[] res = { toProceed, 0 };
175: nEncode(AddressUtil.getDirectBufferAddress(bb), bbPos,
176: cb.array(), cb.arrayOffset() + cbPos, res);
177: if (res[0] <= 0) {
178: bb.position(bbPos - res[0]);
179: cb.position(cbPos - res[0]);
180: if (res[1] != 0) {
181: if (res[1] < 0)
182: return CoderResult
183: .malformedForLength(-res[1]);
184: else
185: return CoderResult
186: .unmappableForLength(res[1]);
187: }
188: } else {
189: bb.position(bbPos + res[0]);
190: cb.position(cbPos + res[0]);
191: if (throwOverflow)
192: return CoderResult.OVERFLOW;
193: }
194: } else {
195: if (bb.hasArray() && cb.hasArray()) {
196: byte[] byteArr = bb.array();
197: char[] charArr = cb.array();
198: int rem = cb.remaining();
199: int byteArrStart = bb.position();
200: rem = bbRemaining <= rem ? bbRemaining : rem;
201: int x;
202: for (x = cb.position(); x < cb.position() + rem; x++) {
203: char c = charArr[x];
204: if (c > (char) 0x0E5B) {
205: if (c >= 0xD800 && c <= 0xDFFF) {
206: if (x + 1 < cb.limit()) {
207: char c1 = charArr[x + 1];
208: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
209: cb.position(x);
210: bb.position(byteArrStart);
211: return CoderResult
212: .unmappableForLength(2);
213: }
214: } else {
215: cb.position(x);
216: bb.position(byteArrStart);
217: return CoderResult.UNDERFLOW;
218: }
219: cb.position(x);
220: bb.position(byteArrStart);
221: return CoderResult
222: .malformedForLength(1);
223: }
224: cb.position(x);
225: bb.position(byteArrStart);
226: return CoderResult.unmappableForLength(1);
227: } else {
228: if (c < 0x04) {
229: byteArr[byteArrStart++] = (byte) c;
230: } else {
231: int index = (int) c >> 8;
232: index = encodeIndex[index];
233: if (index < 0) {
234: cb.position(x);
235: bb.position(byteArrStart);
236: return CoderResult
237: .unmappableForLength(1);
238: }
239: index <<= 8;
240: index += (int) c & 0xFF;
241: if ((byte) arr[index] != 0) {
242: byteArr[byteArrStart++] = (byte) arr[index];
243: } else {
244: cb.position(x);
245: bb.position(byteArrStart);
246: return CoderResult
247: .unmappableForLength(1);
248: }
249: }
250: }
251: }
252: cb.position(x);
253: bb.position(byteArrStart);
254: if (rem == bbRemaining && cb.hasRemaining()) {
255: return CoderResult.OVERFLOW;
256: }
257: } else {
258: while (cb.hasRemaining()) {
259: if (bbRemaining == 0)
260: return CoderResult.OVERFLOW;
261: char c = cb.get();
262: if (c > (char) 0x0E5B) {
263: if (c >= 0xD800 && c <= 0xDFFF) {
264: if (cb.hasRemaining()) {
265: char c1 = cb.get();
266: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
267: cb.position(cb.position() - 2);
268: return CoderResult
269: .unmappableForLength(2);
270: } else {
271: cb.position(cb.position() - 1);
272: }
273: } else {
274: cb.position(cb.position() - 1);
275: return CoderResult.UNDERFLOW;
276: }
277: cb.position(cb.position() - 1);
278: return CoderResult
279: .malformedForLength(1);
280: }
281: cb.position(cb.position() - 1);
282: return CoderResult.unmappableForLength(1);
283: } else {
284: if (c < 0x04) {
285: bb.put((byte) c);
286: } else {
287: int index = (int) c >> 8;
288: index = encodeIndex[index];
289: if (index < 0) {
290: cb.position(cb.position() - 1);
291: return CoderResult
292: .unmappableForLength(1);
293: }
294: index <<= 8;
295: index += (int) c & 0xFF;
296: if ((byte) arr[index] != 0) {
297: bb.put((byte) arr[index]);
298: } else {
299: cb.position(cb.position() - 1);
300: return CoderResult
301: .unmappableForLength(1);
302: }
303: }
304: bbRemaining--;
305: }
306: }
307: }
308: }
309: return CoderResult.UNDERFLOW;
310: }
311:
/**
 * Encode table. {@code encodeLoop} reads the entry at
 * {@code (encodeIndex[c >> 8] << 8) + (c & 0xFF)} for a char {@code c}
 * that is at least 0x04 and at most 0x0E5B; the entry, cast to a byte, is
 * the output byte. An entry of 0 is treated as "unmappable". Chars below
 * 0x04 bypass the table and are written as-is.
 */
final static char arr[] = {

    0x00, 0x01, 0x02, 0x03, 0x37, 0x2D, 0x2E, 0x2F, 0x16, 0x05,
    0x25, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12,
    0x13, 0x3C, 0x3D, 0x32, 0x26, 0x18, 0x19, 0x3F, 0x27,
    0x1C, 0x1D, 0x1E, 0x1F, 0x40, 0x5A, 0x7F, 0x7B, 0x5B,
    0x6C, 0x50, 0x7D, 0x4D, 0x5D, 0x5C, 0x4E, 0x6B, 0x60,
    0x4B, 0x61, 0xF0, 0xF1, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6,
    0xF7, 0xF8, 0xF9, 0x7A, 0x5E, 0x4C, 0x7E, 0x6E, 0x6F,
    0x7C, 0xC1, 0xC2, 0xC3, 0xC4, 0xC5, 0xC6, 0xC7, 0xC8,
    0xC9, 0xD1, 0xD2, 0xD3, 0xD4, 0xD5, 0xD6, 0xD7, 0xD8,
    0xD9, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7, 0xE8, 0xE9,
    0x49, 0xE0, 0x59, 0x69, 0x6D, 0x79, 0x81, 0x82, 0x83,
    0x84, 0x85, 0x86, 0x87, 0x88, 0x89, 0x91, 0x92, 0x93,
    0x94, 0x95, 0x96, 0x97, 0x98, 0x99, 0xA2, 0xA3, 0xA4,
    0xA5, 0xA6, 0xA7, 0xA8, 0xA9, 0xC0, 0x4F, 0xD0, 0xA1,
    0x07, 0x20, 0x21, 0x22, 0x23, 0x24, 0x15, 0x06, 0x17,
    0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x09, 0x0A, 0x1B, 0x30,
    0x31, 0x1A, 0x33, 0x34, 0x35, 0x36, 0x08, 0x38, 0x39,
    0x3A, 0x3B, 0x04, 0x14, 0x3E, 0xFF, 0x41, 0x00, 0x4A,
    0x00, 0x00, 0x00, 0x6A, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x5F, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00,

    0x00, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x52,
    0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x62, 0x63, 0x64,
    0x65, 0x66, 0x67, 0x68, 0x72, 0x73, 0x74, 0x75, 0x76,
    0x77, 0x78, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F, 0x9A,
    0x9B, 0x9C, 0x9D, 0x9E, 0x9F, 0xAA, 0xAB, 0xAC, 0xAD,
    0xAE, 0xAF, 0xBA, 0xBB, 0xBC, 0xBD, 0xBE, 0xBF, 0xCB,
    0xCC, 0xCD, 0xCE, 0xCF, 0xDA, 0x00, 0x00, 0x00, 0x00,
    0x70, 0xDB, 0xDC, 0xDD, 0xDE, 0xDF, 0xEA, 0xEB, 0xEC,
    0xED, 0xEE, 0xEF, 0xFD, 0xFE, 0xFC, 0x71, 0x80, 0xB0,
    0xB1, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, 0xB8, 0xB9,
    0x90, 0xA0, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
    0x00, 0x00, 0x00, 0x00 };
373:
/**
 * Page index for the encode table, addressed by the high byte of a char
 * ({@code c >> 8}). A non-negative value is shifted left by 8 and added to
 * the low byte of the char to form the index into {@code arr}; a negative
 * value makes {@code encodeLoop} report the char as unmappable.
 */
final static int[] encodeIndex = { 0, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, 1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
393: }
394: }
|