001: /*
002: * Licensed to the Apache Software Foundation (ASF) under one or more
003: * contributor license agreements. See the NOTICE file distributed with
004: * this work for additional information regarding copyright ownership.
005: * The ASF licenses this file to You under the Apache License, Version 2.0
006: * (the "License"); you may not use this file except in compliance with
007: * the License. You may obtain a copy of the License at
008: *
009: * http://www.apache.org/licenses/LICENSE-2.0
010: *
011: * Unless required by applicable law or agreed to in writing, software
012: * distributed under the License is distributed on an "AS IS" BASIS,
013: * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
014: * See the License for the specific language governing permissions and
015: * limitations under the License.
016: */
017:
018: package org.apache.harmony.niochar.charset;
019:
020: import java.nio.charset.Charset;
021: import java.nio.charset.CoderResult;
022: import java.nio.charset.CharsetDecoder;
023: import java.nio.charset.CharsetEncoder;
024: import java.nio.CharBuffer;
025: import java.nio.ByteBuffer;
026:
027: import org.apache.harmony.nio.AddressUtil;
028:
029: public class ISO_8859_9 extends Charset {
030:
031: public ISO_8859_9(String csName, String[] aliases) {
032: super (csName, aliases);
033: }
034:
035: public boolean contains(Charset cs) {
036: return cs.name().equalsIgnoreCase("IBM1026")
037: || cs.name().equalsIgnoreCase("IBM367")
038: || cs.name().equalsIgnoreCase("iso-8859-9")
039: || cs.name().equalsIgnoreCase("US-ASCII");
040: }
041:
042: public CharsetDecoder newDecoder() {
043: return new Decoder(this );
044: }
045:
046: public CharsetEncoder newEncoder() {
047: return new Encoder(this );
048: }
049:
050: private static final class Decoder extends CharsetDecoder {
051: private Decoder(Charset cs) {
052: super (cs, 1, 1);
053:
054: }
055:
056: public native int nDecode(char[] array, int arrPosition,
057: int remaining, long outAddr, int absolutePos);
058:
059: protected CoderResult decodeLoop(ByteBuffer bb, CharBuffer cb) {
060: int cbRemaining = cb.remaining();
061: if (bb.isDirect() && bb.hasRemaining() && cb.hasArray()) {
062: int toProceed = bb.remaining();
063: int cbPos = cb.position();
064: int bbPos = bb.position();
065: boolean throwOverflow = false;
066: if (cbRemaining < toProceed) {
067: toProceed = cbRemaining;
068: throwOverflow = true;
069: }
070: int res = nDecode(cb.array(), cb.arrayOffset() + cbPos,
071: toProceed, AddressUtil
072: .getDirectBufferAddress(bb), bbPos);
073: bb.position(bbPos + res);
074: cb.position(cbPos + res);
075: if (throwOverflow)
076: return CoderResult.OVERFLOW;
077: } else {
078: if (bb.hasArray() && cb.hasArray()) {
079: int rem = bb.remaining();
080: rem = cbRemaining >= rem ? rem : cbRemaining;
081: byte[] bArr = bb.array();
082: char[] cArr = cb.array();
083: int bStart = bb.position();
084: int cStart = cb.position();
085: int i;
086: for (i = bStart; i < bStart + rem; i++) {
087: int in = (int) bArr[i];
088: if (in < 0 && in >= -48) {
089: int index = (int) in + 48;
090: cArr[cStart++] = (char) arr[index];
091: } else {
092: cArr[cStart++] = (char) (in & 0xFF);
093: }
094: }
095: bb.position(i);
096: cb.position(cStart);
097: if (rem == cbRemaining && bb.hasRemaining())
098: return CoderResult.OVERFLOW;
099: } else {
100: while (bb.hasRemaining()) {
101: if (cbRemaining == 0)
102: return CoderResult.OVERFLOW;
103: int in = (int) bb.get();
104: if (in < 0 && in >= -48) {
105: int index = (int) in + 48;
106: cb.put(arr[index]);
107: } else {
108: cb.put((char) (in & 0xFF));
109: }
110: cbRemaining--;
111: }
112: }
113: }
114: return CoderResult.UNDERFLOW;
115: }
116:
117: final static char[] arr = { 0x011E, 0x00D1, 0x00D2, 0x00D3,
118: 0x00D4, 0x00D5, 0x00D6, 0x00D7, 0x00D8, 0x00D9, 0x00DA,
119: 0x00DB, 0x00DC, 0x0130, 0x015E, 0x00DF, 0x00E0, 0x00E1,
120: 0x00E2, 0x00E3, 0x00E4, 0x00E5, 0x00E6, 0x00E7, 0x00E8,
121: 0x00E9, 0x00EA, 0x00EB, 0x00EC, 0x00ED, 0x00EE, 0x00EF,
122: 0x011F, 0x00F1, 0x00F2, 0x00F3, 0x00F4, 0x00F5, 0x00F6,
123: 0x00F7, 0x00F8, 0x00F9, 0x00FA, 0x00FB, 0x00FC, 0x0131,
124: 0x015F, 0x00FF };
125: }
126:
127: private static final class Encoder extends CharsetEncoder {
128: private Encoder(Charset cs) {
129: super (cs, 1, 1);
130: }
131:
132: private native void nEncode(long outAddr, int absolutePos,
133: char[] array, int arrPosition, int[] res);
134:
135: protected CoderResult encodeLoop(CharBuffer cb, ByteBuffer bb) {
136: int bbRemaining = bb.remaining();
137: if (bb.isDirect() && cb.hasRemaining() && cb.hasArray()) {
138: int toProceed = cb.remaining();
139: int cbPos = cb.position();
140: int bbPos = bb.position();
141: boolean throwOverflow = false;
142: if (bbRemaining < toProceed) {
143: toProceed = bbRemaining;
144: throwOverflow = true;
145: }
146: int[] res = { toProceed, 0 };
147: nEncode(AddressUtil.getDirectBufferAddress(bb), bbPos,
148: cb.array(), cb.arrayOffset() + cbPos, res);
149: if (res[0] <= 0) {
150: bb.position(bbPos - res[0]);
151: cb.position(cbPos - res[0]);
152: if (res[1] != 0) {
153: if (res[1] < 0)
154: return CoderResult
155: .malformedForLength(-res[1]);
156: else
157: return CoderResult
158: .unmappableForLength(res[1]);
159: }
160: } else {
161: bb.position(bbPos + res[0]);
162: cb.position(cbPos + res[0]);
163: if (throwOverflow)
164: return CoderResult.OVERFLOW;
165: }
166: } else {
167: if (bb.hasArray() && cb.hasArray()) {
168: byte[] byteArr = bb.array();
169: char[] charArr = cb.array();
170: int rem = cb.remaining();
171: int byteArrStart = bb.position();
172: rem = bbRemaining <= rem ? bbRemaining : rem;
173: int x;
174: for (x = cb.position(); x < cb.position() + rem; x++) {
175: char c = charArr[x];
176: if (c > (char) 0x015F) {
177: if (c >= 0xD800 && c <= 0xDFFF) {
178: if (x + 1 < cb.limit()) {
179: char c1 = charArr[x + 1];
180: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
181: cb.position(x);
182: bb.position(byteArrStart);
183: return CoderResult
184: .unmappableForLength(2);
185: }
186: } else {
187: cb.position(x);
188: bb.position(byteArrStart);
189: return CoderResult.UNDERFLOW;
190: }
191: cb.position(x);
192: bb.position(byteArrStart);
193: return CoderResult
194: .malformedForLength(1);
195: }
196: cb.position(x);
197: bb.position(byteArrStart);
198: return CoderResult.unmappableForLength(1);
199: } else {
200: if (c < 0xD0) {
201: byteArr[byteArrStart++] = (byte) c;
202: } else {
203: int index = (int) c >> 8;
204: index = encodeIndex[index];
205: if (index < 0) {
206: cb.position(x);
207: bb.position(byteArrStart);
208: return CoderResult
209: .unmappableForLength(1);
210: }
211: index <<= 8;
212: index += (int) c & 0xFF;
213: if ((byte) arr[index] != 0) {
214: byteArr[byteArrStart++] = (byte) arr[index];
215: } else {
216: cb.position(x);
217: bb.position(byteArrStart);
218: return CoderResult
219: .unmappableForLength(1);
220: }
221: }
222: }
223: }
224: cb.position(x);
225: bb.position(byteArrStart);
226: if (rem == bbRemaining && cb.hasRemaining()) {
227: return CoderResult.OVERFLOW;
228: }
229: } else {
230: while (cb.hasRemaining()) {
231: if (bbRemaining == 0)
232: return CoderResult.OVERFLOW;
233: char c = cb.get();
234: if (c > (char) 0x015F) {
235: if (c >= 0xD800 && c <= 0xDFFF) {
236: if (cb.hasRemaining()) {
237: char c1 = cb.get();
238: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
239: cb.position(cb.position() - 2);
240: return CoderResult
241: .unmappableForLength(2);
242: } else {
243: cb.position(cb.position() - 1);
244: }
245: } else {
246: cb.position(cb.position() - 1);
247: return CoderResult.UNDERFLOW;
248: }
249: cb.position(cb.position() - 1);
250: return CoderResult
251: .malformedForLength(1);
252: }
253: cb.position(cb.position() - 1);
254: return CoderResult.unmappableForLength(1);
255: } else {
256: if (c < 0xD0) {
257: bb.put((byte) c);
258: } else {
259: int index = (int) c >> 8;
260: index = encodeIndex[index];
261: if (index < 0) {
262: cb.position(cb.position() - 1);
263: return CoderResult
264: .unmappableForLength(1);
265: }
266: index <<= 8;
267: index += (int) c & 0xFF;
268: if ((byte) arr[index] != 0) {
269: bb.put((byte) arr[index]);
270: } else {
271: cb.position(cb.position() - 1);
272: return CoderResult
273: .unmappableForLength(1);
274: }
275: }
276: bbRemaining--;
277: }
278: }
279: }
280: }
281: return CoderResult.UNDERFLOW;
282: }
283:
284: final static char arr[] = {
285:
286: 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09,
287: 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12,
288: 0x13, 0x14, 0x15, 0x16, 0x17, 0x18, 0x19, 0x1A, 0x1B,
289: 0x1C, 0x1D, 0x1E, 0x1F, 0x20, 0x21, 0x22, 0x23, 0x24,
290: 0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x2D,
291: 0x2E, 0x2F, 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36,
292: 0x37, 0x38, 0x39, 0x3A, 0x3B, 0x3C, 0x3D, 0x3E, 0x3F,
293: 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
294: 0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F, 0x50, 0x51,
295: 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5A,
296: 0x5B, 0x5C, 0x5D, 0x5E, 0x5F, 0x60, 0x61, 0x62, 0x63,
297: 0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6A, 0x6B, 0x6C,
298: 0x6D, 0x6E, 0x6F, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75,
299: 0x76, 0x77, 0x78, 0x79, 0x7A, 0x7B, 0x7C, 0x7D, 0x7E,
300: 0x7F, 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
301: 0x88, 0x89, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F, 0x90,
302: 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98, 0x99,
303: 0x9A, 0x9B, 0x9C, 0x9D, 0x9E, 0x9F, 0xA0, 0xA1, 0xA2,
304: 0xA3, 0xA4, 0xA5, 0xA6, 0xA7, 0xA8, 0xA9, 0xAA, 0xAB,
305: 0xAC, 0xAD, 0xAE, 0xAF, 0xB0, 0xB1, 0xB2, 0xB3, 0xB4,
306: 0xB5, 0xB6, 0xB7, 0xB8, 0xB9, 0xBA, 0xBB, 0xBC, 0xBD,
307: 0xBE, 0xBF, 0xC0, 0xC1, 0xC2, 0xC3, 0xC4, 0xC5, 0xC6,
308: 0xC7, 0xC8, 0xC9, 0xCA, 0xCB, 0xCC, 0xCD, 0xCE, 0xCF,
309: 0x00, 0xD1, 0xD2, 0xD3, 0xD4, 0xD5, 0xD6, 0xD7, 0xD8,
310: 0xD9, 0xDA, 0xDB, 0xDC, 0x00, 0x00, 0xDF, 0xE0, 0xE1,
311: 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7, 0xE8, 0xE9, 0xEA,
312: 0xEB, 0xEC, 0xED, 0xEE, 0xEF, 0x00, 0xF1, 0xF2, 0xF3,
313: 0xF4, 0xF5, 0xF6, 0xF7, 0xF8, 0xF9, 0xFA, 0xFB, 0xFC,
314: 0x00, 0x00, 0xFF,
315:
316: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
317: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
318: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
319: 0x00, 0x00, 0x00, 0xD0, 0xF0, 0x00, 0x00, 0x00, 0x00,
320: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
321: 0x00, 0x00, 0x00, 0xDD, 0xFD, 0x00, 0x00, 0x00, 0x00,
322: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
323: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
324: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
325: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
326: 0x00, 0x00, 0x00, 0x00, 0xDE, 0xFE, 0x00, 0x00, 0x00,
327: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
328: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
329: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
330: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
331: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
332: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
333: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
334: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
335: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
336: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
337: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
338: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
339: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
340: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
341: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
342: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
343: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
344: 0x00, 0x00, 0x00, 0x00 };
345:
346: final static int[] encodeIndex = { 0, 1, -1, -1, -1, -1, -1,
347: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
348: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
349: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
350: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
351: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
352: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
353: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
354: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
355: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
356: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
357: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
358: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
359: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
360: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
361: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
362: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
363: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
364: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
365: }
366: }
|