001: /*
002: * Licensed to the Apache Software Foundation (ASF) under one or more
003: * contributor license agreements. See the NOTICE file distributed with
004: * this work for additional information regarding copyright ownership.
005: * The ASF licenses this file to You under the Apache License, Version 2.0
006: * (the "License"); you may not use this file except in compliance with
007: * the License. You may obtain a copy of the License at
008: *
009: * http://www.apache.org/licenses/LICENSE-2.0
010: *
011: * Unless required by applicable law or agreed to in writing, software
012: * distributed under the License is distributed on an "AS IS" BASIS,
013: * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
014: * See the License for the specific language governing permissions and
015: * limitations under the License.
016: */
017:
018: package org.apache.harmony.niochar.charset;
019:
020: import java.nio.charset.Charset;
021: import java.nio.charset.CoderResult;
022: import java.nio.charset.CharsetDecoder;
023: import java.nio.charset.CharsetEncoder;
024: import java.nio.CharBuffer;
025: import java.nio.ByteBuffer;
026:
027: import org.apache.harmony.nio.AddressUtil;
028:
029: public class ISO_8859_5 extends Charset {
030:
031: public ISO_8859_5(String csName, String[] aliases) {
032: super (csName, aliases);
033: }
034:
035: public boolean contains(Charset cs) {
036: return cs.name().equalsIgnoreCase("IBM367")
037: || cs.name().equalsIgnoreCase("iso-8859-5")
038: || cs.name().equalsIgnoreCase("US-ASCII");
039: }
040:
041: public CharsetDecoder newDecoder() {
042: return new Decoder(this );
043: }
044:
045: public CharsetEncoder newEncoder() {
046: return new Encoder(this );
047: }
048:
049: private static final class Decoder extends CharsetDecoder {
050: private Decoder(Charset cs) {
051: super (cs, 1, 1);
052:
053: }
054:
055: public native int nDecode(char[] array, int arrPosition,
056: int remaining, long outAddr, int absolutePos);
057:
058: protected CoderResult decodeLoop(ByteBuffer bb, CharBuffer cb) {
059: int cbRemaining = cb.remaining();
060: if (bb.isDirect() && bb.hasRemaining() && cb.hasArray()) {
061: int toProceed = bb.remaining();
062: int cbPos = cb.position();
063: int bbPos = bb.position();
064: boolean throwOverflow = false;
065: if (cbRemaining < toProceed) {
066: toProceed = cbRemaining;
067: throwOverflow = true;
068: }
069: int res = nDecode(cb.array(), cb.arrayOffset() + cbPos,
070: toProceed, AddressUtil
071: .getDirectBufferAddress(bb), bbPos);
072: bb.position(bbPos + res);
073: cb.position(cbPos + res);
074: if (throwOverflow)
075: return CoderResult.OVERFLOW;
076: } else {
077: if (bb.hasArray() && cb.hasArray()) {
078: int rem = bb.remaining();
079: rem = cbRemaining >= rem ? rem : cbRemaining;
080: byte[] bArr = bb.array();
081: char[] cArr = cb.array();
082: int bStart = bb.position();
083: int cStart = cb.position();
084: int i;
085: for (i = bStart; i < bStart + rem; i++) {
086: int in = (int) bArr[i];
087: if (in < 0 && in >= -95) {
088: int index = (int) in + 95;
089: cArr[cStart++] = (char) arr[index];
090: } else {
091: cArr[cStart++] = (char) (in & 0xFF);
092: }
093: }
094: bb.position(i);
095: cb.position(cStart);
096: if (rem == cbRemaining && bb.hasRemaining())
097: return CoderResult.OVERFLOW;
098: } else {
099: while (bb.hasRemaining()) {
100: if (cbRemaining == 0)
101: return CoderResult.OVERFLOW;
102: int in = (int) bb.get();
103: if (in < 0 && in >= -95) {
104: int index = (int) in + 95;
105: cb.put(arr[index]);
106: } else {
107: cb.put((char) (in & 0xFF));
108: }
109: cbRemaining--;
110: }
111: }
112: }
113: return CoderResult.UNDERFLOW;
114: }
115:
116: final static char[] arr = { 0x0401, 0x0402, 0x0403, 0x0404,
117: 0x0405, 0x0406, 0x0407, 0x0408, 0x0409, 0x040A, 0x040B,
118: 0x040C, 0x00AD, 0x040E, 0x040F, 0x0410, 0x0411, 0x0412,
119: 0x0413, 0x0414, 0x0415, 0x0416, 0x0417, 0x0418, 0x0419,
120: 0x041A, 0x041B, 0x041C, 0x041D, 0x041E, 0x041F, 0x0420,
121: 0x0421, 0x0422, 0x0423, 0x0424, 0x0425, 0x0426, 0x0427,
122: 0x0428, 0x0429, 0x042A, 0x042B, 0x042C, 0x042D, 0x042E,
123: 0x042F, 0x0430, 0x0431, 0x0432, 0x0433, 0x0434, 0x0435,
124: 0x0436, 0x0437, 0x0438, 0x0439, 0x043A, 0x043B, 0x043C,
125: 0x043D, 0x043E, 0x043F, 0x0440, 0x0441, 0x0442, 0x0443,
126: 0x0444, 0x0445, 0x0446, 0x0447, 0x0448, 0x0449, 0x044A,
127: 0x044B, 0x044C, 0x044D, 0x044E, 0x044F, 0x2116, 0x0451,
128: 0x0452, 0x0453, 0x0454, 0x0455, 0x0456, 0x0457, 0x0458,
129: 0x0459, 0x045A, 0x045B, 0x045C, 0x00A7, 0x045E, 0x045F };
130: }
131:
132: private static final class Encoder extends CharsetEncoder {
133: private Encoder(Charset cs) {
134: super (cs, 1, 1);
135: }
136:
137: private native void nEncode(long outAddr, int absolutePos,
138: char[] array, int arrPosition, int[] res);
139:
140: protected CoderResult encodeLoop(CharBuffer cb, ByteBuffer bb) {
141: int bbRemaining = bb.remaining();
142: if (bb.isDirect() && cb.hasRemaining() && cb.hasArray()) {
143: int toProceed = cb.remaining();
144: int cbPos = cb.position();
145: int bbPos = bb.position();
146: boolean throwOverflow = false;
147: if (bbRemaining < toProceed) {
148: toProceed = bbRemaining;
149: throwOverflow = true;
150: }
151: int[] res = { toProceed, 0 };
152: nEncode(AddressUtil.getDirectBufferAddress(bb), bbPos,
153: cb.array(), cb.arrayOffset() + cbPos, res);
154: if (res[0] <= 0) {
155: bb.position(bbPos - res[0]);
156: cb.position(cbPos - res[0]);
157: if (res[1] != 0) {
158: if (res[1] < 0)
159: return CoderResult
160: .malformedForLength(-res[1]);
161: else
162: return CoderResult
163: .unmappableForLength(res[1]);
164: }
165: } else {
166: bb.position(bbPos + res[0]);
167: cb.position(cbPos + res[0]);
168: if (throwOverflow)
169: return CoderResult.OVERFLOW;
170: }
171: } else {
172: if (bb.hasArray() && cb.hasArray()) {
173: byte[] byteArr = bb.array();
174: char[] charArr = cb.array();
175: int rem = cb.remaining();
176: int byteArrStart = bb.position();
177: rem = bbRemaining <= rem ? bbRemaining : rem;
178: int x;
179: for (x = cb.position(); x < cb.position() + rem; x++) {
180: char c = charArr[x];
181: if (c > (char) 0x2116) {
182: if (c >= 0xD800 && c <= 0xDFFF) {
183: if (x + 1 < cb.limit()) {
184: char c1 = charArr[x + 1];
185: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
186: cb.position(x);
187: bb.position(byteArrStart);
188: return CoderResult
189: .unmappableForLength(2);
190: }
191: } else {
192: cb.position(x);
193: bb.position(byteArrStart);
194: return CoderResult.UNDERFLOW;
195: }
196: cb.position(x);
197: bb.position(byteArrStart);
198: return CoderResult
199: .malformedForLength(1);
200: }
201: cb.position(x);
202: bb.position(byteArrStart);
203: return CoderResult.unmappableForLength(1);
204: } else {
205: if (c < 0xA1) {
206: byteArr[byteArrStart++] = (byte) c;
207: } else {
208: int index = (int) c >> 8;
209: index = encodeIndex[index];
210: if (index < 0) {
211: cb.position(x);
212: bb.position(byteArrStart);
213: return CoderResult
214: .unmappableForLength(1);
215: }
216: index <<= 8;
217: index += (int) c & 0xFF;
218: if ((byte) arr[index] != 0) {
219: byteArr[byteArrStart++] = (byte) arr[index];
220: } else {
221: cb.position(x);
222: bb.position(byteArrStart);
223: return CoderResult
224: .unmappableForLength(1);
225: }
226: }
227: }
228: }
229: cb.position(x);
230: bb.position(byteArrStart);
231: if (rem == bbRemaining && cb.hasRemaining()) {
232: return CoderResult.OVERFLOW;
233: }
234: } else {
235: while (cb.hasRemaining()) {
236: if (bbRemaining == 0)
237: return CoderResult.OVERFLOW;
238: char c = cb.get();
239: if (c > (char) 0x2116) {
240: if (c >= 0xD800 && c <= 0xDFFF) {
241: if (cb.hasRemaining()) {
242: char c1 = cb.get();
243: if (c1 >= 0xD800 && c1 <= 0xDFFF) {
244: cb.position(cb.position() - 2);
245: return CoderResult
246: .unmappableForLength(2);
247: } else {
248: cb.position(cb.position() - 1);
249: }
250: } else {
251: cb.position(cb.position() - 1);
252: return CoderResult.UNDERFLOW;
253: }
254: cb.position(cb.position() - 1);
255: return CoderResult
256: .malformedForLength(1);
257: }
258: cb.position(cb.position() - 1);
259: return CoderResult.unmappableForLength(1);
260: } else {
261: if (c < 0xA1) {
262: bb.put((byte) c);
263: } else {
264: int index = (int) c >> 8;
265: index = encodeIndex[index];
266: if (index < 0) {
267: cb.position(cb.position() - 1);
268: return CoderResult
269: .unmappableForLength(1);
270: }
271: index <<= 8;
272: index += (int) c & 0xFF;
273: if ((byte) arr[index] != 0) {
274: bb.put((byte) arr[index]);
275: } else {
276: cb.position(cb.position() - 1);
277: return CoderResult
278: .unmappableForLength(1);
279: }
280: }
281: bbRemaining--;
282: }
283: }
284: }
285: }
286: return CoderResult.UNDERFLOW;
287: }
288:
289: final static char arr[] = {
290:
291: 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09,
292: 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12,
293: 0x13, 0x14, 0x15, 0x16, 0x17, 0x18, 0x19, 0x1A, 0x1B,
294: 0x1C, 0x1D, 0x1E, 0x1F, 0x20, 0x21, 0x22, 0x23, 0x24,
295: 0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x2D,
296: 0x2E, 0x2F, 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36,
297: 0x37, 0x38, 0x39, 0x3A, 0x3B, 0x3C, 0x3D, 0x3E, 0x3F,
298: 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
299: 0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F, 0x50, 0x51,
300: 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5A,
301: 0x5B, 0x5C, 0x5D, 0x5E, 0x5F, 0x60, 0x61, 0x62, 0x63,
302: 0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6A, 0x6B, 0x6C,
303: 0x6D, 0x6E, 0x6F, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75,
304: 0x76, 0x77, 0x78, 0x79, 0x7A, 0x7B, 0x7C, 0x7D, 0x7E,
305: 0x7F, 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
306: 0x88, 0x89, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F, 0x90,
307: 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98, 0x99,
308: 0x9A, 0x9B, 0x9C, 0x9D, 0x9E, 0x9F, 0xA0, 0x00, 0x00,
309: 0x00, 0x00, 0x00, 0x00, 0xFD, 0x00, 0x00, 0x00, 0x00,
310: 0x00, 0xAD, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
311: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
312: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
313: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
314: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
315: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
316: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
317: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
318: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
319: 0x00, 0x00, 0x00,
320:
321: 0x00, 0xA1, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7, 0xA8,
322: 0xA9, 0xAA, 0xAB, 0xAC, 0x00, 0xAE, 0xAF, 0xB0, 0xB1,
323: 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, 0xB8, 0xB9, 0xBA,
324: 0xBB, 0xBC, 0xBD, 0xBE, 0xBF, 0xC0, 0xC1, 0xC2, 0xC3,
325: 0xC4, 0xC5, 0xC6, 0xC7, 0xC8, 0xC9, 0xCA, 0xCB, 0xCC,
326: 0xCD, 0xCE, 0xCF, 0xD0, 0xD1, 0xD2, 0xD3, 0xD4, 0xD5,
327: 0xD6, 0xD7, 0xD8, 0xD9, 0xDA, 0xDB, 0xDC, 0xDD, 0xDE,
328: 0xDF, 0xE0, 0xE1, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7,
329: 0xE8, 0xE9, 0xEA, 0xEB, 0xEC, 0xED, 0xEE, 0xEF, 0x00,
330: 0xF1, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6, 0xF7, 0xF8, 0xF9,
331: 0xFA, 0xFB, 0xFC, 0x00, 0xFE, 0xFF, 0x00, 0x00, 0x00,
332: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
333: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
334: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
335: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
336: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
337: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
338: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
339: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
340: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
341: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
342: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
343: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
344: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
345: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
346: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
347: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
348: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
349: 0x00, 0x00, 0x00, 0x00,
350:
351: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
352: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
353: 0x00, 0x00, 0x00, 0x00, 0xF0, 0x00, 0x00, 0x00, 0x00,
354: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
355: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
356: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
357: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
358: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
359: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
360: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
361: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
362: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
363: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
364: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
365: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
366: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
367: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
368: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
369: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
370: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
371: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
372: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
373: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
374: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
375: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
376: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
377: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
378: 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
379: 0x00, 0x00, 0x00, 0x00 };
380:
381: final static int[] encodeIndex = { 0, -1, -1, -1, 1, -1, -1,
382: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
383: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, 2, -1,
384: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
385: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
386: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
387: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
388: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
389: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
390: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
391: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
392: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
393: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
394: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
395: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
396: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
397: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
398: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
399: -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
400: }
401: }
|