001: /*
002: * The Apache Software License, Version 1.1
003: *
004: *
005: * Copyright (c) 2000 The Apache Software Foundation. All rights
006: * reserved.
007: *
008: * Redistribution and use in source and binary forms, with or without
009: * modification, are permitted provided that the following conditions
010: * are met:
011: *
012: * 1. Redistributions of source code must retain the above copyright
013: * notice, this list of conditions and the following disclaimer.
014: *
015: * 2. Redistributions in binary form must reproduce the above copyright
016: * notice, this list of conditions and the following disclaimer in
017: * the documentation and/or other materials provided with the
018: * distribution.
019: *
020: * 3. The end-user documentation included with the redistribution,
021: * if any, must include the following acknowledgment:
022: * "This product includes software developed by the
023: * Apache Software Foundation (http://www.apache.org/)."
024: * Alternately, this acknowledgment may appear in the software itself,
025: * if and wherever such third-party acknowledgments normally appear.
026: *
027: * 4. The names "Xerces" and "Apache Software Foundation" must
028: * not be used to endorse or promote products derived from this
029: * software without prior written permission. For written
030: * permission, please contact apache@apache.org.
031: *
032: * 5. Products derived from this software may not be called "Apache",
033: * nor may "Apache" appear in their name, without prior written
034: * permission of the Apache Software Foundation.
035: *
036: * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
037: * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
038: * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
039: * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
040: * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
041: * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
042: * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
043: * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
044: * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
045: * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
046: * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
047: * SUCH DAMAGE.
048: * ====================================================================
049: *
050: * This software consists of voluntary contributions made by many
051: * individuals on behalf of the Apache Software Foundation and was
052: * originally based on software copyright (c) 1999, International
053: * Business Machines, Inc., http://www.apache.org. For more
054: * information on the Apache Software Foundation, please see
055: * <http://www.apache.org/>.
056: */
057:
058: package org.apache.xml.serialize;
059:
060: import java.io.ByteArrayOutputStream;
061: import java.io.IOException;
062: import java.io.OutputStreamWriter;
063: import java.io.Writer;
064:
065: /**
066: * This class represents an encoding.
067: *
068: * @version $Id: SieveEncodingInfo.java,v 1.1 2000/12/14 19:21:55 lehors Exp $
069: */
070: public class SieveEncodingInfo extends EncodingInfo {
071:
072: BAOutputStream checkerStream = null;
073: Writer checkerWriter = null;
074: String dangerChars = null;
075:
076: /**
077: * Creates new <code>SeiveEncodingInfo</code> instance.
078: *
079: * @param dangers A sorted characters that are always printed as character references.
080: */
081: public SieveEncodingInfo(String mimeName, String javaName,
082: int lastPrintable, String dangers) {
083: super (mimeName, javaName, lastPrintable);
084: this .dangerChars = dangers;
085: }
086:
087: /**
088: * Creates new <code>SeiveEncodingInfo</code> instance.
089: */
090: public SieveEncodingInfo(String mimeName, int lastPrintable) {
091: this (mimeName, mimeName, lastPrintable, null);
092: }
093:
094: /**
095: * Checks whether the specified character is printable or not.
096: *
097: * @param ch a code point (0-0x10ffff)
098: */
099: public boolean isPrintable(int ch) {
100: if (this .dangerChars != null && ch <= 0xffff) {
101: /**
102: * Searches this.dangerChars for ch.
103: * TODO: Use binary search.
104: */
105: if (this .dangerChars.indexOf(ch) >= 0)
106: return false;
107: }
108:
109: if (ch <= this .lastPrintable)
110: return true;
111:
112: boolean printable = true;
113: synchronized (this ) {
114: try {
115: if (this .checkerWriter == null) {
116: this .checkerStream = new BAOutputStream(10);
117: this .checkerWriter = new OutputStreamWriter(
118: this .checkerStream, this .javaName);
119: }
120:
121: if (ch > 0xffff) {
122: this .checkerWriter
123: .write(((ch - 0x10000) >> 10) + 0xd800);
124: this .checkerWriter
125: .write(((ch - 0x10000) & 0x3ff) + 0xdc00);
126: byte[] result = this .checkerStream.getBuffer();
127: if (this .checkerStream.size() == 2
128: && result[0] == '?' && result[1] == '?')
129: printable = false;
130: } else {
131: this .checkerWriter.write(ch);
132: this .checkerWriter.flush();
133: byte[] result = this .checkerStream.getBuffer();
134: if (this .checkerStream.size() == 1
135: && result[0] == '?')
136: printable = false;
137: }
138: this .checkerStream.reset();
139: } catch (IOException ioe) {
140: printable = false;
141: }
142: }
143:
144: return printable;
145: }
146:
147: /**
148: * Why don't we use the original ByteArrayOutputStream?
149: * - Because the toByteArray() method of the ByteArrayOutputStream
150: * creates new byte[] instances for each call.
151: */
152: static class BAOutputStream extends ByteArrayOutputStream {
153: BAOutputStream() {
154: super ();
155: }
156:
157: BAOutputStream(int size) {
158: super (size);
159: }
160:
161: byte[] getBuffer() {
162: return this.buf;
163: }
164: }
165:
166: }
|