| 1 | /* |
| 2 | * jDTAUS Banking Charset Providers |
| 3 | * Copyright (C) 2005 Christian Schulte |
| 4 | * <cs@schulte.it> |
| 5 | * |
| 6 | * This library is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU Lesser General Public |
| 8 | * License as published by the Free Software Foundation; either |
| 9 | * version 2.1 of the License, or any later version. |
| 10 | * |
| 11 | * This library is distributed in the hope that it will be useful, |
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 14 | * Lesser General Public License for more details. |
| 15 | * |
| 16 | * You should have received a copy of the GNU Lesser General Public |
| 17 | * License along with this library; if not, write to the Free Software |
| 18 | * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA |
| 19 | * |
| 20 | */ |
| 21 | package org.jdtaus.banking.charsets.spi; |
| 22 | |
| 23 | import java.nio.ByteBuffer; |
| 24 | import java.nio.CharBuffer; |
| 25 | import java.nio.charset.Charset; |
| 26 | import java.nio.charset.CharsetDecoder; |
| 27 | import java.nio.charset.CharsetEncoder; |
| 28 | import java.nio.charset.CoderResult; |
| 29 | import java.nio.charset.CodingErrorAction; |
| 30 | import java.nio.charset.spi.CharsetProvider; |
| 31 | import java.util.Iterator; |
| 32 | import java.util.NoSuchElementException; |
| 33 | |
| 34 | /** |
| 35 | * {@code CharsetProvider} for DIN-66003 Charset. |
| 36 | * <p> |
| 37 | * Name: DIN_66003<br> |
| 38 | * MIBenum: 24<br> |
| 39 | * Source: ECMA registry<br> |
| 40 | * Alias: iso-ir-21<br> |
| 41 | * Alias: de<br> |
| 42 | * Alias: ISO646-DE<br> |
| 43 | * Alias: csISO21German<br> |
| 44 | * See: RFC1345, KXS2 |
| 45 | * |
| 46 | * @author <a href="mailto:cs@schulte.it">Christian Schulte</a> |
| 47 | * @version $JDTAUS: DIN66003CharsetProvider.java 8661 2012-09-27 11:29:58Z schulte $ |
| 48 | */ |
| 49 | public class DIN66003CharsetProvider extends CharsetProvider |
| 50 | { |
| 51 | |
| 52 | /** Common name. */ |
| 53 | static final String COMMON_NAME = "DIN_66003"; |
| 54 | |
| 55 | /** Alias names. */ |
| 56 | static final String[] ALIAS_NAMES = |
| 57 | { |
| 58 | "iso-ir-21", "de", "iso646-de", "csiso21german" |
| 59 | }; |
| 60 | |
| 61 | /** Supported character set names. */ |
| 62 | static final String[] SUPPORTED_NAMES = |
| 63 | { |
| 64 | COMMON_NAME.toLowerCase(), "iso-ir-21", "de", "iso646-de", "csiso21german" |
| 65 | }; |
| 66 | |
| 67 | static final char[] BYTE_TO_CHAR = new char[ 0xFF ]; |
| 68 | |
| 69 | static final byte[] CHAR_TO_BYTE = new byte[ 0xFF ]; |
| 70 | |
| 71 | static |
| 72 | { |
| 73 | for ( int i = 0x7F; i >= 0; i-- ) |
| 74 | { |
| 75 | CHAR_TO_BYTE[i] = (byte) i; |
| 76 | BYTE_TO_CHAR[i] = (char) i; |
| 77 | } |
| 78 | |
| 79 | CHAR_TO_BYTE['\u00A7'] = (byte) 0x40; |
| 80 | CHAR_TO_BYTE['\u00C4'] = (byte) 0x5B; |
| 81 | CHAR_TO_BYTE['\u00D6'] = (byte) 0x5C; |
| 82 | CHAR_TO_BYTE['\u00DC'] = (byte) 0x5D; |
| 83 | CHAR_TO_BYTE['\u00E4'] = (byte) 0x7B; |
| 84 | CHAR_TO_BYTE['\u00F6'] = (byte) 0x7C; |
| 85 | CHAR_TO_BYTE['\u00FC'] = (byte) 0x7D; |
| 86 | CHAR_TO_BYTE['\u00DF'] = (byte) 0x7E; |
| 87 | |
| 88 | BYTE_TO_CHAR[0x40] = '\u00A7'; |
| 89 | BYTE_TO_CHAR[0x5B] = '\u00C4'; |
| 90 | BYTE_TO_CHAR[0x5C] = '\u00D6'; |
| 91 | BYTE_TO_CHAR[0x5D] = '\u00DC'; |
| 92 | BYTE_TO_CHAR[0x7B] = '\u00E4'; |
| 93 | BYTE_TO_CHAR[0x7C] = '\u00F6'; |
| 94 | BYTE_TO_CHAR[0x7D] = '\u00FC'; |
| 95 | BYTE_TO_CHAR[0x7E] = '\u00DF'; |
| 96 | } |
| 97 | |
| 98 | /** Creates a new {@code DIN66003CharsetProvider} instance. */ |
| 99 | public DIN66003CharsetProvider() |
| 100 | { |
| 101 | super(); |
| 102 | } |
| 103 | |
| 104 | public Charset charsetForName( final String charsetName ) |
| 105 | { |
| 106 | Charset ret = null; |
| 107 | |
| 108 | if ( charsetName != null ) |
| 109 | { |
| 110 | final String lower = charsetName.toLowerCase(); |
| 111 | for ( int i = 0; i < SUPPORTED_NAMES.length; i++ ) |
| 112 | { |
| 113 | if ( SUPPORTED_NAMES[i].equals( lower ) ) |
| 114 | { |
| 115 | ret = new DIN66003Charset(); |
| 116 | break; |
| 117 | } |
| 118 | } |
| 119 | } |
| 120 | |
| 121 | return ret; |
| 122 | } |
| 123 | |
| 124 | public Iterator charsets() |
| 125 | { |
| 126 | return new Iterator() |
| 127 | { |
| 128 | |
| 129 | private boolean hasNext = true; |
| 130 | |
| 131 | public boolean hasNext() |
| 132 | { |
| 133 | return this.hasNext; |
| 134 | } |
| 135 | |
| 136 | public Object next() |
| 137 | { |
| 138 | if ( this.hasNext ) |
| 139 | { |
| 140 | this.hasNext = false; |
| 141 | return new DIN66003Charset(); |
| 142 | } |
| 143 | else |
| 144 | { |
| 145 | throw new NoSuchElementException(); |
| 146 | } |
| 147 | } |
| 148 | |
| 149 | public void remove() |
| 150 | { |
| 151 | throw new UnsupportedOperationException(); |
| 152 | } |
| 153 | |
| 154 | }; |
| 155 | } |
| 156 | |
| 157 | } |
| 158 | |
| 159 | /** DIN-66003 {@code Charset} implementation. */ |
| 160 | class DIN66003Charset extends Charset |
| 161 | { |
| 162 | |
| 163 | public DIN66003Charset() |
| 164 | { |
| 165 | super( DIN66003CharsetProvider.COMMON_NAME, DIN66003CharsetProvider.ALIAS_NAMES ); |
| 166 | } |
| 167 | |
| 168 | public CharsetEncoder newEncoder() |
| 169 | { |
| 170 | return new DIN66003CharsetEncoder( this ); |
| 171 | } |
| 172 | |
| 173 | public CharsetDecoder newDecoder() |
| 174 | { |
| 175 | return new DIN66003CharsetDecoder( this ); |
| 176 | } |
| 177 | |
| 178 | public boolean contains( final Charset charset ) |
| 179 | { |
| 180 | return false; |
| 181 | } |
| 182 | |
| 183 | static boolean isCharacterSupported( final char c ) |
| 184 | { |
| 185 | return ( c >= 0x00 && c <= 0x3F ) || ( c >= 0x41 && c <= 0x5A ) || ( c >= 0x5F && c <= 0x7A ) || |
| 186 | c == '\u00A7' || c == '\u00C4' || c == '\u00D6' || c == '\u00DC' || c == '\u00E4' || c == '\u00F6' || |
| 187 | c == '\u00FC' || c == '\u00DF'; |
| 188 | |
| 189 | } |
| 190 | |
| 191 | } |
| 192 | |
| 193 | class DIN66003CharsetEncoder extends CharsetEncoder |
| 194 | { |
| 195 | |
| 196 | private final char[] charBuf = new char[ 65536 ]; |
| 197 | |
| 198 | DIN66003CharsetEncoder( final Charset charset ) |
| 199 | { |
| 200 | super( charset, 1f, 1f ); |
| 201 | this.onUnmappableCharacter( CodingErrorAction.REPLACE ); |
| 202 | } |
| 203 | |
| 204 | protected CoderResult encodeLoop( final CharBuffer in, final ByteBuffer buf ) |
| 205 | { |
| 206 | if ( in.hasArray() && buf.hasArray() ) |
| 207 | { |
| 208 | return encodeLoopArray( in, buf ); |
| 209 | } |
| 210 | |
| 211 | while ( in.hasRemaining() ) |
| 212 | { |
| 213 | in.mark(); |
| 214 | |
| 215 | final int len; |
| 216 | if ( in.remaining() < this.charBuf.length ) |
| 217 | { |
| 218 | len = in.remaining(); |
| 219 | in.get( this.charBuf, 0, in.remaining() ); |
| 220 | } |
| 221 | else |
| 222 | { |
| 223 | in.get( this.charBuf, 0, this.charBuf.length ); |
| 224 | len = this.charBuf.length; |
| 225 | } |
| 226 | |
| 227 | for ( int i = 0; i < len; i++ ) |
| 228 | { |
| 229 | if ( !buf.hasRemaining() ) |
| 230 | { |
| 231 | in.reset(); |
| 232 | in.position( in.position() + i ); |
| 233 | return CoderResult.OVERFLOW; |
| 234 | } |
| 235 | |
| 236 | if ( !DIN66003Charset.isCharacterSupported( this.charBuf[i] ) ) |
| 237 | { |
| 238 | in.reset(); |
| 239 | in.position( in.position() + i ); |
| 240 | return CoderResult.unmappableForLength( 1 ); |
| 241 | } |
| 242 | |
| 243 | buf.put( DIN66003CharsetProvider.CHAR_TO_BYTE[this.charBuf[i]] ); |
| 244 | } |
| 245 | } |
| 246 | |
| 247 | return CoderResult.UNDERFLOW; |
| 248 | } |
| 249 | |
| 250 | private static CoderResult encodeLoopArray( final CharBuffer in, final ByteBuffer buf ) |
| 251 | { |
| 252 | final int len = in.remaining(); |
| 253 | for ( int i = 0; i < len; i++, in.position( in.position() + 1 ), buf.position( buf.position() + 1 ) ) |
| 254 | { |
| 255 | if ( !buf.hasRemaining() ) |
| 256 | { |
| 257 | return CoderResult.OVERFLOW; |
| 258 | } |
| 259 | |
| 260 | if ( !DIN66003Charset.isCharacterSupported( in.array()[in.position() + in.arrayOffset()] ) ) |
| 261 | { |
| 262 | return CoderResult.unmappableForLength( 1 ); |
| 263 | } |
| 264 | |
| 265 | buf.array()[buf.position() + buf.arrayOffset()] = |
| 266 | DIN66003CharsetProvider.CHAR_TO_BYTE[in.array()[in.position() + in.arrayOffset()]]; |
| 267 | |
| 268 | } |
| 269 | |
| 270 | return CoderResult.UNDERFLOW; |
| 271 | } |
| 272 | |
| 273 | } |
| 274 | |
| 275 | class DIN66003CharsetDecoder extends CharsetDecoder |
| 276 | { |
| 277 | |
| 278 | private final byte[] byteBuf = new byte[ 65536 ]; |
| 279 | |
| 280 | DIN66003CharsetDecoder( final Charset charset ) |
| 281 | { |
| 282 | super( charset, 1f, 1f ); |
| 283 | this.onUnmappableCharacter( CodingErrorAction.REPLACE ); |
| 284 | } |
| 285 | |
| 286 | protected CoderResult decodeLoop( final ByteBuffer in, final CharBuffer buf ) |
| 287 | { |
| 288 | if ( in.hasArray() && buf.hasArray() ) |
| 289 | { |
| 290 | return decodeLoopArray( in, buf ); |
| 291 | } |
| 292 | |
| 293 | while ( in.hasRemaining() ) |
| 294 | { |
| 295 | in.mark(); |
| 296 | |
| 297 | final int len; |
| 298 | if ( in.remaining() < this.byteBuf.length ) |
| 299 | { |
| 300 | len = in.remaining(); |
| 301 | in.get( this.byteBuf, 0, in.remaining() ); |
| 302 | } |
| 303 | else |
| 304 | { |
| 305 | in.get( this.byteBuf, 0, this.byteBuf.length ); |
| 306 | len = this.byteBuf.length; |
| 307 | } |
| 308 | |
| 309 | for ( int i = 0; i < len; i++ ) |
| 310 | { |
| 311 | if ( !buf.hasRemaining() ) |
| 312 | { |
| 313 | in.reset(); |
| 314 | in.position( in.position() + i ); |
| 315 | return CoderResult.OVERFLOW; |
| 316 | } |
| 317 | |
| 318 | if ( ( this.byteBuf[i] & 0xFF ) < 0x00 || ( this.byteBuf[i] & 0xFF ) > 0x7F ) |
| 319 | { |
| 320 | in.reset(); |
| 321 | in.position( in.position() + i ); |
| 322 | return CoderResult.unmappableForLength( 1 ); |
| 323 | } |
| 324 | |
| 325 | buf.put( DIN66003CharsetProvider.BYTE_TO_CHAR[this.byteBuf[i] & 0xFF] ); |
| 326 | } |
| 327 | } |
| 328 | |
| 329 | return CoderResult.UNDERFLOW; |
| 330 | } |
| 331 | |
| 332 | private static CoderResult decodeLoopArray( final ByteBuffer in, final CharBuffer buf ) |
| 333 | { |
| 334 | final int len = in.remaining(); |
| 335 | for ( int i = 0; i < len; i++, in.position( in.position() + 1 ), buf.position( buf.position() + 1 ) ) |
| 336 | { |
| 337 | if ( !buf.hasRemaining() ) |
| 338 | { |
| 339 | return CoderResult.OVERFLOW; |
| 340 | } |
| 341 | |
| 342 | if ( ( in.array()[in.position() + in.arrayOffset()] & 0xFF ) < 0x00 || |
| 343 | ( in.array()[in.position() + in.arrayOffset()] & 0xFF ) > 0x7F ) |
| 344 | { |
| 345 | return CoderResult.unmappableForLength( 1 ); |
| 346 | } |
| 347 | |
| 348 | buf.array()[buf.position() + buf.arrayOffset()] = |
| 349 | DIN66003CharsetProvider.BYTE_TO_CHAR[in.array()[in.position() + in.arrayOffset()] & 0xFF]; |
| 350 | |
| 351 | } |
| 352 | |
| 353 | return CoderResult.UNDERFLOW; |
| 354 | } |
| 355 | |
| 356 | } |