All downloads are free. Search and download functionality uses the official Maven repository.

com.cloudhopper.commons.charset.AirwideIA5Charset Maven / Gradle / Ivy

Go to download

Utility classes for converting between charsets (mostly "mobile" in nature) such as Unicode to GSM and vice versa

There is a newer version: 3.0.2
Show newest version
package com.cloudhopper.commons.charset;

/*
 * #%L
 * ch-commons-charset
 * %%
 * Copyright (C) 2012 Cloudhopper by Twitter
 * %%
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *      http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * #L%
 */

import java.util.Arrays;

/**
 * Charset for the GSM/IA5 variant used by the "Airwide" SMSC vendor.
 * <p>
 * Airwide took IA5 and GSM and chose to treat a handful of characters
 * differently from everything else. Decoding therefore happens in two steps:
 * the Airwide-specific byte values are first mapped to their regular GSM
 * equivalents, and the result is then handed to the normal
 * {@link GSMCharset} decoder. Encoding is delegated to {@link GSMCharset}
 * unchanged.
 *
 * @author joelauer (twitter: @jjlauer or http://twitter.com/jjlauer)
 */
public class AirwideIA5Charset extends GSMCharset {

    /** Index of the regular GSM byte value within an override row. */
    private static final int GSM_COL = 0;

    /** Index of the Airwide-specific byte value within an override row. */
    private static final int AIRWIDE_COL = 1;

    /** Returned by {@link #gsmOverrideFor(byte)} when a byte has no override. */
    private static final int NO_OVERRIDE = -1;

    /**
     * Byte values that Airwide represents differently from GSM. Each row is
     * { GSM value, Airwide value }; the trailing comment names the character.
     */
    private static final byte[][] AIRWIDE_OVERRIDE_TABLE = {
        { (byte)0x00, (byte)0x40 }, // @
        { (byte)0x02, (byte)0x24 }, // $
        { (byte)0x11, (byte)0x5F }, // _
    };

    /**
     * Encodes the character sequence. Encoding unicode to "AIRWIDE-GSM" is
     * treated as identical to plain GSM encoding, so this simply delegates
     * to the parent class.
     *
     * @param str0 the characters to encode
     * @return whatever {@link GSMCharset#encode(CharSequence)} returns
     */
    @Override
    public byte[] encode(CharSequence str0) {
        return super.encode(str0);
    }

    /**
     * Decodes "AIRWIDE-GSM" bytes by first translating the overridden byte
     * values to GSM and then delegating to the parent decoder. The caller's
     * array is never modified.
     *
     * @param bytes the Airwide-encoded bytes; a null value is passed through
     *      to the parent decoder as-is
     * @param buffer the buffer handed to the parent decoder to receive the
     *      decoded characters
     */
    @Override
    public void decode(byte[] bytes, StringBuilder buffer) {
        super.decode(airwideToGsm(bytes), buffer);
    }

    /**
     * Produces the GSM form of an Airwide byte sequence without touching the
     * input. SMS payloads are tiny, so the extra pass is not worth optimizing
     * beyond avoiding a needless copy.
     *
     * @param airwideBytes the bytes to translate; may be null
     * @return the same array instance (or null) when no byte needs
     *      translating, otherwise a translated copy
     */
    private static byte[] airwideToGsm(byte[] airwideBytes) {
        if (airwideBytes == null) {
            return null;
        }

        // allocated lazily: stays null until the first byte that needs replacing
        byte[] translated = null;

        for (int pos = 0; pos < airwideBytes.length; pos++) {
            // always look up the ORIGINAL byte so that a value is translated
            // at most once (a replacement is never itself re-translated)
            int gsmValue = gsmOverrideFor(airwideBytes[pos]);
            if (gsmValue == NO_OVERRIDE) {
                continue;
            }
            if (translated == null) {
                translated = Arrays.copyOf(airwideBytes, airwideBytes.length);
            }
            translated[pos] = (byte) gsmValue;
        }

        return (translated != null ? translated : airwideBytes);
    }

    /**
     * Looks up the GSM replacement for a single Airwide byte value.
     *
     * @param airwideValue the byte value to look up in the Airwide column
     * @return the replacement GSM value as an unsigned int (0-255) taken from
     *      the first matching row, or {@link #NO_OVERRIDE} if the byte is not
     *      overridden
     */
    private static int gsmOverrideFor(byte airwideValue) {
        for (byte[] row : AIRWIDE_OVERRIDE_TABLE) {
            if (row[AIRWIDE_COL] == airwideValue) {
                // widen to a non-negative int so it can never collide with NO_OVERRIDE
                return row[GSM_COL] & 0xFF;
            }
        }
        return NO_OVERRIDE;
    }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy