All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.axiom.attachments.utils.ByteSearch Maven / Gradle / Ivy

There is a newer version: 1.4.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.axiom.attachments.utils;

/**
 * ByteSearch
 *
 * Various byte array searching utilities.
 * This includes a "skip search", which is a 
 * an optimized search for finding a byte pattern in 
 * a large byte array.
 *
 * @author Richard Scheuerle ([email protected])
 *
 */
public class ByteSearch {

    
    /**
     * Search a byte sequence for a given pattern. The method uses the
     * skip search algorithm. The search can be performed in forward
     * or backward direction, i.e. beginning from the start or end of the
     * byte sequence.
     * 
     * @param pattern  byte[] 
     * @param direction true if forward, false if backward
     * @param buffer byte[] to search
     * @param start index to start search
     * @param end index to end search (end index is not within the search)
     * @param skip short[256]  A skipArray generated from a call to 
     * generateSkipArray. 
     * @return index or -1 if not found
     */
    public static int skipSearch(byte[] pattern,
                                 boolean direction,
                                 byte[] buffer,
                                 int start,
                                 int end,
                                 short[] skip) {
        
        int patternLength = pattern.length;
        
        // If patternLength is larger than buffer,
        // return not found
        if (patternLength > (end - start)) {
            return -1;
        }
        
        if (direction) {
            int k = 0;
            for (k = start + patternLength - 1; 
                k < end; // end is exclusive
                k += skip[buffer[k] & (0xff)])   // SKIP NOTE below
            {
                try {
                    // k is the location in the buffer
                    // that may match the last byte in the pattern.
                    if (isEqual(pattern, buffer, (k-patternLength)+1, end)) {
                        return (k-patternLength)+1;
                    }
                    // SKIP NOTE: The next k index is calculated from 
                    // the skip array.  Basically if the k byte is not
                    // within the pattern, we skip ahead the length of the
                    // pattern.  Otherwise we skip ahead a distance less
                    // than the length.
                } catch (ArrayIndexOutOfBoundsException e) {
                    throw e;
                }
            }
        } else {
            for (int k = end - patternLength; 
                k <= start;
                k -= skip[buffer[k] & (0xff)]) 
            {
                try {
                    // k is the location in the buffer
                    // that may match the first byte in the pattern.
                    if (isEqual(pattern, buffer, k, end)) {
                        return k;
                    }
                } catch (ArrayIndexOutOfBoundsException e) {
                    throw e;
                }
            }
        }
        return -1;            
    }
    
    /**
     * skipArray
     * Builds a skip array for this pattern and direction.
     * The skipArray is used in the optimized skipSearch
     * @param pattern
     * @param direction
     * @return short[256]
     */
    public static short[] getSkipArray(byte[] pattern,
                    boolean direction) {
        
        // The index key is a byte.
        // The short[key] is the number of bytes that can
        // be skipped that won't match the pattern
        short[] skip = new short[256];

        // If a byte is not within pattern, then we can
        // skip ahead the entire length of the pattern.
        // So fill the skip array with the pattern length
        java.util.Arrays.fill(skip, (short) pattern.length);

        if (direction) {
            // If the byte is found in the pattern,
            // this affects how far we can skip.
            // The skip distance is the distance of the
            // character from the end of the pattern.
            // The last character in the pattern is excluded.
            for (int k = 0; k < pattern.length -1; k++) {
                skip[pattern[k] & (0xff)] = (short)(pattern.length - k - 1);
            }
        } else {
            for (int k = pattern.length-2; k >= 0; k--) {
                skip[pattern[k] &(0xff)] = (short)(pattern.length - k - 1);
            }
        }
        return skip;
    }
    
    /**
     * 
     * isEqual
     * @param pattern
     * @param buffer
     * @param start index
     * @param end index
     * @return true if the bytes in buffer[start] equal pattern
     * 
     */
    public static boolean isEqual(byte[] pattern, byte[] buffer, int start, int end) {
//        if (pattern.length >= end-start) {
        if (pattern.length > end-start) {
            return false;
        }
        for (int j=0; j= end) {
                            found = false;
                        } else {
                            found = (bytes[i+i2] == search[i2]); 
                        }
                    }
                    // If found match, set return idx
                    if (found) {
                        idx = i;
                    }
                }
            }
        } else {
            for (int i=end-1; idx < 0 && i>=start; i--) {
                if (bytes[i] == search[0]) {
                    // Potential match..check remaining bytes
                    boolean found = true;  // assume found
                    for (int i2=1; found && i2= end) {
                            found = false;
                        } else {
                            found = (bytes[i+i2] == search[i2]); 
                        }
                    }
                    // If found match, set return idx
                    if (found) {
                        idx = i;
                    }
                }
            }
        }

        return idx;
    }
}

 




© 2015 - 2025 Weber Informatics LLC | Privacy Policy