All downloads are free. The search and download functionality uses the official Maven repository.

org.apache.hudi.org.apache.commons.io.filefilter.MagicNumberFileFilter Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.commons.io.filefilter;

import java.io.File;
import java.io.IOException;
import java.io.RandomAccessFile;
import java.io.Serializable;
import java.nio.ByteBuffer;
import java.nio.channels.FileChannel;
import java.nio.charset.Charset;
import java.nio.file.FileVisitResult;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.attribute.BasicFileAttributes;
import java.util.Arrays;

import org.apache.commons.io.IOUtils;

/**
 * 

* File filter for matching files containing a "magic number". A magic number * is a unique series of bytes common to all files of a specific file format. * For instance, all Java class files begin with the bytes * {@code 0xCAFEBABE}. *

*

Using Classic IO

*
 * File dir = new File(".");
 * MagicNumberFileFilter javaClassFileFilter =
 *     MagicNumberFileFilter(new byte[] {(byte) 0xCA, (byte) 0xFE,
 *       (byte) 0xBA, (byte) 0xBE});
 * String[] javaClassFiles = dir.list(javaClassFileFilter);
 * for (String javaClassFile : javaClassFiles) {
 *     System.out.println(javaClassFile);
 * }
 * 
* *

* Sometimes, such as in the case of TAR files, the * magic number will be offset by a certain number of bytes in the file. In the * case of TAR archive files, this offset is 257 bytes. *

* *
 * File dir = new File(".");
 * MagicNumberFileFilter tarFileFilter =
 *     MagicNumberFileFilter("ustar", 257);
 * String[] tarFiles = dir.list(tarFileFilter);
 * for (String tarFile : tarFiles) {
 *     System.out.println(tarFile);
 * }
 * 
*

Using NIO

*
 * final Path dir = Paths.get("");
 * final AccumulatorPathVisitor visitor = AccumulatorPathVisitor.withLongCounters(MagicNumberFileFilter("ustar", 257));
 * //
 * // Walk one dir
 * Files.walkFileTree(dir, Collections.emptySet(), 1, visitor);
 * System.out.println(visitor.getPathCounters());
 * System.out.println(visitor.getFileList());
 * //
 * visitor.getPathCounters().reset();
 * //
 * // Walk dir tree
 * Files.walkFileTree(dir, visitor);
 * System.out.println(visitor.getPathCounters());
 * System.out.println(visitor.getDirList());
 * System.out.println(visitor.getFileList());
 * 
* * @since 2.0 * @see FileFilterUtils#magicNumberFileFilter(byte[]) * @see FileFilterUtils#magicNumberFileFilter(String) * @see FileFilterUtils#magicNumberFileFilter(byte[], long) * @see FileFilterUtils#magicNumberFileFilter(String, long) */ public class MagicNumberFileFilter extends AbstractFileFilter implements Serializable { /** * The serialization version unique identifier. */ private static final long serialVersionUID = -547733176983104172L; /** * The magic number to compare against the file's bytes at the provided * offset. */ private final byte[] magicNumbers; /** * The offset (in bytes) within the files that the magic number's bytes * should appear. */ private final long byteOffset; /** *

* Constructs a new MagicNumberFileFilter and associates it with the magic * number to test for in files. This constructor assumes a starting offset * of {@code 0}. *

* *

* It is important to note that the array is not cloned and that * any changes to the magic number array after construction will affect the * behavior of this file filter. *

* *
     * MagicNumberFileFilter javaClassFileFilter =
     *     MagicNumberFileFilter(new byte[] {(byte) 0xCA, (byte) 0xFE,
     *       (byte) 0xBA, (byte) 0xBE});
     * 
* * @param magicNumber the magic number to look for in the file. * * @throws IllegalArgumentException if {@code magicNumber} is * {@code null}, or contains no bytes. */ public MagicNumberFileFilter(final byte[] magicNumber) { this(magicNumber, 0); } /** *

* Constructs a new MagicNumberFileFilter and associates it with the magic * number to test for in files and the byte offset location in the file to * to look for that magic number. *

* *
     * MagicNumberFileFilter tarFileFilter =
     *     MagicNumberFileFilter(new byte[] {0x75, 0x73, 0x74, 0x61, 0x72}, 257);
     * 
* *
     * MagicNumberFileFilter javaClassFileFilter =
     *     MagicNumberFileFilter(new byte[] {0xCA, 0xFE, 0xBA, 0xBE}, 0);
     * 
* * @param magicNumber the magic number to look for in the file. * @param offset the byte offset in the file to start comparing bytes. * * @throws IllegalArgumentException if {@code magicNumber} is * {@code null}, or contains no bytes, or {@code offset} * is a negative number. */ public MagicNumberFileFilter(final byte[] magicNumber, final long offset) { if (magicNumber == null) { throw new IllegalArgumentException("The magic number cannot be null"); } if (magicNumber.length == 0) { throw new IllegalArgumentException("The magic number must contain at least one byte"); } if (offset < 0) { throw new IllegalArgumentException("The offset cannot be negative"); } this.magicNumbers = IOUtils.byteArray(magicNumber.length); System.arraycopy(magicNumber, 0, this.magicNumbers, 0, magicNumber.length); this.byteOffset = offset; } /** *

* Constructs a new MagicNumberFileFilter and associates it with the magic * number to test for in files. This constructor assumes a starting offset * of {@code 0}. *

* * Example usage: *
     * {@code
     * MagicNumberFileFilter xmlFileFilter =
     *     MagicNumberFileFilter("
     *
     * @param magicNumber the magic number to look for in the file.
     *        The string is converted to bytes using the platform default charset.
     *
     * @throws IllegalArgumentException if {@code magicNumber} is
     *         {@code null} or the empty String.
     */
    public MagicNumberFileFilter(final String magicNumber) {
        this(magicNumber, 0);
    }

    /**
     * 

* Constructs a new MagicNumberFileFilter and associates it with the magic * number to test for in files and the byte offset location in the file to * to look for that magic number. *

* *
     * MagicNumberFileFilter tarFileFilter =
     *     MagicNumberFileFilter("ustar", 257);
     * 
* * @param magicNumber the magic number to look for in the file. * The string is converted to bytes using the platform default charset. * @param offset the byte offset in the file to start comparing bytes. * * @throws IllegalArgumentException if {@code magicNumber} is * {@code null} or the empty String, or {@code offset} is * a negative number. */ public MagicNumberFileFilter(final String magicNumber, final long offset) { if (magicNumber == null) { throw new IllegalArgumentException("The magic number cannot be null"); } if (magicNumber.isEmpty()) { throw new IllegalArgumentException("The magic number must contain at least one byte"); } if (offset < 0) { throw new IllegalArgumentException("The offset cannot be negative"); } this.magicNumbers = magicNumber.getBytes(Charset.defaultCharset()); // explicitly uses the platform default // charset this.byteOffset = offset; } /** *

* Accepts the provided file if the file contains the file filter's magic * number at the specified offset. *

* *

* If any {@link IOException}s occur while reading the file, the file will * be rejected. *

* * @param file the file to accept or reject. * * @return {@code true} if the file contains the filter's magic number * at the specified offset, {@code false} otherwise. */ @Override public boolean accept(final File file) { if (file != null && file.isFile() && file.canRead()) { try { try (RandomAccessFile randomAccessFile = new RandomAccessFile(file, "r")) { final byte[] fileBytes = IOUtils.byteArray(this.magicNumbers.length); randomAccessFile.seek(byteOffset); final int read = randomAccessFile.read(fileBytes); if (read != magicNumbers.length) { return false; } return Arrays.equals(this.magicNumbers, fileBytes); } } catch (final IOException ioe) { // Do nothing, fall through and do not accept file } } return false; } /** *

* Accepts the provided file if the file contains the file filter's magic * number at the specified offset. *

* *

* If any {@link IOException}s occur while reading the file, the file will * be rejected. *

* @param file the file to accept or reject. * * @return {@code true} if the file contains the filter's magic number * at the specified offset, {@code false} otherwise. * @since 2.9.0 */ @Override public FileVisitResult accept(final Path file, final BasicFileAttributes attributes) { if (file != null && Files.isRegularFile(file) && Files.isReadable(file)) { try { try (final FileChannel fileChannel = FileChannel.open(file)) { final ByteBuffer byteBuffer = ByteBuffer.allocate(this.magicNumbers.length); final int read = fileChannel.read(byteBuffer); if (read != magicNumbers.length) { return FileVisitResult.TERMINATE; } return toFileVisitResult(Arrays.equals(this.magicNumbers, byteBuffer.array()), file); } } catch (final IOException ioe) { // Do nothing, fall through and do not accept file } } return FileVisitResult.TERMINATE; } /** * Returns a String representation of the file filter, which includes the * magic number bytes and byte offset. * * @return a String representation of the file filter. */ @Override public String toString() { final StringBuilder builder = new StringBuilder(super.toString()); builder.append("("); builder.append(new String(magicNumbers, Charset.defaultCharset()));// TODO perhaps use hex if value is not // printable builder.append(","); builder.append(this.byteOffset); builder.append(")"); return builder.toString(); } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy