All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hudi.hadoop.fs.inline.InLineFileSystem Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.hudi.hadoop.fs.inline;

import org.apache.hudi.storage.StoragePath;
import org.apache.hudi.storage.inline.InLineFSUtils;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.util.Progressable;

import java.io.IOException;
import java.net.URI;

import static org.apache.hudi.hadoop.fs.HadoopFSUtils.convertToStoragePath;

/**
 * Enables reading any inline file at a given offset and length. This {@link FileSystem} is used only in read path and does not support
 * any write apis.
 * 

* - Reading an inlined file at a given offset, length, read it out as if it were an independent file of that length * - Inlined path is of the form "inlinefs:///path/to/outer/file//?start_offset=&length= *

* TODO: The reader/writer may try to use relative paths based on the inlinepath and it may not work. Need to handle * this gracefully eg. the parquet summary metadata reading. TODO: If this shows promise, also support directly writing * the inlined file to the underneath file without buffer */ public class InLineFileSystem extends FileSystem { public static final String SCHEME = InLineFSUtils.SCHEME; private Configuration conf = null; @Override public void initialize(URI name, Configuration conf) throws IOException { super.initialize(name, conf); this.conf = conf; } @Override public URI getUri() { return URI.create(getScheme()); } @Override public String getScheme() { return SCHEME; } @Override public FSDataInputStream open(Path inlinePath, int bufferSize) throws IOException { Path outerPath = HadoopInLineFSUtils.getOuterFilePathFromInlinePath(inlinePath); FileSystem outerFs = outerPath.getFileSystem(conf); FSDataInputStream outerStream = outerFs.open(outerPath, bufferSize); StoragePath inlineStoragePath = convertToStoragePath(inlinePath); return new InLineFsDataInputStream(HadoopInLineFSUtils.startOffset(inlineStoragePath), outerStream, HadoopInLineFSUtils.length(inlineStoragePath)); } @Override public boolean exists(Path f) { try { return getFileStatus(f) != null; } catch (Exception e) { return false; } } @Override public FileStatus getFileStatus(Path inlinePath) throws IOException { Path outerPath = HadoopInLineFSUtils.getOuterFilePathFromInlinePath(inlinePath); FileSystem outerFs = outerPath.getFileSystem(conf); FileStatus status = outerFs.getFileStatus(outerPath); FileStatus toReturn = new FileStatus(HadoopInLineFSUtils.length(convertToStoragePath(inlinePath)), status.isDirectory(), status.getReplication(), status.getBlockSize(), status.getModificationTime(), status.getAccessTime(), status.getPermission(), status.getOwner(), status.getGroup(), inlinePath); return toReturn; } @Override public FSDataOutputStream create(Path path, FsPermission fsPermission, boolean b, int i, short i1, long l, Progressable progressable) throws IOException { throw new UnsupportedOperationException("Can't rename files"); } @Override public FSDataOutputStream append(Path path, int i, Progressable progressable) throws IOException { throw new UnsupportedOperationException("Can't rename files"); } @Override public boolean rename(Path path, Path path1) throws IOException { throw new UnsupportedOperationException("Can't rename files"); } @Override public boolean delete(Path path, boolean b) throws IOException { throw new UnsupportedOperationException("Can't delete files"); } @Override public FileStatus[] listStatus(Path inlinePath) throws IOException { return new FileStatus[] {getFileStatus(inlinePath)}; } @Override public void setWorkingDirectory(Path path) { throw new UnsupportedOperationException("Can't set working directory"); } @Override public Path getWorkingDirectory() { throw new UnsupportedOperationException("Can't get working directory"); } @Override public boolean mkdirs(Path path, FsPermission fsPermission) throws IOException { throw new UnsupportedOperationException("Can't set working directory"); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy