All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.hudi.common.model.HoodieLogFile Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hudi.common.model;

import org.apache.hudi.common.fs.FSUtils;
import org.apache.hudi.exception.InvalidHoodiePathException;
import org.apache.hudi.hadoop.CachingPath;

import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;

import java.io.IOException;
import java.io.Serializable;
import java.util.Comparator;
import java.util.Objects;
import java.util.regex.Matcher;

import static org.apache.hudi.common.fs.FSUtils.LOG_FILE_PATTERN;

/**
 * Abstracts a single log file. Contains methods to extract metadata like the fileId, version and extension from the log
 * file path.
 * 

* Also contains logic to roll-over the log file */ public class HoodieLogFile implements Serializable { private static final long serialVersionUID = 1L; public static final String DELTA_EXTENSION = ".log"; public static final String LOG_FILE_PREFIX = "."; public static final Integer LOGFILE_BASE_VERSION = 1; private static final Comparator LOG_FILE_COMPARATOR = new LogFileComparator(); private static final Comparator LOG_FILE_COMPARATOR_REVERSED = new LogFileComparator().reversed(); private transient FileStatus fileStatus; private transient Path path; private final String pathStr; private String fileId; private String baseCommitTime; private int logVersion; private String logWriteToken; private String fileExtension; private String suffix; private long fileLen; public HoodieLogFile(HoodieLogFile logFile) { this.fileStatus = logFile.getFileStatus(); this.path = logFile.getPath(); this.pathStr = logFile.pathStr; this.fileId = logFile.getFileId(); this.baseCommitTime = logFile.getBaseCommitTime(); this.logVersion = logFile.getLogVersion(); this.logWriteToken = logFile.getLogWriteToken(); this.fileExtension = logFile.getFileExtension(); this.suffix = logFile.getSuffix(); this.fileLen = logFile.getFileSize(); } public HoodieLogFile(FileStatus fileStatus) { this(fileStatus, fileStatus.getPath(), fileStatus.getPath().toString(), fileStatus.getLen()); } public HoodieLogFile(Path logPath) { this(null, logPath, logPath.toString(), -1); } public HoodieLogFile(Path logPath, long fileLen) { this(null, logPath, logPath.toString(), fileLen); } public HoodieLogFile(String logPathStr) { this(null, null, logPathStr, -1); } private HoodieLogFile(FileStatus fileStatus, Path logPath, String logPathStr, long fileLen) { this.fileStatus = fileStatus; this.pathStr = logPathStr; this.fileLen = fileLen; this.logVersion = -1; // mark version as uninitialized if (logPath instanceof CachingPath) { this.path = logPath; } } private void parseFieldsFromPath() { Matcher matcher = 
LOG_FILE_PATTERN.matcher(getPath().getName()); if (!matcher.find()) { throw new InvalidHoodiePathException(path, "LogFile"); } this.fileId = matcher.group(1); this.baseCommitTime = matcher.group(2); this.fileExtension = matcher.group(3); this.logVersion = Integer.parseInt(matcher.group(4)); this.logWriteToken = matcher.group(6); this.suffix = matcher.group(10) == null ? "" : matcher.group(10); } public String getFileId() { if (fileId == null) { parseFieldsFromPath(); } return fileId; } public String getBaseCommitTime() { if (baseCommitTime == null) { parseFieldsFromPath(); } return baseCommitTime; } public int getLogVersion() { if (logVersion == -1) { parseFieldsFromPath(); } return logVersion; } public String getLogWriteToken() { if (logWriteToken == null) { parseFieldsFromPath(); } return logWriteToken; } public String getFileExtension() { if (fileExtension == null) { parseFieldsFromPath(); } return fileExtension; } public String getSuffix() { if (suffix == null) { parseFieldsFromPath(); } return suffix; } public Path getPath() { if (path == null) { path = new CachingPath(pathStr); } return path; } public String getFileName() { return getPath().getName(); } public void setFileLen(long fileLen) { this.fileLen = fileLen; } public long getFileSize() { return fileLen; } public FileStatus getFileStatus() { return fileStatus; } public void setFileStatus(FileStatus fileStatus) { this.fileStatus = fileStatus; } public HoodieLogFile rollOver(FileSystem fs, String logWriteToken) throws IOException { String fileId = getFileId(); String baseCommitTime = getBaseCommitTime(); Path path = getPath(); String extension = "." 
+ fileExtension; int newVersion = FSUtils.computeNextLogVersion(fs, path.getParent(), fileId, extension, baseCommitTime); return new HoodieLogFile(new CachingPath(path.getParent(), FSUtils.makeLogFileName(fileId, extension, baseCommitTime, newVersion, logWriteToken))); } public static Comparator getLogFileComparator() { return LOG_FILE_COMPARATOR; } public static Comparator getReverseLogFileComparator() { return LOG_FILE_COMPARATOR_REVERSED; } /** * Comparator to order log-files. */ public static class LogFileComparator implements Comparator, Serializable { private static final long serialVersionUID = 1L; private transient Comparator writeTokenComparator; private Comparator getWriteTokenComparator() { if (null == writeTokenComparator) { // writeTokenComparator is not serializable. Hence, lazy loading writeTokenComparator = Comparator.nullsFirst(Comparator.naturalOrder()); } return writeTokenComparator; } @Override public int compare(HoodieLogFile o1, HoodieLogFile o2) { String baseInstantTime1 = o1.getBaseCommitTime(); String baseInstantTime2 = o2.getBaseCommitTime(); if (baseInstantTime1.equals(baseInstantTime2)) { if (o1.getLogVersion() == o2.getLogVersion()) { int compareWriteToken = getWriteTokenComparator().compare(o1.getLogWriteToken(), o2.getLogWriteToken()); if (compareWriteToken == 0) { // Compare by suffix when write token is same return o1.getSuffix().compareTo(o2.getSuffix()); } // Compare by write token when base-commit and log-version is same return compareWriteToken; } // compare by log-version when base-commit is same return Integer.compare(o1.getLogVersion(), o2.getLogVersion()); } // compare by base-commits return baseInstantTime1.compareTo(baseInstantTime2); } } @Override public boolean equals(Object o) { if (this == o) { return true; } if (o == null || getClass() != o.getClass()) { return false; } HoodieLogFile that = (HoodieLogFile) o; return Objects.equals(pathStr, that.pathStr); } @Override public int hashCode() { return 
Objects.hash(pathStr); } @Override public String toString() { return "HoodieLogFile{pathStr='" + pathStr + '\'' + ", fileLen=" + fileLen + '}'; } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy