All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hudi.sink.meta.CkpMetadata Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hudi.sink.meta;

import org.apache.hudi.common.table.HoodieTableMetaClient;
import org.apache.hudi.common.util.StringUtils;
import org.apache.hudi.common.util.ValidationUtils;
import org.apache.hudi.common.util.VisibleForTesting;
import org.apache.hudi.exception.HoodieException;
import org.apache.hudi.storage.StoragePath;

import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import javax.annotation.Nullable;

import java.io.IOException;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import java.util.stream.Collectors;
import java.util.stream.Stream;

/**
 * The checkpoint metadata for bookkeeping the checkpoint messages.
 *
 * 

Each time the driver starts a new instant, it writes a commit message into the metadata, the write tasks * then consume the message and unblock the data flushing. * *

Why we use the DFS based message queue instead of sending * the {@link org.apache.flink.runtime.operators.coordination.OperatorEvent} ? * The writer task thread handles the operator event using the main mailbox executor which has the lowest priority for mails, * it is also used to process the inputs. When the writer task blocks and waits for the operator event to ack the valid instant to write, * it actually blocks all the subsequent events in the mailbox, the operator event would never be consumed then it causes deadlock. * *

The checkpoint metadata is also more lightweight than the active timeline. * *

NOTE: should be removed in the future if we have good manner to handle the async notifications from driver. */ public class CkpMetadata implements Serializable, AutoCloseable { private static final long serialVersionUID = 1L; private static final Logger LOG = LoggerFactory.getLogger(CkpMetadata.class); // 1 is actually enough for fetching the latest pending instant, // keep 3 instants here for purpose of debugging. private static final int MAX_RETAIN_CKP_NUM = 3; // the ckp metadata directory private static final String CKP_META = "ckp_meta"; private final FileSystem fs; protected final Path path; private List messages; private List instantCache; CkpMetadata(FileSystem fs, String basePath, String uniqueId) { this.fs = fs; this.path = new Path(ckpMetaPath(basePath, uniqueId)); } public void close() { this.instantCache = null; } // ------------------------------------------------------------------------- // WRITE METHODS // ------------------------------------------------------------------------- /** * Initialize the message bus, would clean all the messages * *

This expects to be called by the driver. */ public void bootstrap() throws IOException { fs.delete(path, true); fs.mkdirs(path); } public void startInstant(String instant) { Path path = fullPath(CkpMessage.getFileName(instant, CkpMessage.State.INFLIGHT)); try { fs.createNewFile(path); } catch (IOException e) { throw new HoodieException("Exception while adding checkpoint start metadata for instant: " + instant, e); } // cache the instant cache(instant); // cleaning clean(); } private void cache(String newInstant) { if (this.instantCache == null) { this.instantCache = new ArrayList<>(); } this.instantCache.add(newInstant); } private void clean() { if (instantCache.size() > MAX_RETAIN_CKP_NUM) { final String instant = instantCache.get(0); boolean[] error = new boolean[1]; CkpMessage.getAllFileNames(instant).stream().map(this::fullPath).forEach(path -> { try { fs.delete(path, false); } catch (IOException e) { error[0] = true; LOG.warn("Exception while cleaning the checkpoint meta file: " + path); } }); if (!error[0]) { instantCache.remove(0); } } } /** * Add a checkpoint commit message. * * @param instant The committed instant */ public void commitInstant(String instant) { Path path = fullPath(CkpMessage.getFileName(instant, CkpMessage.State.COMPLETED)); try { fs.createNewFile(path); } catch (IOException e) { throw new HoodieException("Exception while adding checkpoint commit metadata for instant: " + instant, e); } } /** * Add an aborted checkpoint message. */ public void abortInstant(String instant) { Path path = fullPath(CkpMessage.getFileName(instant, CkpMessage.State.ABORTED)); try { fs.createNewFile(path); } catch (IOException e) { throw new HoodieException("Exception while adding checkpoint abort metadata for instant: " + instant); } } // ------------------------------------------------------------------------- // READ METHODS // ------------------------------------------------------------------------- private void load() { try { this.messages = scanCkpMetadata(this.path); } catch (IOException e) { throw new HoodieException("Exception while scanning the checkpoint meta files under path: " + this.path, e); } } @Nullable public String lastPendingInstant() { load(); if (this.messages.size() > 0) { CkpMessage ckpMsg = this.messages.get(this.messages.size() - 1); // consider 'aborted' as pending too to reuse the instant if (!ckpMsg.isComplete()) { return ckpMsg.getInstant(); } } return null; } public List getMessages() { load(); return messages; } public boolean isAborted(String instant) { ValidationUtils.checkState(this.messages != null, "The checkpoint metadata should #load first"); return this.messages.stream().anyMatch(ckpMsg -> instant.equals(ckpMsg.getInstant()) && ckpMsg.isAborted()); } @VisibleForTesting public List getInstantCache() { return this.instantCache; } @Nullable @VisibleForTesting public String lastCompleteInstant() { load(); for (int i = this.messages.size() - 1; i >= 0; i--) { CkpMessage ckpMsg = this.messages.get(i); if (ckpMsg.isComplete()) { return ckpMsg.getInstant(); } } return null; } // ------------------------------------------------------------------------- // Utilities // ------------------------------------------------------------------------- protected static String ckpMetaPath(String basePath, String uniqueId) { // .hoodie/.aux/ckp_meta String metaPath = basePath + StoragePath.SEPARATOR + HoodieTableMetaClient.AUXILIARYFOLDER_NAME + StoragePath.SEPARATOR + CKP_META; return StringUtils.isNullOrEmpty(uniqueId) ? metaPath : metaPath + "_" + uniqueId; } private Path fullPath(String fileName) { return new Path(path, fileName); } protected Stream fetchCkpMessages(Path ckpMetaPath) throws IOException { // This is required when the storage is minio if (!this.fs.exists(ckpMetaPath)) { return Stream.empty(); } return Arrays.stream(this.fs.listStatus(ckpMetaPath)).map(CkpMessage::new); } protected List scanCkpMetadata(Path ckpMetaPath) throws IOException { return fetchCkpMessages(ckpMetaPath) .collect(Collectors.groupingBy(CkpMessage::getInstant)).values().stream() .map(messages -> messages.stream().reduce((x, y) -> { // Pick the one with the highest state if (x.getState().compareTo(y.getState()) >= 0) { return x; } return y; }).get()) .sorted().collect(Collectors.toList()); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy