
net.snowflake.ingest.streaming.internal.FlushService

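FlushService is the internal background component of the Snowflake Ingest SDK streaming client: it drains buffered channel rows, builds BDEC/Parquet blobs, uploads them to stage, and registers them with Snowflake. Applications never call it directly; it is driven by the public streaming ingest API. A minimal, hedged sketch of that public API (connection property values, object names, and offset tokens below are placeholders; check the builder methods against your SDK version):

import java.util.HashMap;
import java.util.Map;
import java.util.Properties;
import net.snowflake.ingest.streaming.OpenChannelRequest;
import net.snowflake.ingest.streaming.SnowflakeStreamingIngestChannel;
import net.snowflake.ingest.streaming.SnowflakeStreamingIngestClient;
import net.snowflake.ingest.streaming.SnowflakeStreamingIngestClientFactory;

public class FlushServiceUsageSketch {
  public static void main(String[] args) throws Exception {
    Properties props = new Properties();
    props.put("url", "https://<account>.snowflakecomputing.com:443"); // placeholder
    props.put("user", "<user>"); // placeholder
    props.put("private_key", "<private_key>"); // placeholder

    try (SnowflakeStreamingIngestClient client =
        SnowflakeStreamingIngestClientFactory.builder("MY_CLIENT").setProperties(props).build()) {
      OpenChannelRequest request =
          OpenChannelRequest.builder("MY_CHANNEL")
              .setDBName("MY_DB")
              .setSchemaName("MY_SCHEMA")
              .setTableName("MY_TABLE")
              .setOnErrorOption(OpenChannelRequest.OnErrorOption.CONTINUE)
              .build();
      SnowflakeStreamingIngestChannel channel = client.openChannel(request);

      Map<String, Object> row = new HashMap<>();
      row.put("C1", 42);
      // Rows land in the channel's row buffer; FlushService later drains the buffers,
      // builds a blob, uploads it, and registers it in the background.
      channel.insertRow(row, "offset-1");

      channel.close().get(); // waits for remaining buffered data to be flushed and registered
    }
  }
}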
/*
 * Copyright (c) 2021-2024 Snowflake Computing Inc. All rights reserved.
 */

package net.snowflake.ingest.streaming.internal;

import static net.snowflake.ingest.utils.Constants.DISABLE_BACKGROUND_FLUSH;
import static net.snowflake.ingest.utils.Constants.MAX_BLOB_SIZE_IN_BYTES;
import static net.snowflake.ingest.utils.Constants.MAX_THREAD_COUNT;
import static net.snowflake.ingest.utils.Constants.THREAD_SHUTDOWN_TIMEOUT_IN_SEC;
import static net.snowflake.ingest.utils.Utils.getStackTrace;

import com.codahale.metrics.Timer;
import com.google.common.annotations.VisibleForTesting;
import java.io.IOException;
import java.lang.management.ManagementFactory;
import java.security.InvalidAlgorithmParameterException;
import java.security.InvalidKeyException;
import java.security.NoSuchAlgorithmException;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Set;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.ThreadFactory;
import java.util.concurrent.ThreadPoolExecutor;
import java.util.concurrent.TimeUnit;
import java.util.stream.Collectors;
import javax.crypto.BadPaddingException;
import javax.crypto.IllegalBlockSizeException;
import javax.crypto.NoSuchPaddingException;
import net.snowflake.client.jdbc.internal.google.common.util.concurrent.ThreadFactoryBuilder;
import net.snowflake.ingest.utils.Constants;
import net.snowflake.ingest.utils.ErrorCode;
import net.snowflake.ingest.utils.Logging;
import net.snowflake.ingest.utils.Pair;
import net.snowflake.ingest.utils.SFException;
import net.snowflake.ingest.utils.Utils;

/**
 * Responsible for flushing data from client to Snowflake tables. When a flush is triggered, it
 * will do the following in order:
 *
 * <ul>
 *   <li>take the data from all the channel row buffers
 *   <li>build the blob using the ChannelData returned from previous step
 *   <li>upload the blob to stage
 *   <li>register the blob to the targeted Snowflake table
 * </ul>
 *
 * @param <T> type of column data ({@link ParquetChunkData})
 */
class FlushService<T> {

  // The max number of upload retry attempts to the stage
  private static final int DEFAULT_MAX_UPLOAD_RETRIES = 5;

  // Static class to save the list of channels that are used to build a blob, which is mainly used
  // to invalidate all the channels when there is a failure
  static class BlobData<T> {
    private final String path;
    private final List<List<ChannelData<T>>> data;

    BlobData(String path, List<List<ChannelData<T>>> data) {
      this.path = path;
      this.data = data;
    }

    String getPath() {
      return path;
    }

    List<List<ChannelData<T>>> getData() {
      return data;
    }
  }

  private static final Logging logger = new Logging(FlushService.class);

  // The client that owns this flush service
  private final SnowflakeStreamingIngestClientInternal<T> owningClient;

  // Thread to schedule the flush job
  @VisibleForTesting ScheduledExecutorService flushWorker;

  // Thread to register the blob
  @VisibleForTesting ExecutorService registerWorker;

  // Threads to build and upload the blob
  @VisibleForTesting ExecutorService buildUploadWorkers;

  // Reference to the channel cache
  private final ChannelCache<T> channelCache;

  // Reference to the Streaming Ingest storage manager
  private final IStorageManager storageManager;

  // Reference to register service
  private final RegisterService<T> registerService;

  /**
   * Client level last flush time and need flush flag. These two variables are used when max chunk
   * in blob is not 1. When max chunk in blob is 1, flush service ignores these variables and uses
   * table level last flush time and need flush flag. See {@link ChannelCache.FlushInfo}.
   */
  @VisibleForTesting volatile long lastFlushTime;

  @VisibleForTesting volatile boolean isNeedFlush;

  // Indicates whether it's running as part of the test
  private final boolean isTestMode;

  // A map which stores the timer for each blob in order to capture the flush latency
  private final Map<String, Timer.Context> latencyTimerContextMap;

  // blob encoding version
  private final Constants.BdecVersion bdecVersion;

  private volatile int numProcessors = Runtime.getRuntime().availableProcessors();

  /**
   * Default constructor
   *
   * @param client the owning client
   * @param cache the channel cache
   * @param storageManager the storage manager
   * @param isTestMode whether the service is running in test mode
   */
  FlushService(
      SnowflakeStreamingIngestClientInternal<T> client,
      ChannelCache<T> cache,
      IStorageManager storageManager,
      boolean isTestMode) {
    this.owningClient = client;
    this.channelCache = cache;
    this.storageManager = storageManager;
    this.registerService = new RegisterService<>(client, isTestMode);
    this.isNeedFlush = false;
    this.lastFlushTime = System.currentTimeMillis();
    this.isTestMode = isTestMode;
    this.latencyTimerContextMap = new ConcurrentHashMap<>();
    this.bdecVersion = this.owningClient.getParameterProvider().getBlobFormatVersion();
    createWorkers();
  }

  /**
   * Collect performance stats if enabled
   *
   * @return
   */
  private CompletableFuture<Void> statsFuture() {
    return CompletableFuture.runAsync(
        () -> {
          if (this.owningClient.cpuHistogram != null) {
            double cpuLoad =
                ManagementFactory.getPlatformMXBean(com.sun.management.OperatingSystemMXBean.class)
                    .getProcessCpuLoad();
            this.owningClient.cpuHistogram.update((long) (cpuLoad * 100));
          }
          return;
        },
        this.flushWorker);
  }
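  // Illustration (not part of this class): statsFuture() above samples process CPU load through
  // the platform MXBean. The same call can be used standalone; getProcessCpuLoad() returns a
  // value in [0.0, 1.0], or a negative value when the load is not yet available:
  //
  //   com.sun.management.OperatingSystemMXBean os =
  //       ManagementFactory.getPlatformMXBean(com.sun.management.OperatingSystemMXBean.class);
  //   double load = os.getProcessCpuLoad();
  //   if (load >= 0) {
  //     long percent = (long) (load * 100); // same scaling as the cpuHistogram update above
  //   }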
  /**
   * @param isForce if true will flush regardless of other conditions
   * @param tablesToFlush list of tables to flush
   * @param flushStartTime the time when the flush started
   * @return
   */
  private CompletableFuture<Void> distributeFlush(
      boolean isForce, Set<String> tablesToFlush, Long flushStartTime) {
    return CompletableFuture.runAsync(
        () -> {
          logFlushTask(isForce, tablesToFlush, flushStartTime);
          distributeFlushTasks(tablesToFlush);
          long prevFlushEndTime = System.currentTimeMillis();
          this.lastFlushTime = prevFlushEndTime;
          this.isNeedFlush = false;
          tablesToFlush.forEach(
              table -> {
                this.channelCache.setLastFlushTime(table, prevFlushEndTime);
                this.channelCache.setNeedFlush(table, false);
              });
        },
        this.flushWorker);
  }

  /** If tracing is enabled, print always; else, check if it needs flush or is forceful. */
  private void logFlushTask(boolean isForce, Set<String> tablesToFlush, long flushStartTime) {
    boolean isNeedFlush =
        this.owningClient.getParameterProvider().getMaxChunksInBlob() == 1
            ? tablesToFlush.stream().anyMatch(channelCache::getNeedFlush)
            : this.isNeedFlush;
    long currentTime = System.currentTimeMillis();
    final String logInfo;
    if (this.owningClient.getParameterProvider().getMaxChunksInBlob() == 1) {
      logInfo =
          String.format(
              "Tables=[%s]",
              tablesToFlush.stream()
                  .map(
                      table ->
                          String.format(
                              "(name=%s, isNeedFlush=%s, timeDiffMillis=%s, currentDiffMillis=%s)",
                              table,
                              channelCache.getNeedFlush(table),
                              flushStartTime - channelCache.getLastFlushTime(table),
                              currentTime - channelCache.getLastFlushTime(table)))
                  .collect(Collectors.joining(", ")));
    } else {
      logInfo =
          String.format(
              "isNeedFlush=%s, timeDiffMillis=%s, currentDiffMillis=%s",
              isNeedFlush, flushStartTime - this.lastFlushTime, currentTime - this.lastFlushTime);
    }

    final String flushTaskLogFormat =
        String.format(
            "Submit forced or ad-hoc flush task on client=%s, isForce=%s, %s",
            this.owningClient.getName(), isForce, logInfo);
    if (logger.isTraceEnabled()) {
      logger.logTrace(flushTaskLogFormat);
    }
    if (!logger.isTraceEnabled() && (isNeedFlush || isForce)) {
      logger.logDebug(flushTaskLogFormat);
    }
  }

  /**
   * Registers blobs with Snowflake
   *
   * @return
   */
  private CompletableFuture<Void> registerFuture() {
    return CompletableFuture.runAsync(
        () -> this.registerService.registerBlobs(latencyTimerContextMap), this.registerWorker);
  }
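  // Illustration (not part of the library): the flush pipeline chains three async stages on
  // dedicated executors, mirroring statsFuture -> distributeFlush -> registerFuture. A minimal,
  // self-contained sketch of the same CompletableFuture composition pattern (collectStats,
  // distributeWork and registerResults are hypothetical stand-ins):
  //
  //   ExecutorService flushExec = Executors.newSingleThreadExecutor();
  //   ExecutorService registerExec = Executors.newSingleThreadExecutor();
  //   CompletableFuture<Void> pipeline =
  //       CompletableFuture.runAsync(() -> collectStats(), flushExec)
  //           .thenCompose(v -> CompletableFuture.runAsync(() -> distributeWork(), flushExec))
  //           .thenCompose(v -> CompletableFuture.runAsync(() -> registerResults(), registerExec));
  //   pipeline.join(); // block only in tests/shutdown; production code keeps the chain async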
  /**
   * Kick off a flush job and distribute the tasks. The flush service behaves differently based on
   * the max chunks in blob:
   *
   * <ul>
   *   <li>The max chunks in blob is not 1 (interleaving is allowed), every channel will be flushed
   *       together if one of the following conditions is met:
   *       <ul>
   *         <li>Flush is forced by the users
   *         <li>One or more buffers have reached the flush size
   *         <li>Periodical background flush when a time interval has reached
   *       </ul>
   *   <li>The max chunks in blob is 1 (interleaving is not allowed), a channel will be flushed if
   *       one of the following conditions is met:
   *       <ul>
   *         <li>Flush is forced by the users
   *         <li>One or more buffers with the same target table as the channel have reached the
   *             flush size
   *         <li>Periodical background flush of the target table when a time interval has reached
   *       </ul>
   * </ul>
   *
   * @param isForce
   * @return Completable future that will return when the blobs are registered successfully, or
   *     null if none of the conditions above is met
   */
  CompletableFuture<Void> flush(boolean isForce) {
    final long flushStartTime = System.currentTimeMillis();
    final long flushingInterval =
        this.owningClient.getParameterProvider().getCachedMaxClientLagInMs();

    final Set<String> tablesToFlush;
    if (this.owningClient.getParameterProvider().getMaxChunksInBlob() == 1) {
      tablesToFlush =
          this.channelCache.keySet().stream()
              .filter(
                  key ->
                      isForce
                          || flushStartTime - this.channelCache.getLastFlushTime(key)
                              >= flushingInterval
                          || this.channelCache.getNeedFlush(key))
              .collect(Collectors.toSet());
    } else {
      if (isForce
          || (!DISABLE_BACKGROUND_FLUSH
              && !isTestMode()
              && (this.isNeedFlush || flushStartTime - this.lastFlushTime >= flushingInterval))) {
        tablesToFlush = this.channelCache.keySet();
      } else {
        tablesToFlush = null;
      }
    }

    if (isForce
        || (!DISABLE_BACKGROUND_FLUSH
            && !isTestMode()
            && tablesToFlush != null
            && !tablesToFlush.isEmpty())) {
      return this.statsFuture()
          .thenCompose((v) -> this.distributeFlush(isForce, tablesToFlush, flushStartTime))
          .thenCompose((v) -> this.registerFuture());
    }
    return this.statsFuture();
  }
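  // Illustration (not from the library): the per-table trigger in flush() above reduces to a
  // predicate like the following, where lastFlushTime and needFlush would come from the channel
  // cache (shouldFlushTable is a hypothetical helper, shown only to make the three trigger
  // conditions explicit):
  //
  //   boolean shouldFlushTable(boolean isForce, long now, long lastFlushTime,
  //                            boolean needFlush, long maxClientLagMs) {
  //     return isForce                                 // user-forced flush
  //         || now - lastFlushTime >= maxClientLagMs   // periodic background flush
  //         || needFlush;                              // a buffer for this table hit the flush size
  //   }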
  /** Create the workers for each specific job */
  private void createWorkers() {
    // Create thread for checking and scheduling flush job
    ThreadFactory flushThreadFactory =
        new ThreadFactoryBuilder().setNameFormat("ingest-flush-thread").build();
    this.flushWorker = Executors.newSingleThreadScheduledExecutor(flushThreadFactory);
    this.flushWorker.scheduleWithFixedDelay(
        () -> {
          try {
            flush(false)
                .exceptionally(
                    e -> {
                      String errorMessage =
                          String.format(
                              "Background flush task failed, client=%s, exception=%s, detail=%s,"
                                  + " trace=%s.",
                              this.owningClient.getName(),
                              e.getCause(),
                              e.getCause().getMessage(),
                              getStackTrace(e.getCause()));
                      logger.logError(errorMessage);
                      if (this.owningClient.getTelemetryService() != null) {
                        this.owningClient
                            .getTelemetryService()
                            .reportClientFailure(this.getClass().getSimpleName(), errorMessage);
                      }
                      return null;
                    });
          } catch (Exception e) {
            String errorMessage =
                String.format(
                    "Failed to schedule a flush task, client=%s, exception=%s, detail=%s,"
                        + " trace=%s.",
                    this.owningClient.getName(),
                    e.getClass().getName(),
                    e.getMessage(),
                    getStackTrace(e));
            logger.logError(errorMessage);
            if (this.owningClient.getTelemetryService() != null) {
              this.owningClient
                  .getTelemetryService()
                  .reportClientFailure(this.getClass().getSimpleName(), errorMessage);
            }
            throw e;
          }
        },
        0,
        this.owningClient.getParameterProvider().getBufferFlushCheckIntervalInMs(),
        TimeUnit.MILLISECONDS);

    // Create thread for registering blobs
    ThreadFactory registerThreadFactory =
        new ThreadFactoryBuilder().setNameFormat("ingest-register-thread").build();
    this.registerWorker = Executors.newSingleThreadExecutor(registerThreadFactory);

    // Create threads for building and uploading blobs
    // Size: number of available processors * (1 + IO time/CPU time)
    ThreadFactory buildUploadThreadFactory =
        new ThreadFactoryBuilder().setNameFormat("ingest-build-upload-thread-%d").build();
    int buildUploadThreadCount =
        Math.min(
            Runtime.getRuntime().availableProcessors()
                * (1 + this.owningClient.getParameterProvider().getIOTimeCpuRatio()),
            MAX_THREAD_COUNT);
    this.buildUploadWorkers =
        Executors.newFixedThreadPool(buildUploadThreadCount, buildUploadThreadFactory);

    logger.logInfo(
        "Create {} threads for build/upload blobs for client={}, total available processors={}",
        buildUploadThreadCount,
        this.owningClient.getName(),
        Runtime.getRuntime().availableProcessors());
  }
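  // Illustration (not from the library): the build/upload pool above is sized with the classic
  // "N_threads = N_cpu * (1 + wait_time/compute_time)" rule, capped at MAX_THREAD_COUNT. A
  // standalone sketch of the same computation (ioTimeCpuRatio and maxThreads are hypothetical
  // stand-ins for the parameter-provider values):
  //
  //   int poolSize(int ioTimeCpuRatio, int maxThreads) {
  //     int cpus = Runtime.getRuntime().availableProcessors();
  //     return Math.min(cpus * (1 + ioTimeCpuRatio), maxThreads);
  //   }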
  /**
   * Distribute the flush tasks by iterating through all the channels in the channel cache and kick
   * off a build blob work when certain size has reached or we have reached the end
   *
   * @param tablesToFlush list of tables to flush
   */
  void distributeFlushTasks(Set<String> tablesToFlush) {
    Iterator<
            Map.Entry<
                String, ConcurrentHashMap<String, SnowflakeStreamingIngestChannelInternal<T>>>>
        itr =
            this.channelCache.entrySet().stream()
                .filter(e -> tablesToFlush.contains(e.getKey()))
                .iterator();
    List<Pair<BlobData<T>, CompletableFuture<BlobMetadata>>> blobs = new ArrayList<>();
    List<ChannelData<T>> leftoverChannelsDataPerTable = new ArrayList<>();

    // The API states that the number of available processors reported can change and therefore,
    // we should poll it occasionally.
    numProcessors = Runtime.getRuntime().availableProcessors();

    while (itr.hasNext() || !leftoverChannelsDataPerTable.isEmpty()) {
      List<List<ChannelData<T>>> blobData = new ArrayList<>();
      float totalBufferSizeInBytes = 0F;
      final String blobPath = this.storageManager.generateBlobPath();

      // Distribute work at table level, split the blob if reaching the blob size limit or the
      // channel has different encryption key ids
      while (itr.hasNext() || !leftoverChannelsDataPerTable.isEmpty()) {
        List<ChannelData<T>> channelsDataPerTable = Collections.synchronizedList(new ArrayList<>());
        if (!leftoverChannelsDataPerTable.isEmpty()) {
          channelsDataPerTable.addAll(leftoverChannelsDataPerTable);
          leftoverChannelsDataPerTable.clear();
        } else if (blobData.size()
            >= this.owningClient.getParameterProvider().getMaxChunksInBlob()) {
          // Create a new blob if the current one already contains max allowed number of chunks
          logger.logInfo(
              "Max allowed number of chunks in the current blob reached. chunkCount={}"
                  + " maxChunkCount={} currentBlobPath={}",
              blobData.size(),
              this.owningClient.getParameterProvider().getMaxChunksInBlob(),
              blobPath);
          break;
        } else {
          ConcurrentHashMap<String, SnowflakeStreamingIngestChannelInternal<T>> table =
              itr.next().getValue();
          // Use parallel stream since getData could be the performance bottleneck when we have a
          // high number of channels
          table.values().parallelStream()
              .forEach(
                  channel -> {
                    if (channel.isValid()) {
                      ChannelData<T> data = channel.getData();
                      if (data != null) {
                        channelsDataPerTable.add(data);
                      }
                    }
                  });
        }

        if (!channelsDataPerTable.isEmpty()) {
          int idx = 0;
          float totalBufferSizePerTableInBytes = 0F;
          while (idx < channelsDataPerTable.size()) {
            ChannelData<T> channelData = channelsDataPerTable.get(idx);
            // Stop processing the rest of channels when needed
            if (idx > 0
                && shouldStopProcessing(
                    totalBufferSizeInBytes,
                    totalBufferSizePerTableInBytes,
                    channelData,
                    channelsDataPerTable.get(idx - 1))) {
              leftoverChannelsDataPerTable.addAll(
                  channelsDataPerTable.subList(idx, channelsDataPerTable.size()));
              logger.logInfo(
                  "Creation of another blob is needed because of blob/chunk size limit or"
                      + " different encryption ids or different schema, client={}, table={},"
                      + " blobSize={}, chunkSize={}, nextChannelSize={}, encryptionId1={},"
                      + " encryptionId2={}, schema1={}, schema2={}",
                  this.owningClient.getName(),
                  channelData.getChannelContext().getTableName(),
                  totalBufferSizeInBytes,
                  totalBufferSizePerTableInBytes,
                  channelData.getBufferSize(),
                  channelData.getChannelContext().getEncryptionKeyId(),
                  channelsDataPerTable.get(idx - 1).getChannelContext().getEncryptionKeyId(),
                  channelData.getColumnEps().keySet(),
                  channelsDataPerTable.get(idx - 1).getColumnEps().keySet());
              break;
            }
            totalBufferSizeInBytes += channelData.getBufferSize();
            totalBufferSizePerTableInBytes += channelData.getBufferSize();
            idx++;
          }
          // Add processed channels to the current blob, stop if we need to create a new blob
          blobData.add(channelsDataPerTable.subList(0, idx));
          if (idx != channelsDataPerTable.size()) {
            break;
          }
        }
      }

      // Kick off a build job
      if (blobData.isEmpty()) {
        // we decrement the blob sequencer so that we do not have gaps in the blob names created
        // by this client.
        this.storageManager.decrementBlobSequencer();
      } else {
        long flushStartMs = System.currentTimeMillis();
        if (this.owningClient.flushLatency != null) {
          latencyTimerContextMap.putIfAbsent(blobPath, this.owningClient.flushLatency.time());
        }

        blobs.add(
            new Pair<>(
                new BlobData<>(blobPath, blobData),
                CompletableFuture.supplyAsync(
                    () -> {
                      try {
                        // Get the fully qualified table name from the first channel in the blob.
                        // This only matters when the client is in Iceberg mode. In Iceberg mode,
                        // all channels in the blob belong to the same table.
                        String fullyQualifiedTableName =
                            blobData
                                .get(0)
                                .get(0)
                                .getChannelContext()
                                .getFullyQualifiedTableName();
                        BlobMetadata blobMetadata =
                            buildAndUpload(blobPath, blobData, fullyQualifiedTableName);
                        blobMetadata.getBlobStats().setFlushStartMs(flushStartMs);
                        return blobMetadata;
                      } catch (Throwable e) {
                        Throwable ex = e.getCause() == null ? e : e.getCause();
                        String errorMessage =
                            String.format(
                                "Building blob failed, client=%s, blob=%s, exception=%s,"
                                    + " detail=%s, trace=%s, all channels in the blob will be"
                                    + " invalidated",
                                this.owningClient.getName(),
                                blobPath,
                                ex,
                                ex.getMessage(),
                                getStackTrace(ex));
                        logger.logError(errorMessage);
                        if (this.owningClient.getTelemetryService() != null) {
                          this.owningClient
                              .getTelemetryService()
                              .reportClientFailure(this.getClass().getSimpleName(), errorMessage);
                        }

                        if (e instanceof IOException) {
                          invalidateAllChannelsInBlob(blobData, errorMessage);
                          return null;
                        } else if (e instanceof NoSuchAlgorithmException) {
                          throw new SFException(e, ErrorCode.MD5_HASHING_NOT_AVAILABLE);
                        } else if (e instanceof InvalidAlgorithmParameterException
                            || e instanceof NoSuchPaddingException
                            || e instanceof IllegalBlockSizeException
                            || e instanceof BadPaddingException
                            || e instanceof InvalidKeyException) {
                          throw new SFException(e, ErrorCode.ENCRYPTION_FAILURE);
                        } else {
                          throw new SFException(e, ErrorCode.INTERNAL_ERROR, e.getMessage());
                        }
                      }
                    },
                    this.buildUploadWorkers)));

        logger.logInfo(
            "buildAndUpload task added for client={}, blob={}, buildUploadWorkers stats={}",
            this.owningClient.getName(),
            blobPath,
            this.buildUploadWorkers.toString());
      }
    }

    // Add the flush task futures to the register service
    this.registerService.addBlobs(blobs);
  }
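  // Illustration (not from the library): the nested loops in distributeFlushTasks() above are
  // essentially a greedy split, packing per-table chunks into a blob until a size/compatibility
  // limit is hit and carrying the remainder over to the next blob. A simplified, hypothetical
  // sketch of that packing with plain chunk sizes:
  //
  //   List<List<Float>> packBlobs(List<Float> chunkSizes, float maxBlobSize) {
  //     List<List<Float>> blobs = new ArrayList<>();
  //     List<Float> current = new ArrayList<>();
  //     float size = 0F;
  //     for (float chunk : chunkSizes) {
  //       if (!current.isEmpty() && size + chunk > maxBlobSize) {
  //         blobs.add(current);        // close the current blob
  //         current = new ArrayList<>();
  //         size = 0F;
  //       }
  //       current.add(chunk);
  //       size += chunk;
  //     }
  //     if (!current.isEmpty()) blobs.add(current);
  //     return blobs;
  //   }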

  /**
   * Check whether we should stop merging more channels into the same chunk, we need to stop in a
   * few cases:
   *
   * <p>When the blob size is larger than a certain threshold
   *
   * <p>When the chunk size is larger than a certain threshold
   *
   * <p>When the encryption key ids are not the same
   *
   * <p>When the schemas are not the same
   */
  private boolean shouldStopProcessing(
      float totalBufferSizeInBytes,
      float totalBufferSizePerTableInBytes,
      ChannelData<T> current,
      ChannelData<T> prev) {
    return totalBufferSizeInBytes + current.getBufferSize() > MAX_BLOB_SIZE_IN_BYTES
        || totalBufferSizePerTableInBytes + current.getBufferSize()
            > this.owningClient.getParameterProvider().getMaxChunkSizeInBytes()
        || !Objects.equals(
            current.getChannelContext().getEncryptionKeyId(),
            prev.getChannelContext().getEncryptionKeyId())
        || !current.getColumnEps().keySet().equals(prev.getColumnEps().keySet());
  }

  /**
   * Builds and uploads blob to cloud storage.
   *
   * @param blobPath Path of the destination blob in cloud storage
   * @param blobData All the data for one blob. Assumes that all ChannelData in the inner List
   *     belongs to the same table. Will error if this is not the case
   * @param fullyQualifiedTableName the table name of the first channel in the blob, only matters
   *     in Iceberg mode
   * @return BlobMetadata for FlushService.upload
   */
  BlobMetadata buildAndUpload(
      String blobPath, List<List<ChannelData<T>>> blobData, String fullyQualifiedTableName)
      throws IOException, NoSuchAlgorithmException, InvalidAlgorithmParameterException,
          NoSuchPaddingException, IllegalBlockSizeException, BadPaddingException,
          InvalidKeyException {
    Timer.Context buildContext = Utils.createTimerContext(this.owningClient.buildLatency);

    // Construct the blob along with the metadata of the blob
    BlobBuilder.Blob blob =
        BlobBuilder.constructBlobAndMetadata(
            blobPath,
            blobData,
            bdecVersion,
            this.owningClient.getInternalParameterProvider().getEnableChunkEncryption());

    blob.blobStats.setBuildDurationMs(buildContext);

    return upload(
        this.storageManager.getStorage(fullyQualifiedTableName),
        blobPath,
        blob.blobBytes,
        blob.chunksMetadataList,
        blob.blobStats);
  }

  /**
   * Upload a blob to Streaming Ingest dedicated stage
   *
   * @param storage the storage to upload the blob
   * @param blobPath full path of the blob
   * @param blob blob data
   * @param metadata a list of chunk metadata
   * @param blobStats an object to track latencies and other stats of the blob
   * @return BlobMetadata object used to create the register blob request
   */
  BlobMetadata upload(
      StreamingIngestStorage storage,
      String blobPath,
      byte[] blob,
      List<ChunkMetadata> metadata,
      BlobStats blobStats)
      throws NoSuchAlgorithmException {
    logger.logInfo("Start uploading blob={}, size={}", blobPath, blob.length);
    long startTime = System.currentTimeMillis();

    Timer.Context uploadContext = Utils.createTimerContext(this.owningClient.uploadLatency);

    storage.put(blobPath, blob);

    if (uploadContext != null) {
      blobStats.setUploadDurationMs(uploadContext);
      this.owningClient.uploadThroughput.mark(blob.length);
      this.owningClient.blobSizeHistogram.update(blob.length);
      this.owningClient.blobRowCountHistogram.update(
          metadata.stream().mapToLong(i -> i.getEpInfo().getRowCount()).sum());
    }

    logger.logInfo(
        "Finish uploading blob={}, size={}, timeInMillis={}",
        blobPath,
        blob.length,
        System.currentTimeMillis() - startTime);

    // at this point we know for sure if the BDEC file has data for more than one chunk, i.e.
    // spans mixed tables or not
    return BlobMetadata.createBlobMetadata(
        blobPath,
        BlobBuilder.computeMD5(blob),
        bdecVersion,
        metadata,
        blobStats,
        metadata == null ? false : metadata.size() > 1);
  }
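  // Illustration (not from the library): buildAndUpload()/upload() above time each phase with
  // Dropwizard Metrics timers (com.codahale.metrics). The underlying pattern, standalone, is
  // simply (registry and timer names are hypothetical):
  //
  //   MetricRegistry registry = new MetricRegistry();
  //   Timer uploadLatency = registry.timer("upload.latency");
  //   Timer.Context ctx = uploadLatency.time();
  //   try {
  //     // ... perform the upload ...
  //   } finally {
  //     ctx.stop(); // records the elapsed time into the timer's histogram
  //   }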
  /**
   * Release all resources
   *
   * @throws InterruptedException
   */
  void shutdown() throws InterruptedException {
    this.flushWorker.shutdown();
    this.registerWorker.shutdown();
    this.buildUploadWorkers.shutdown();

    boolean isTerminated =
        this.flushWorker.awaitTermination(THREAD_SHUTDOWN_TIMEOUT_IN_SEC, TimeUnit.SECONDS)
            && this.registerWorker.awaitTermination(
                THREAD_SHUTDOWN_TIMEOUT_IN_SEC, TimeUnit.SECONDS)
            && this.buildUploadWorkers.awaitTermination(
                THREAD_SHUTDOWN_TIMEOUT_IN_SEC, TimeUnit.SECONDS);

    if (!isTerminated) {
      logger.logWarn("Tasks can't be terminated within the timeout, force shutdown now.");
      this.flushWorker.shutdownNow();
      this.registerWorker.shutdownNow();
      this.buildUploadWorkers.shutdownNow();
    }
  }

  /**
   * Set the flag to indicate that a flush is needed
   *
   * @param fullyQualifiedTableName the fully qualified table name
   */
  void setNeedFlush(String fullyQualifiedTableName) {
    this.isNeedFlush = true;
    if (this.owningClient.getParameterProvider().getMaxChunksInBlob() == 1) {
      this.channelCache.setNeedFlush(fullyQualifiedTableName, true);
    }
  }

  /**
   * Invalidate all the channels in the blob data
   *
   * @param blobData list of channels that belongs to the blob
   */
  void invalidateAllChannelsInBlob(
      List<List<ChannelData<T>>> blobData, String invalidationCause) {
    blobData.forEach(
        chunkData ->
            chunkData.forEach(
                channelData -> {
                  this.owningClient
                      .getChannelCache()
                      .invalidateChannelIfSequencersMatch(
                          channelData.getChannelContext().getDbName(),
                          channelData.getChannelContext().getSchemaName(),
                          channelData.getChannelContext().getTableName(),
                          channelData.getChannelContext().getName(),
                          channelData.getChannelContext().getChannelSequencer(),
                          invalidationCause);
                }));
  }

  /**
   * Throttle if the number of queued buildAndUpload tasks is bigger than the total number of
   * available processors
   */
  boolean throttleDueToQueuedFlushTasks() {
    ThreadPoolExecutor buildAndUpload = (ThreadPoolExecutor) this.buildUploadWorkers;
    boolean throttleOnQueuedTasks = buildAndUpload.getQueue().size() > numProcessors;
    if (throttleOnQueuedTasks) {
      logger.logWarn(
          "Throttled due to too many queued flush tasks (probably because of slow uploading"
              + " speed), client={}, buildUploadWorkers stats={}",
          this.owningClient.getName(),
          this.buildUploadWorkers.toString());
    }
    return throttleOnQueuedTasks;
  }

  /** Get whether we're running under test mode */
  boolean isTestMode() {
    return this.isTestMode;
  }
}




