All downloads are free. Search and download functionality uses the official Maven repository.

com.netease.arctic.scan.BasicArcticFileScanTask Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.netease.arctic.scan;

import com.netease.arctic.data.DataTreeNode;
import com.netease.arctic.data.DefaultKeyedFile;
import com.netease.arctic.data.PrimaryKeyedFile;
import com.netease.arctic.data.file.FileNameGenerator;
import com.netease.arctic.shade.org.apache.iceberg.DeleteFile;
import com.netease.arctic.shade.org.apache.iceberg.FileScanTask;
import com.netease.arctic.shade.org.apache.iceberg.PartitionSpec;
import com.netease.arctic.shade.org.apache.iceberg.expressions.Expression;
import com.netease.arctic.shade.org.apache.iceberg.expressions.Expressions;

import java.util.Collections;
import java.util.List;
import java.util.stream.Collectors;

/**
 * Basic implementation of {@link ArcticFileScanTask}.
 *
 * <p>An instance holds a base file, the position-delete files whose file-name tree node has the
 * same index and mask as the base file's node, a partition spec and a residual expression.
 * When the instance wraps an iceberg {@link FileScanTask}, {@link #start()} and
 * {@link #length()} are delegated to the wrapped task.
 */
public class BasicArcticFileScanTask implements ArcticFileScanTask {

  private final PrimaryKeyedFile baseFile;

  private final List<DeleteFile> posDeleteFiles;

  private final PartitionSpec spec;

  private final Expression expression;

  /** Wrapped iceberg task; {@code null} unless created through the iceberg-wrap constructor. */
  private final FileScanTask fileScanTask;

  /**
   * Creates a task whose residual expression is {@link Expressions#alwaysTrue()}.
   *
   * @param baseFile the file to scan
   * @param posDeleteFiles candidate position-delete files, may be {@code null}
   * @param spec the partition spec returned by {@link #spec()}
   */
  public BasicArcticFileScanTask(
      PrimaryKeyedFile baseFile, List<DeleteFile> posDeleteFiles, PartitionSpec spec) {
    this(baseFile, posDeleteFiles, spec, Expressions.alwaysTrue());
  }

  /**
   * Creates a task with an explicit residual expression.
   *
   * @param baseFile the file to scan
   * @param posDeleteFiles candidate position-delete files, may be {@code null}; only those whose
   *     file-name node matches the node of {@code baseFile} are kept
   * @param spec the partition spec returned by {@link #spec()}
   * @param expression the expression returned by {@link #residual()}
   */
  public BasicArcticFileScanTask(
      PrimaryKeyedFile baseFile, List<DeleteFile> posDeleteFiles, PartitionSpec spec,
      Expression expression) {
    this(baseFile, posDeleteFiles, spec, expression, null);
  }

  /**
   * Only for iceberg wrap.
   *
   * @param fileScanTask the iceberg task to wrap; its file, deletes, spec and residual are used
   *     to initialize this task, and its start and length are reported by this task
   */
  public BasicArcticFileScanTask(FileScanTask fileScanTask) {
    this(DefaultKeyedFile.parseBase(fileScanTask.file()), fileScanTask.deletes(),
        fileScanTask.spec(), fileScanTask.residual(), fileScanTask);
  }

  /**
   * Single initialization point shared by the public constructors, so every field can be final.
   */
  private BasicArcticFileScanTask(
      PrimaryKeyedFile baseFile, List<DeleteFile> posDeleteFiles, PartitionSpec spec,
      Expression expression, FileScanTask fileScanTask) {
    this.baseFile = baseFile;
    this.posDeleteFiles = matchingDeletes(baseFile, posDeleteFiles);
    this.spec = spec;
    this.expression = expression;
    this.fileScanTask = fileScanTask;
  }

  /**
   * Keeps only the delete files whose node, parsed from the file name, has the same index and
   * mask as the node of the base file.
   *
   * @return an empty list when {@code candidates} is {@code null}, otherwise the filtered list
   */
  private static List<DeleteFile> matchingDeletes(
      PrimaryKeyedFile baseFile, List<DeleteFile> candidates) {
    if (candidates == null) {
      return Collections.emptyList();
    }
    return candidates.stream()
        .filter(deleteFile -> {
          DataTreeNode deleteNode =
              FileNameGenerator.parseFileNodeFromFileName(deleteFile.path().toString());
          // The base node is looked up inside the predicate so that an empty candidate list
          // never touches baseFile.
          DataTreeNode baseNode = baseFile.node();
          return deleteNode.index() == baseNode.index() && deleteNode.mask() == baseNode.mask();
        })
        .collect(Collectors.toList());
  }

  /**
   * @return the base file given at construction
   */
  @Override
  public PrimaryKeyedFile file() {
    return baseFile;
  }

  /**
   * @return the position-delete files retained for the base file; never {@code null}
   */
  @Override
  public List<DeleteFile> deletes() {
    return posDeleteFiles;
  }

  /**
   * @return the partition spec given at construction
   */
  @Override
  public PartitionSpec spec() {
    return spec;
  }

  /**
   * @return the start of the wrapped iceberg task when present, otherwise {@code 0}
   */
  @Override
  public long start() {
    if (fileScanTask != null) {
      return fileScanTask.start();
    }
    return 0;
  }

  /**
   * @return the length of the wrapped iceberg task when present, otherwise the size in bytes of
   *     the base file
   */
  @Override
  public long length() {
    if (fileScanTask != null) {
      return fileScanTask.length();
    }
    return baseFile.fileSizeInBytes();
  }

  /**
   * @return the residual expression given at construction
   */
  @Override
  public Expression residual() {
    return expression;
  }

  /**
   * Splitting is not supported by this task.
   *
   * @throws UnsupportedOperationException always
   */
  @Override
  public Iterable<FileScanTask> split(long splitSize) {
    throw new UnsupportedOperationException("Unsupported split");
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy