// org.dinky.shaded.paimon.table.system.ManifestsTable (Maven / Gradle / Ivy)
// The newest version!
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.dinky.shaded.paimon.table.system;
import org.dinky.shaded.paimon.CoreOptions;
import org.dinky.shaded.paimon.Snapshot;
import org.dinky.shaded.paimon.data.BinaryString;
import org.dinky.shaded.paimon.data.GenericRow;
import org.dinky.shaded.paimon.data.InternalRow;
import org.dinky.shaded.paimon.disk.IOManager;
import org.dinky.shaded.paimon.format.FileFormat;
import org.dinky.shaded.paimon.fs.FileIO;
import org.dinky.shaded.paimon.fs.Path;
import org.dinky.shaded.paimon.manifest.ManifestFileMeta;
import org.dinky.shaded.paimon.manifest.ManifestList;
import org.dinky.shaded.paimon.predicate.Predicate;
import org.dinky.shaded.paimon.reader.RecordReader;
import org.dinky.shaded.paimon.table.ReadonlyTable;
import org.dinky.shaded.paimon.table.Table;
import org.dinky.shaded.paimon.table.source.InnerTableRead;
import org.dinky.shaded.paimon.table.source.InnerTableScan;
import org.dinky.shaded.paimon.table.source.ReadOnceTableScan;
import org.dinky.shaded.paimon.table.source.Split;
import org.dinky.shaded.paimon.table.source.TableRead;
import org.dinky.shaded.paimon.types.BigIntType;
import org.dinky.shaded.paimon.types.DataField;
import org.dinky.shaded.paimon.types.RowType;
import org.dinky.shaded.paimon.utils.FileStorePathFactory;
import org.dinky.shaded.paimon.utils.IteratorRecordReader;
import org.dinky.shaded.paimon.utils.ProjectedRow;
import org.dinky.shaded.paimon.utils.SerializationUtils;
import org.dinky.shaded.paimon.utils.SnapshotManager;
import org.dinky.shaded.paimon.shade.guava30.com.google.common.collect.Iterators;
import java.io.IOException;
import java.util.Arrays;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import static org.dinky.shaded.paimon.catalog.Catalog.SYSTEM_TABLE_SPLITTER;
/**
 * A {@link Table} for showing the manifest files referenced by a snapshot of a table.
 *
 * <p>Each row describes one {@link ManifestFileMeta}; see {@link #TABLE_TYPE} for the columns.
 * The snapshot is the one selected by the data table's scan snapshot id option when it is set,
 * otherwise the latest snapshot found under the table location.
 */
public class ManifestsTable implements ReadonlyTable {

    private static final long serialVersionUID = 1L;

    /** Suffix appended (after the system table splitter) to the data table name. */
    public static final String MANIFESTS = "manifests";

    /** Row type of this system table; every column is declared non-nullable. */
    public static final RowType TABLE_TYPE =
            new RowType(
                    Arrays.asList(
                            new DataField(0, "file_name", SerializationUtils.newStringType(false)),
                            new DataField(1, "file_size", new BigIntType(false)),
                            new DataField(2, "num_added_files", new BigIntType(false)),
                            new DataField(3, "num_deleted_files", new BigIntType(false)),
                            new DataField(4, "schema_id", new BigIntType(false))));

    private final FileIO fileIO;
    private final Path location;
    private final Table dataTable;

    /**
     * Creates the manifests view of a data table.
     *
     * @param fileIO file system access used to read snapshot and manifest list files
     * @param location root path of the data table
     * @param dataTable the table whose manifests are listed; its options select the snapshot
     */
    public ManifestsTable(FileIO fileIO, Path location, Table dataTable) {
        this.fileIO = fileIO;
        this.location = location;
        this.dataTable = dataTable;
    }

    @Override
    public InnerTableScan newScan() {
        return new ManifestsScan();
    }

    @Override
    public InnerTableRead newRead() {
        return new ManifestsRead(fileIO, dataTable);
    }

    /** Returns the last component of the table location, the splitter and {@link #MANIFESTS}. */
    @Override
    public String name() {
        return location.getName() + SYSTEM_TABLE_SPLITTER + MANIFESTS;
    }

    @Override
    public RowType rowType() {
        return TABLE_TYPE;
    }

    /** The manifest file name is the only primary key column. */
    @Override
    public List<String> primaryKeys() {
        return Collections.singletonList("file_name");
    }

    /** Returns a new manifests table backed by a copy of the data table with the given options. */
    @Override
    public Table copy(Map<String, String> dynamicOptions) {
        return new ManifestsTable(fileIO, location, dataTable.copy(dynamicOptions));
    }

    /** Scan that always plans exactly one {@link ManifestsSplit} for the enclosing table. */
    private class ManifestsScan extends ReadOnceTableScan {

        @Override
        public InnerTableScan withFilter(Predicate predicate) {
            // TODO: filter push-down is not implemented; the predicate is ignored.
            return this;
        }

        @Override
        protected Plan innerPlan() {
            return () -> Collections.singletonList(new ManifestsSplit(fileIO, location, dataTable));
        }
    }

    /** The single split of a manifests table; it carries what is needed to list the manifests. */
    private static class ManifestsSplit implements Split {

        private static final long serialVersionUID = 1L;

        private final FileIO fileIO;
        private final Path location;
        private final Table dataTable;

        private ManifestsSplit(FileIO fileIO, Path location, Table dataTable) {
            this.fileIO = fileIO;
            this.location = location;
            this.dataTable = dataTable;
        }

        /** Resolves the manifests again on every call and returns how many there are. */
        @Override
        public long rowCount() {
            return allManifests(fileIO, location, dataTable).size();
        }

        /** Two splits are equal when they point at the same table location. */
        @Override
        public boolean equals(Object o) {
            if (this == o) {
                return true;
            }
            if (o == null || getClass() != o.getClass()) {
                return false;
            }
            ManifestsSplit that = (ManifestsSplit) o;
            return Objects.equals(location, that.location);
        }

        @Override
        public int hashCode() {
            return Objects.hash(location);
        }
    }

    /** Reader that turns each {@link ManifestFileMeta} of the snapshot into one row. */
    private static class ManifestsRead implements InnerTableRead {

        /** Optional projection applied to each produced row; {@code null} means no projection. */
        private int[][] projection;

        private final FileIO fileIO;
        private final Table dataTable;

        public ManifestsRead(FileIO fileIO, Table dataTable) {
            this.fileIO = fileIO;
            this.dataTable = dataTable;
        }

        @Override
        public InnerTableRead withFilter(Predicate predicate) {
            // TODO: filtering is not implemented; the predicate is ignored.
            return this;
        }

        @Override
        public InnerTableRead withProjection(int[][] projection) {
            this.projection = projection;
            return this;
        }

        @Override
        public TableRead withIOManager(IOManager ioManager) {
            // The IO manager is not used by this read.
            return this;
        }

        /**
         * Creates a reader over the manifests of the snapshot selected for the split's table.
         *
         * @param split must be a {@link ManifestsSplit}
         * @return a reader producing one row per manifest file, projected if a projection was set
         * @throws IllegalArgumentException if {@code split} is of any other type
         */
        @Override
        public RecordReader<InternalRow> createReader(Split split) throws IOException {
            if (!(split instanceof ManifestsSplit)) {
                throw new IllegalArgumentException("Unsupported split: " + split.getClass());
            }
            Path location = ((ManifestsSplit) split).location;
            List<ManifestFileMeta> manifestFileMetas = allManifests(fileIO, location, dataTable);

            Iterator<InternalRow> rows =
                    Iterators.transform(manifestFileMetas.iterator(), this::toRow);
            if (projection != null) {
                // A fresh ProjectedRow wrapper is created for every row, as in the original code.
                rows =
                        Iterators.transform(
                                rows, row -> ProjectedRow.from(projection).replaceRow(row));
            }
            return new IteratorRecordReader<>(rows);
        }

        /** Maps a manifest meta to a row laid out in the column order of {@link #TABLE_TYPE}. */
        private InternalRow toRow(ManifestFileMeta manifestFileMeta) {
            return GenericRow.of(
                    BinaryString.fromString(manifestFileMeta.fileName()),
                    manifestFileMeta.fileSize(),
                    manifestFileMeta.numAddedFiles(),
                    manifestFileMeta.numDeletedFiles(),
                    manifestFileMeta.schemaId());
        }
    }

    /**
     * Lists all manifest files of the snapshot selected by the data table's options.
     *
     * <p>If a scan snapshot id is configured, that snapshot is used when it exists; if none is
     * configured, the latest snapshot is used.
     *
     * @return the manifests of the resolved snapshot, or an empty list when no snapshot could be
     *     resolved (the configured snapshot does not exist, or no latest snapshot was returned)
     */
    private static List<ManifestFileMeta> allManifests(
            FileIO fileIO, Path location, Table dataTable) {
        CoreOptions coreOptions = CoreOptions.fromMap(dataTable.options());
        SnapshotManager snapshotManager = new SnapshotManager(fileIO, location);
        Long snapshotId = coreOptions.scanSnapshotId();

        Snapshot snapshot = null;
        if (snapshotId == null) {
            snapshot = snapshotManager.latestSnapshot();
        } else if (snapshotManager.snapshotExists(snapshotId)) {
            snapshot = snapshotManager.snapshot(snapshotId);
        }

        if (snapshot == null) {
            return Collections.emptyList();
        }

        FileStorePathFactory fileStorePathFactory = new FileStorePathFactory(location);
        FileFormat fileFormat = coreOptions.manifestFormat();
        // NOTE(review): the last factory argument is left null as in the original; it is
        // presumably an optional cache - confirm against ManifestList.Factory.
        ManifestList manifestList =
                new ManifestList.Factory(fileIO, fileFormat, fileStorePathFactory, null).create();
        return snapshot.allManifests(manifestList);
    }
}