
// Artifact: org.dinky.shaded.paimon.mergetree.compact.UniversalCompaction (Maven / Gradle / Ivy)
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.dinky.shaded.paimon.mergetree.compact;
import org.dinky.shaded.paimon.annotation.VisibleForTesting;
import org.dinky.shaded.paimon.compact.CompactUnit;
import org.dinky.shaded.paimon.mergetree.LevelSortedRun;
import org.dinky.shaded.paimon.mergetree.SortedRun;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.util.List;
import java.util.Optional;
/**
 * Universal Compaction Style is a compaction style, targeting the use cases requiring lower write
 * amplification, trading off read amplification and space amplification.
 *
 * <p>See RocksDb Universal-Compaction:
 * https://github.com/facebook/rocksdb/wiki/Universal-Compaction.
 *
 * <p>{@link #pick(int, List)} evaluates three triggers in order and returns the first unit found:
 * size amplification, size ratio, and number of sorted runs.
 */
public class UniversalCompaction implements CompactStrategy {

    private static final Logger LOG = LoggerFactory.getLogger(UniversalCompaction.class);

    /** Size amplification threshold, in percent, used by {@link #pickForSizeAmp(int, List)}. */
    private final int maxSizeAmp;

    /** Extra tolerance, in percent, applied when comparing candidate size to the next run. */
    private final int sizeRatio;

    /** Number of sorted runs at which the compaction checks start to apply. */
    private final int numRunCompactionTrigger;

    /**
     * Creates a universal compaction strategy.
     *
     * @param maxSizeAmp size amplification threshold in percent
     * @param sizeRatio size ratio tolerance in percent
     * @param numRunCompactionTrigger run count that triggers the compaction checks
     */
    public UniversalCompaction(int maxSizeAmp, int sizeRatio, int numRunCompactionTrigger) {
        this.maxSizeAmp = maxSizeAmp;
        this.sizeRatio = sizeRatio;
        this.numRunCompactionTrigger = numRunCompactionTrigger;
    }

    /**
     * Picks the runs to compact, if any.
     *
     * @param numLevels total number of levels; the highest output level is {@code numLevels - 1}
     * @param runs the current sorted runs; the last element is treated as the earliest run
     * @return the unit to compact, or empty when no trigger fires
     */
    @Override
    public Optional<CompactUnit> pick(int numLevels, List<LevelSortedRun> runs) {
        int maxLevel = numLevels - 1;

        // 1 checking for reducing size amplification
        CompactUnit unit = pickForSizeAmp(maxLevel, runs);
        if (unit != null) {
            LOG.debug("Universal compaction due to size amplification");
            return Optional.of(unit);
        }

        // 2 checking for size ratio
        unit = pickForSizeRatio(maxLevel, runs);
        if (unit != null) {
            LOG.debug("Universal compaction due to size ratio");
            return Optional.of(unit);
        }

        // 3 checking for file num
        if (runs.size() > numRunCompactionTrigger) {
            // Seed the candidate set with enough leading runs that compacting them brings the
            // run count back down to the trigger.
            int candidateCount = runs.size() - numRunCompactionTrigger + 1;
            LOG.debug("Universal compaction due to file num");
            return Optional.ofNullable(pickForSizeRatio(maxLevel, runs, candidateCount));
        }

        return Optional.empty();
    }

    /**
     * Picks all runs for a full compaction when size amplification is too high.
     *
     * <p>The total size of every run except the last is compared against the size of the last run;
     * the check fires when {@code candidateSize * 100 > maxSizeAmp * lastRunSize}.
     *
     * @param maxLevel output level used for the resulting unit
     * @param runs the current sorted runs
     * @return a unit covering all runs, or {@code null} when {@code runs} is empty, has fewer than
     *     {@code numRunCompactionTrigger} elements, or the amplification is within the threshold
     */
    @VisibleForTesting
    CompactUnit pickForSizeAmp(int maxLevel, List<LevelSortedRun> runs) {
        // The empty check keeps subList(0, -1) from throwing when the trigger is <= 0.
        if (runs.isEmpty() || runs.size() < numRunCompactionTrigger) {
            return null;
        }

        long candidateSize =
                runs.subList(0, runs.size() - 1).stream()
                        .map(LevelSortedRun::run)
                        .mapToLong(SortedRun::totalSize)
                        .sum();

        long earliestRunSize = runs.get(runs.size() - 1).run().totalSize();

        // size amplification = percentage of additional size
        if (candidateSize * 100 > maxSizeAmp * earliestRunSize) {
            return CompactUnit.fromLevelRuns(maxLevel, runs);
        }

        return null;
    }

    /**
     * Picks a prefix of runs by size ratio, starting from the first run only.
     *
     * @param maxLevel highest level a unit may be written to
     * @param runs the current sorted runs
     * @return a unit covering at least two runs, or {@code null} when {@code runs} is empty, has
     *     fewer than {@code numRunCompactionTrigger} elements, or no second run qualifies
     */
    @VisibleForTesting
    CompactUnit pickForSizeRatio(int maxLevel, List<LevelSortedRun> runs) {
        // The empty check keeps runs.get(0) from throwing when the trigger is <= 0.
        if (runs.isEmpty() || runs.size() < numRunCompactionTrigger) {
            return null;
        }

        return pickForSizeRatio(maxLevel, runs, 1);
    }

    /** Same as the four-argument overload with {@code forcePick} set to {@code false}. */
    private CompactUnit pickForSizeRatio(
            int maxLevel, List<LevelSortedRun> runs, int candidateCount) {
        return pickForSizeRatio(maxLevel, runs, candidateCount, false);
    }

    /**
     * Picks a prefix of runs by size ratio.
     *
     * <p>Starting with the first {@code candidateCount} runs, each following run is added while
     * {@code candidateSize * (100 + sizeRatio) / 100} is not smaller than that run's size.
     *
     * @param maxLevel highest level a unit may be written to
     * @param runs the current sorted runs
     * @param candidateCount number of leading runs that are always part of the candidate set; must
     *     not exceed {@code runs.size()}
     * @param forcePick when {@code true}, a unit is created even if only one run was selected
     * @return the picked unit, or {@code null} when a single run was selected and {@code forcePick}
     *     is {@code false}
     */
    public CompactUnit pickForSizeRatio(
            int maxLevel, List<LevelSortedRun> runs, int candidateCount, boolean forcePick) {
        long candidateSize = candidateSize(runs, candidateCount);
        for (int i = candidateCount; i < runs.size(); i++) {
            LevelSortedRun next = runs.get(i);
            if (candidateSize * (100.0 + sizeRatio) / 100.0 < next.run().totalSize()) {
                break;
            }

            candidateSize += next.run().totalSize();
            candidateCount++;
        }

        if (forcePick || candidateCount > 1) {
            return createUnit(runs, maxLevel, candidateCount);
        }

        return null;
    }

    /** Sums the total size of the first {@code candidateCount} runs. */
    private long candidateSize(List<LevelSortedRun> runs, int candidateCount) {
        long size = 0;
        for (int i = 0; i < candidateCount; i++) {
            size += runs.get(i).run().totalSize();
        }
        return size;
    }

    /**
     * Builds a unit from the first {@code runCount} runs and decides its output level.
     *
     * <p>The output level is one below the level of the first run left out. If that would be level
     * 0, further runs are pulled in until one with a non-zero level is included, and its level
     * becomes the output level. Whenever all runs end up included, the output level is {@code
     * maxLevel}.
     *
     * @param runs the current sorted runs
     * @param maxLevel highest level a unit may be written to
     * @param runCount number of leading runs initially selected
     * @return the unit covering the selected prefix of {@code runs}
     */
    @VisibleForTesting
    static CompactUnit createUnit(List<LevelSortedRun> runs, int maxLevel, int runCount) {
        int outputLevel;
        if (runCount == runs.size()) {
            outputLevel = maxLevel;
        } else {
            // level of next run - 1
            outputLevel = Math.max(0, runs.get(runCount).level() - 1);
        }

        if (outputLevel == 0) {
            // do not output level 0
            for (int i = runCount; i < runs.size(); i++) {
                LevelSortedRun next = runs.get(i);
                // The inspected run always joins the unit, including the one that ends the scan.
                runCount++;
                if (next.level() != 0) {
                    outputLevel = next.level();
                    break;
                }
            }
        }

        // The scan above may have consumed every run; that is a full compaction.
        if (runCount == runs.size()) {
            outputLevel = maxLevel;
        }

        return CompactUnit.fromLevelRuns(outputLevel, runs.subList(0, runCount));
    }
}