com.facebook.presto.verifier.resolver.StructuredColumnMismatchResolver Maven / Gradle / Ivy
The newest version!
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.verifier.resolver;
import com.facebook.presto.common.type.ArrayType;
import com.facebook.presto.common.type.DoubleType;
import com.facebook.presto.common.type.MapType;
import com.facebook.presto.common.type.RealType;
import com.facebook.presto.common.type.RowType;
import com.facebook.presto.common.type.Type;
import com.facebook.presto.verifier.checksum.ArrayColumnChecksum;
import com.facebook.presto.verifier.checksum.ColumnMatchResult;
import com.facebook.presto.verifier.checksum.MapColumnChecksum;
import com.facebook.presto.verifier.checksum.StructureColumnChecksum;
import com.facebook.presto.verifier.framework.DataMatchResult;
import com.facebook.presto.verifier.framework.QueryBundle;
import java.util.Objects;
import java.util.Optional;
import static com.facebook.presto.common.type.RowType.Field;
import static com.facebook.presto.verifier.framework.DataMatchResult.MatchType.COLUMN_MISMATCH;
import static com.google.common.base.Preconditions.checkArgument;
public class StructuredColumnMismatchResolver
implements FailureResolver
{
public static final String NAME = "structured-column";
@Override
public Optional resolveResultMismatch(DataMatchResult matchResult, QueryBundle control)
{
checkArgument(!matchResult.isMatched(), "Expect not matched");
if (matchResult.getMatchType() != COLUMN_MISMATCH) {
return Optional.empty();
}
for (ColumnMatchResult> mismatchedColumn : matchResult.getMismatchedColumns()) {
Type columnType = mismatchedColumn.getColumn().getType();
if (columnType instanceof ArrayType) {
ArrayColumnChecksum controlChecksum = (ArrayColumnChecksum) mismatchedColumn.getControlChecksum();
ArrayColumnChecksum testChecksum = (ArrayColumnChecksum) mismatchedColumn.getTestChecksum();
// If this checksum is null then we have FloatingPointColumnChecksum as part of the ArrayColumnChecksum,
// which tackles the floating point imprecision. So we don't resolve.
if (Objects.isNull(controlChecksum.getChecksum())) {
return Optional.empty();
}
if (!containsFloatingPointType(((ArrayType) columnType).getElementType())
|| !isCardinalityMatched(controlChecksum, testChecksum)) {
return Optional.empty();
}
}
else if (columnType instanceof MapType) {
MapColumnChecksum controlChecksum = (MapColumnChecksum) mismatchedColumn.getControlChecksum();
MapColumnChecksum testChecksum = (MapColumnChecksum) mismatchedColumn.getTestChecksum();
// Cardinality mismatch. Do not resolve.
if (!isCardinalityMatched(controlChecksum, testChecksum)) {
return Optional.empty();
}
boolean keyContainsFloatingPoint = containsFloatingPointType(((MapType) columnType).getKeyType());
boolean valueContainsFloatingPoint = containsFloatingPointType(((MapType) columnType).getValueType());
// No pure floating point types. Do not resolve.
if (!keyContainsFloatingPoint && !valueContainsFloatingPoint) {
return Optional.empty();
}
// Not-floating point keys mismatch. Do not resolve.
if (!keyContainsFloatingPoint &&
!Objects.equals(controlChecksum.getKeysChecksum(), testChecksum.getKeysChecksum())) {
return Optional.empty();
}
// Not-floating point values.
if (!valueContainsFloatingPoint) {
// If we got values checksums and they are not matching, then do not resolve.
if (!Objects.equals(controlChecksum.getValuesChecksum(), testChecksum.getValuesChecksum())) {
return Optional.empty();
}
// Values checksums either match or missing (being nulls).
// They can be missing because omitted or in corner cases of no rows, null maps, no elements, etc.
// Checking the whole checksum if the values checksums are missing.
if (Objects.isNull(controlChecksum.getValuesChecksum())) {
if (!Objects.equals(controlChecksum.getChecksum(), testChecksum.getChecksum())) {
return Optional.empty();
}
}
}
}
else {
return Optional.empty();
}
}
return Optional.of("Structured columns auto-resolved");
}
private static boolean containsFloatingPointType(Type type)
{
if (type instanceof DoubleType || type instanceof RealType) {
return true;
}
if (type instanceof ArrayType) {
return containsFloatingPointType(((ArrayType) type).getElementType());
}
if (type instanceof MapType) {
return containsFloatingPointType(((MapType) type).getKeyType()) || containsFloatingPointType(((MapType) type).getValueType());
}
if (type instanceof RowType) {
for (Field field : ((RowType) type).getFields()) {
if (containsFloatingPointType(field.getType())) {
return true;
}
}
return false;
}
return false;
}
private static boolean isCardinalityMatched(T controlChecksum, T testChecksum)
{
return Objects.equals(controlChecksum.getCardinalityChecksum(), testChecksum.getCardinalityChecksum())
&& Objects.equals(controlChecksum.getCardinalitySum(), testChecksum.getCardinalitySum());
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy