com.facebook.presto.tpcds.statistics.TpcdsTableStatisticsFactory Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.tpcds.statistics;
import com.facebook.presto.common.type.CharType;
import com.facebook.presto.common.type.DecimalType;
import com.facebook.presto.common.type.Decimals;
import com.facebook.presto.common.type.Type;
import com.facebook.presto.common.type.VarcharType;
import com.facebook.presto.spi.ColumnHandle;
import com.facebook.presto.spi.statistics.ColumnStatistics;
import com.facebook.presto.spi.statistics.DoubleRange;
import com.facebook.presto.spi.statistics.Estimate;
import com.facebook.presto.spi.statistics.TableStatistics;
import com.facebook.presto.tpcds.TpcdsColumnHandle;
import com.teradata.tpcds.Table;
import io.airlift.slice.Slice;
import java.time.LocalDate;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import static com.facebook.presto.common.type.BigintType.BIGINT;
import static com.facebook.presto.common.type.DateType.DATE;
import static com.facebook.presto.common.type.Decimals.isLongDecimal;
import static com.facebook.presto.common.type.Decimals.isShortDecimal;
import static com.facebook.presto.common.type.DoubleType.DOUBLE;
import static com.facebook.presto.common.type.IntegerType.INTEGER;
import static com.facebook.presto.common.type.TimeType.TIME;
import static java.lang.Double.parseDouble;
public class TpcdsTableStatisticsFactory
{
private final TableStatisticsDataRepository statisticsDataRepository = new TableStatisticsDataRepository();
public TableStatistics create(String schemaName, Table table, List columnHandles)
{
Optional statisticsDataOptional = statisticsDataRepository.load(schemaName, table);
return statisticsDataOptional.map(statisticsData -> toTableStatistics(columnHandles, statisticsData))
.orElse(TableStatistics.empty());
}
private TableStatistics toTableStatistics(List columnHandles, TableStatisticsData statisticsData)
{
long rowCount = statisticsData.getRowCount();
TableStatistics.Builder tableStatistics = TableStatistics.builder()
.setRowCount(Estimate.of(rowCount));
if (rowCount > 0) {
Map columnsData = statisticsData.getColumns();
for (ColumnHandle handle : columnHandles) {
TpcdsColumnHandle columnHandle = (TpcdsColumnHandle) handle;
tableStatistics.setColumnStatistics(columnHandle, toColumnStatistics(columnsData.get(columnHandle.getColumnName()), columnHandle.getType(), rowCount));
}
}
return tableStatistics.build();
}
private ColumnStatistics toColumnStatistics(ColumnStatisticsData columnStatisticsData, Type type, long rowCount)
{
ColumnStatistics.Builder columnStatistics = ColumnStatistics.builder();
long nullCount = columnStatisticsData.getNullsCount();
columnStatistics.setNullsFraction(Estimate.of((double) nullCount / rowCount));
columnStatistics.setRange(toRange(columnStatisticsData.getMin(), columnStatisticsData.getMax(), type));
columnStatistics.setDistinctValuesCount(Estimate.of(columnStatisticsData.getDistinctValuesCount()));
columnStatistics.setDataSize(columnStatisticsData.getDataSize().map(Estimate::of).orElse(Estimate.unknown()));
return columnStatistics.build();
}
private static Optional toRange(Optional