// org.apache.parquet.column.page.DataPageV2 Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.parquet.column.page;
import java.util.Optional;
import org.apache.parquet.bytes.BytesInput;
import org.apache.parquet.column.Encoding;
import org.apache.parquet.column.statistics.Statistics;
public class DataPageV2 extends DataPage {
/**
* @param rowCount count of rows
* @param nullCount count of nulls
* @param valueCount count of values
* @param repetitionLevels RLE encoded repetition levels
* @param definitionLevels RLE encoded definition levels
* @param dataEncoding encoding for the data
* @param data data encoded with dataEncoding
* @param statistics optional statistics for this page
* @return an uncompressed page
*/
public static DataPageV2 uncompressed(
int rowCount,
int nullCount,
int valueCount,
BytesInput repetitionLevels,
BytesInput definitionLevels,
Encoding dataEncoding,
BytesInput data,
Statistics> statistics) {
return new DataPageV2(
rowCount,
nullCount,
valueCount,
repetitionLevels,
definitionLevels,
dataEncoding,
data,
Math.toIntExact(repetitionLevels.size() + definitionLevels.size() + data.size()),
statistics,
false);
}
/**
* @param rowCount count of rows
* @param nullCount count of nulls
* @param valueCount count of values
* @param firstRowIndex the index of the first row in this page
* @param repetitionLevels RLE encoded repetition levels
* @param definitionLevels RLE encoded definition levels
* @param dataEncoding encoding for the data
* @param data data encoded with dataEncoding
* @param statistics optional statistics for this page
* @return an uncompressed page
*/
public static DataPageV2 uncompressed(
int rowCount,
int nullCount,
int valueCount,
long firstRowIndex,
BytesInput repetitionLevels,
BytesInput definitionLevels,
Encoding dataEncoding,
BytesInput data,
Statistics> statistics) {
return new DataPageV2(
rowCount,
nullCount,
valueCount,
firstRowIndex,
repetitionLevels,
definitionLevels,
dataEncoding,
data,
Math.toIntExact(repetitionLevels.size() + definitionLevels.size() + data.size()),
statistics,
false);
}
/**
* @param rowCount count of rows
* @param nullCount count of nulls
* @param valueCount count of values
* @param repetitionLevels RLE encoded repetition levels
* @param definitionLevels RLE encoded definition levels
* @param dataEncoding encoding for the data
* @param data data encoded with dataEncoding and compressed
* @param uncompressedSize total size uncompressed (rl + dl + data)
* @param statistics optional statistics for this page
* @return a compressed page
*/
public static DataPageV2 compressed(
int rowCount,
int nullCount,
int valueCount,
BytesInput repetitionLevels,
BytesInput definitionLevels,
Encoding dataEncoding,
BytesInput data,
int uncompressedSize,
Statistics> statistics) {
return new DataPageV2(
rowCount,
nullCount,
valueCount,
repetitionLevels,
definitionLevels,
dataEncoding,
data,
uncompressedSize,
statistics,
true);
}
private final int rowCount;
private final int nullCount;
private final BytesInput repetitionLevels;
private final BytesInput definitionLevels;
private final Encoding dataEncoding;
private final BytesInput data;
private final Statistics> statistics;
private final boolean isCompressed;
public DataPageV2(
int rowCount,
int nullCount,
int valueCount,
BytesInput repetitionLevels,
BytesInput definitionLevels,
Encoding dataEncoding,
BytesInput data,
int uncompressedSize,
Statistics> statistics,
boolean isCompressed) {
super(
Math.toIntExact(repetitionLevels.size() + definitionLevels.size() + data.size()),
uncompressedSize,
valueCount);
this.rowCount = rowCount;
this.nullCount = nullCount;
this.repetitionLevels = repetitionLevels;
this.definitionLevels = definitionLevels;
this.dataEncoding = dataEncoding;
this.data = data;
this.statistics = statistics;
this.isCompressed = isCompressed;
}
private DataPageV2(
int rowCount,
int nullCount,
int valueCount,
long firstRowIndex,
BytesInput repetitionLevels,
BytesInput definitionLevels,
Encoding dataEncoding,
BytesInput data,
int uncompressedSize,
Statistics> statistics,
boolean isCompressed) {
super(
Math.toIntExact(repetitionLevels.size() + definitionLevels.size() + data.size()),
uncompressedSize,
valueCount,
firstRowIndex);
this.rowCount = rowCount;
this.nullCount = nullCount;
this.repetitionLevels = repetitionLevels;
this.definitionLevels = definitionLevels;
this.dataEncoding = dataEncoding;
this.data = data;
this.statistics = statistics;
this.isCompressed = isCompressed;
}
public int getRowCount() {
return rowCount;
}
public int getNullCount() {
return nullCount;
}
public BytesInput getRepetitionLevels() {
return repetitionLevels;
}
public BytesInput getDefinitionLevels() {
return definitionLevels;
}
public Encoding getDataEncoding() {
return dataEncoding;
}
public BytesInput getData() {
return data;
}
public Statistics> getStatistics() {
return statistics;
}
public boolean isCompressed() {
return isCompressed;
}
@Override
public Optional getIndexRowCount() {
return Optional.of(rowCount);
}
@Override
public T accept(Visitor visitor) {
return visitor.visit(this);
}
@Override
public String toString() {
return "Page V2 ["
+ "dl size=" + definitionLevels.size() + ", "
+ "rl size=" + repetitionLevels.size() + ", "
+ "data size=" + data.size() + ", "
+ "data enc=" + dataEncoding + ", "
+ "valueCount=" + getValueCount() + ", "
+ "rowCount=" + getRowCount() + ", "
+ "is compressed=" + isCompressed + ", "
+ "uncompressedSize=" + getUncompressedSize() + "]";
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy