org.apache.iceberg.parquet.ApplyNameMapping Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of iceberg-parquet Show documentation
Show all versions of iceberg-parquet Show documentation
A table format for huge analytic datasets
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.iceberg.parquet;
import java.util.List;
import java.util.Objects;
import java.util.stream.Collectors;
import org.apache.iceberg.mapping.MappedField;
import org.apache.iceberg.mapping.NameMapping;
import org.apache.parquet.Preconditions;
import org.apache.parquet.schema.GroupType;
import org.apache.parquet.schema.MessageType;
import org.apache.parquet.schema.PrimitiveType;
import org.apache.parquet.schema.Type;
import org.apache.parquet.schema.Types;
class ApplyNameMapping extends ParquetTypeVisitor {
private final NameMapping nameMapping;
ApplyNameMapping(NameMapping nameMapping) {
this.nameMapping = nameMapping;
}
@Override
public Type message(MessageType message, List fields) {
Types.MessageTypeBuilder builder = org.apache.parquet.schema.Types.buildMessage();
fields.stream().filter(Objects::nonNull).forEach(builder::addField);
return builder.named(message.getName());
}
@Override
public Type struct(GroupType struct, List types) {
MappedField field = nameMapping.find(currentPath());
List actualTypes = types.stream().filter(Objects::nonNull).collect(Collectors.toList());
Type structType = struct.withNewFields(actualTypes);
return field == null ? structType : structType.withId(field.id());
}
@Override
public Type list(GroupType list, Type elementType) {
Preconditions.checkArgument(elementType != null,
"List type must have element field");
MappedField field = nameMapping.find(currentPath());
Type listType = org.apache.parquet.schema.Types.list(list.getRepetition())
.element(elementType)
.named(list.getName());
return field == null ? listType : listType.withId(field.id());
}
@Override
public Type map(GroupType map, Type keyType, Type valueType) {
Preconditions.checkArgument(keyType != null && valueType != null,
"Map type must have both key field and value field");
MappedField field = nameMapping.find(currentPath());
Type mapType = org.apache.parquet.schema.Types.map(map.getRepetition())
.key(keyType)
.value(valueType)
.named(map.getName());
return field == null ? mapType : mapType.withId(field.id());
}
@Override
public Type primitive(PrimitiveType primitive) {
MappedField field = nameMapping.find(currentPath());
return field == null ? primitive : primitive.withId(field.id());
}
@Override
public void beforeRepeatedElement(Type element) {
// do not add the repeated element's name
}
@Override
public void afterRepeatedElement(Type element) {
// do not remove the repeated element's name
}
@Override
public void beforeRepeatedKeyValue(Type keyValue) {
// do not add the repeated element's name
}
@Override
public void afterRepeatedKeyValue(Type keyValue) {
// do not remove the repeated element's name
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy