// org.apache.hudi.metadata.AbstractHoodieTableMetadata (Maven / Gradle / Ivy)
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hudi.metadata;
import org.apache.hadoop.fs.Path;
import org.apache.hudi.common.config.SerializableConfiguration;
import org.apache.hudi.common.engine.HoodieEngineContext;
import org.apache.hudi.common.util.PartitionPathEncodeUtils;
import org.apache.hudi.common.util.StringUtils;
import org.apache.hudi.expression.ArrayData;
import org.apache.hudi.hadoop.CachingPath;
import org.apache.hudi.hadoop.SerializablePath;
import org.apache.hudi.internal.schema.Type;
import org.apache.hudi.internal.schema.Types;
import java.util.Collections;
import java.util.List;
import java.util.stream.Collectors;
import java.util.stream.IntStream;
public abstract class AbstractHoodieTableMetadata implements HoodieTableMetadata {
// Engine context supplied to the constructor. Declared transient, so default Java
// serialization skips this field.
protected transient HoodieEngineContext engineContext;
// Configuration object supplied to the constructor as `conf`.
protected final SerializableConfiguration hadoopConf;
// Base path string supplied to the constructor, wrapped in a CachingPath and then a SerializablePath.
protected final SerializablePath dataBasePath;
// TODO get this from HoodieConfig
// Currently hard-coded to false. NOTE(review): presumably governs case sensitivity of
// partition field/value matching; its usage is not visible in this part of the file - confirm.
protected final boolean caseSensitive = false;
public AbstractHoodieTableMetadata(HoodieEngineContext engineContext, SerializableConfiguration conf, String dataBasePath) {
this.engineContext = engineContext;
this.hadoopConf = conf;
this.dataBasePath = new SerializablePath(new CachingPath(dataBasePath));
}
/**
 * Computes the number of partition levels (separator-delimited segments) in a partition path.
 *
 * <p>At most one leading and one trailing {@link Path#SEPARATOR_CHAR} are ignored, so
 * {@code "a/b"}, {@code "/a/b"}, {@code "a/b/"} and {@code "/a/b/"} all yield {@code 2}.
 * Every separator found between those boundaries adds one level; consecutive interior
 * separators are not collapsed.
 *
 * <p>The previous implementation skipped the first and last character while counting and then
 * additionally decremented the level for a leading/trailing separator. That discounted such a
 * separator twice (e.g. {@code "/a"} gave 0 and {@code "/"} gave -1). Results for paths without
 * a leading or trailing separator are unchanged.
 *
 * @param partitionFields partition schema; when {@code null} the level is reported as 0
 * @param path            partition path to inspect; may be {@code null} or empty
 * @return the number of levels, or 0 when {@code path} is null/empty, {@code partitionFields}
 *         is null, or the path holds nothing but its boundary separators; never negative
 */
protected static int getPathPartitionLevel(Types.RecordType partitionFields, String path) {
  if (StringUtils.isNullOrEmpty(path) || partitionFields == null) {
    return 0;
  }
  // Drop a single leading / trailing separator from the range that is scanned.
  int start = path.charAt(0) == Path.SEPARATOR_CHAR ? 1 : 0;
  int end = path.charAt(path.length() - 1) == Path.SEPARATOR_CHAR ? path.length() - 1 : path.length();
  if (start >= end) {
    // Nothing left besides boundary separators (e.g. "/" or "//"): no partition segment at all.
    return 0;
  }
  // A non-empty range has one segment plus one more per separator inside it.
  int level = 1;
  for (int i = start; i < end; i++) {
    if (path.charAt(i) == Path.SEPARATOR_CHAR) {
      level++;
    }
  }
  return level;
}
protected static ArrayData extractPartitionValues(Types.RecordType partitionFields,
String relativePartitionPath,
boolean urlEncodePartitioningEnabled) {
if (partitionFields.fields().size() == 1) {
// SinglePartPartitionValue, which might contain slashes.
String partitionValue = relativePartitionPath.split("=")[1];
return new ArrayData(Collections.singletonList(Type.fromPartitionString(
urlEncodePartitioningEnabled ? PartitionPathEncodeUtils.unescapePathName(partitionValue) : partitionValue,
partitionFields.field(0).type())));
}
List