
com.facebook.presto.elasticsearch.ElasticsearchMetadata Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.elasticsearch;
import com.facebook.airlift.json.JsonObjectMapperProvider;
import com.facebook.airlift.log.Logger;
import com.facebook.presto.common.type.ArrayType;
import com.facebook.presto.common.type.RowType;
import com.facebook.presto.common.type.StandardTypes;
import com.facebook.presto.common.type.Type;
import com.facebook.presto.common.type.TypeManager;
import com.facebook.presto.common.type.TypeSignature;
import com.facebook.presto.elasticsearch.client.ElasticsearchClient;
import com.facebook.presto.elasticsearch.client.IndexMetadata;
import com.facebook.presto.elasticsearch.client.IndexMetadata.DateTimeType;
import com.facebook.presto.elasticsearch.client.IndexMetadata.ObjectType;
import com.facebook.presto.elasticsearch.client.IndexMetadata.PrimitiveType;
import com.facebook.presto.spi.ColumnHandle;
import com.facebook.presto.spi.ColumnMetadata;
import com.facebook.presto.spi.ConnectorSession;
import com.facebook.presto.spi.ConnectorTableHandle;
import com.facebook.presto.spi.ConnectorTableLayout;
import com.facebook.presto.spi.ConnectorTableLayoutHandle;
import com.facebook.presto.spi.ConnectorTableLayoutResult;
import com.facebook.presto.spi.ConnectorTableMetadata;
import com.facebook.presto.spi.Constraint;
import com.facebook.presto.spi.PrestoException;
import com.facebook.presto.spi.SchemaTableName;
import com.facebook.presto.spi.SchemaTablePrefix;
import com.facebook.presto.spi.connector.ConnectorMetadata;
import com.fasterxml.jackson.core.JsonProcessingException;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.io.BaseEncoding;
import javax.inject.Inject;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.Set;
import java.util.stream.Collectors;
import static com.facebook.presto.common.type.BigintType.BIGINT;
import static com.facebook.presto.common.type.BooleanType.BOOLEAN;
import static com.facebook.presto.common.type.DoubleType.DOUBLE;
import static com.facebook.presto.common.type.IntegerType.INTEGER;
import static com.facebook.presto.common.type.RealType.REAL;
import static com.facebook.presto.common.type.RowType.Field;
import static com.facebook.presto.common.type.SmallintType.SMALLINT;
import static com.facebook.presto.common.type.TimestampType.TIMESTAMP;
import static com.facebook.presto.common.type.TinyintType.TINYINT;
import static com.facebook.presto.common.type.VarbinaryType.VARBINARY;
import static com.facebook.presto.common.type.VarcharType.VARCHAR;
import static com.facebook.presto.elasticsearch.ElasticsearchTableHandle.Type.QUERY;
import static com.facebook.presto.elasticsearch.ElasticsearchTableHandle.Type.SCAN;
import static com.facebook.presto.spi.StandardErrorCode.INVALID_ARGUMENTS;
import static com.google.common.collect.ImmutableMap.toImmutableMap;
import static java.lang.String.format;
import static java.nio.charset.StandardCharsets.UTF_8;
import static java.util.Locale.ENGLISH;
import static java.util.Objects.requireNonNull;
public class ElasticsearchMetadata
implements ConnectorMetadata
{
private static final Logger log = Logger.get(ElasticsearchMetadata.class);
private static final ObjectMapper JSON_PARSER = new JsonObjectMapperProvider().get();
private static final String PASSTHROUGH_QUERY_SUFFIX = "$query";
private final Map queryTableColumns;
private final ColumnMetadata queryResultColumnMetadata;
private final ElasticsearchClient client;
private final String schemaName;
private final Type ipAddressType;
@Inject
public ElasticsearchMetadata(TypeManager typeManager, ElasticsearchClient client, ElasticsearchConfig config)
{
requireNonNull(config, "config is null");
this.ipAddressType = typeManager.getType(new TypeSignature(StandardTypes.IPADDRESS));
this.client = requireNonNull(client, "client is null");
requireNonNull(config, "config is null");
this.schemaName = config.getDefaultSchema();
Type jsonType = typeManager.getType(new TypeSignature(StandardTypes.JSON));
queryResultColumnMetadata = ColumnMetadata.builder()
.setName("result")
.setType(jsonType)
.setNullable(true)
.setHidden(false)
.build();
queryTableColumns = ImmutableMap.of("result", new ElasticsearchColumnHandle("result", jsonType, false));
}
@Override
public List listSchemaNames(ConnectorSession session)
{
return ImmutableList.of(schemaName);
}
@Override
public ElasticsearchTableHandle getTableHandle(ConnectorSession session, SchemaTableName tableName)
{
requireNonNull(tableName, "tableName is null");
if (tableName.getSchemaName().equals(schemaName)) {
String[] parts = tableName.getTableName().split(":", 2);
String table = parts[0];
Optional query = Optional.empty();
ElasticsearchTableHandle.Type type = SCAN;
if (parts.length == 2) {
if (table.endsWith(PASSTHROUGH_QUERY_SUFFIX)) {
table = table.substring(0, table.length() - PASSTHROUGH_QUERY_SUFFIX.length());
byte[] decoded;
try {
decoded = BaseEncoding.base32().decode(parts[1].toUpperCase(ENGLISH));
}
catch (IllegalArgumentException e) {
throw new PrestoException(INVALID_ARGUMENTS, format("Elasticsearch query for '%s' is not base32-encoded correctly", table), e);
}
String queryJson = new String(decoded, UTF_8);
try {
// Ensure this is valid json
JSON_PARSER.readTree(queryJson);
}
catch (JsonProcessingException e) {
throw new PrestoException(INVALID_ARGUMENTS, format("Elasticsearch query for '%s' is not valid JSON", table), e);
}
query = Optional.of(queryJson);
type = QUERY;
}
else {
query = Optional.of(parts[1]);
}
}
if (listTables(session, Optional.of(schemaName)).contains(new SchemaTableName(schemaName, table))) {
return new ElasticsearchTableHandle(type, schemaName, table, query);
}
}
return null;
}
@Override
public List getTableLayouts(ConnectorSession session, ConnectorTableHandle table, Constraint constraint, Optional> desiredColumns)
{
ElasticsearchTableHandle handle = (ElasticsearchTableHandle) table;
ConnectorTableLayout layout = new ConnectorTableLayout(new ElasticsearchTableLayoutHandle(handle, constraint.getSummary()));
return ImmutableList.of(new ConnectorTableLayoutResult(layout, constraint.getSummary()));
}
@Override
public ConnectorTableLayout getTableLayout(ConnectorSession session, ConnectorTableLayoutHandle handle)
{
return new ConnectorTableLayout(handle);
}
@Override
public ConnectorTableMetadata getTableMetadata(ConnectorSession session, ConnectorTableHandle table)
{
ElasticsearchTableHandle handle = (ElasticsearchTableHandle) table;
if (isPassthroughQuery(handle)) {
return new ConnectorTableMetadata(
new SchemaTableName(handle.getSchema(), handle.getIndex()),
ImmutableList.of(queryResultColumnMetadata));
}
return getTableMetadata(handle.getSchema(), handle.getIndex());
}
private ConnectorTableMetadata getTableMetadata(String schemaName, String tableName)
{
InternalTableMetadata internalTableMetadata = makeInternalTableMetadata(schemaName, tableName);
return new ConnectorTableMetadata(new SchemaTableName(schemaName, tableName), internalTableMetadata.getColumnMetadata());
}
private InternalTableMetadata makeInternalTableMetadata(ConnectorTableHandle table)
{
ElasticsearchTableHandle handle = (ElasticsearchTableHandle) table;
return makeInternalTableMetadata(handle.getSchema(), handle.getIndex());
}
private InternalTableMetadata makeInternalTableMetadata(String schema, String tableName)
{
IndexMetadata metadata = client.getIndexMetadata(tableName);
List fields = getColumnFields(metadata);
return new InternalTableMetadata(new SchemaTableName(schema, tableName), makeColumnMetadata(fields), makeColumnHandles(fields));
}
private List getColumnFields(IndexMetadata metadata)
{
ImmutableList.Builder result = ImmutableList.builder();
Map counts = metadata.getSchema()
.getFields().stream()
.collect(Collectors.groupingBy(f -> f.getName().toLowerCase(ENGLISH), Collectors.counting()));
for (IndexMetadata.Field field : metadata.getSchema().getFields()) {
Type type = toPrestoType(field);
if (type == null || counts.get(field.getName().toLowerCase(ENGLISH)) > 1) {
continue;
}
result.add(field);
}
return result.build();
}
private List makeColumnMetadata(List fields)
{
ImmutableList.Builder result = ImmutableList.builder();
for (BuiltinColumns builtinColumn : BuiltinColumns.values()) {
result.add(builtinColumn.getMetadata());
}
for (IndexMetadata.Field field : fields) {
result.add(new ColumnMetadata(field.getName(), toPrestoType(field)));
}
return result.build();
}
private Map makeColumnHandles(List fields)
{
ImmutableMap.Builder result = ImmutableMap.builder();
for (BuiltinColumns builtinColumn : BuiltinColumns.values()) {
result.put(builtinColumn.getName(), builtinColumn.getColumnHandle());
}
for (IndexMetadata.Field field : fields) {
result.put(field.getName(), new ElasticsearchColumnHandle(
field.getName(),
toPrestoType(field),
supportsPredicates(field.getType())));
}
return result.build();
}
private static boolean supportsPredicates(IndexMetadata.Type type)
{
if (type instanceof DateTimeType) {
return true;
}
if (type instanceof PrimitiveType) {
switch (((PrimitiveType) type).getName().toLowerCase(ENGLISH)) {
case "boolean":
case "byte":
case "short":
case "integer":
case "long":
case "double":
case "float":
case "keyword":
return true;
}
}
return false;
}
private Type toPrestoType(IndexMetadata.Field metaDataField)
{
return toPrestoType(metaDataField, metaDataField.isArray());
}
private Type toPrestoType(IndexMetadata.Field metaDataField, boolean isArray)
{
IndexMetadata.Type type = metaDataField.getType();
if (isArray) {
Type elementType = toPrestoType(metaDataField, false);
return new ArrayType(elementType);
}
else if (type instanceof PrimitiveType) {
switch (((PrimitiveType) type).getName()) {
case "float":
return REAL;
case "double":
return DOUBLE;
case "byte":
return TINYINT;
case "short":
return SMALLINT;
case "integer":
return INTEGER;
case "long":
return BIGINT;
case "string":
case "text":
case "keyword":
return VARCHAR;
case "boolean":
return BOOLEAN;
case "binary":
return VARBINARY;
case "ip":
return ipAddressType;
}
}
else if (type instanceof DateTimeType) {
if (((DateTimeType) type).getFormats().isEmpty()) {
return TIMESTAMP;
}
// otherwise, skip -- we don't support custom formats, yet
}
else if (type instanceof ObjectType) {
ObjectType objectType = (ObjectType) type;
ImmutableList.Builder builder = ImmutableList.builder();
for (IndexMetadata.Field field : objectType.getFields()) {
Type prestoType = toPrestoType(field);
if (prestoType != null) {
builder.add(RowType.field(field.getName(), prestoType));
}
else {
log.warn("Type is not implemented: %s", field.getType());
}
}
List fields = builder.build();
if (!fields.isEmpty()) {
return RowType.from(fields);
}
}
return null;
}
@Override
public List listTables(ConnectorSession session, Optional schemaName)
{
if (schemaName.isPresent() && !schemaName.get().equals(this.schemaName)) {
return ImmutableList.of();
}
ImmutableList.Builder result = ImmutableList.builder();
Set indexes = ImmutableSet.copyOf(client.getIndexes());
indexes.stream()
.map(index -> new SchemaTableName(this.schemaName, index))
.forEach(result::add);
client.getAliases().entrySet().stream()
.filter(entry -> indexes.contains(entry.getKey()))
.flatMap(entry -> entry.getValue().stream()
.map(alias -> new SchemaTableName(this.schemaName, alias)))
.distinct()
.forEach(result::add);
return result.build();
}
@Override
public Map getColumnHandles(ConnectorSession session, ConnectorTableHandle tableHandle)
{
ElasticsearchTableHandle table = (ElasticsearchTableHandle) tableHandle;
if (isPassthroughQuery(table)) {
return queryTableColumns;
}
InternalTableMetadata tableMetadata = makeInternalTableMetadata(tableHandle);
return tableMetadata.getColumnHandles();
}
@Override
public ColumnMetadata getColumnMetadata(ConnectorSession session, ConnectorTableHandle tableHandle, ColumnHandle columnHandle)
{
ElasticsearchTableHandle table = (ElasticsearchTableHandle) tableHandle;
ElasticsearchColumnHandle column = (ElasticsearchColumnHandle) columnHandle;
if (isPassthroughQuery(table)) {
if (column.getName().equals(queryResultColumnMetadata.getName())) {
return queryResultColumnMetadata;
}
throw new IllegalArgumentException(format("Unexpected column for table '%s$query': %s", table.getIndex(), column.getName()));
}
return ColumnMetadata.builder()
.setName(column.getName())
.setType(column.getType())
.build();
}
private static boolean isPassthroughQuery(ElasticsearchTableHandle table)
{
return table.getType().equals(QUERY);
}
@Override
public Map> listTableColumns(ConnectorSession session, SchemaTablePrefix prefix)
{
if (prefix.getSchemaName() != null && !prefix.getSchemaName().equals(schemaName)) {
return ImmutableMap.of();
}
if (prefix.getSchemaName() != null && prefix.getTableName() != null) {
ConnectorTableMetadata metadata = getTableMetadata(prefix.getSchemaName(), prefix.getTableName());
return ImmutableMap.of(metadata.getTable(), metadata.getColumns());
}
return listTables(session, prefix.getSchemaName()).stream()
.map(name -> getTableMetadata(name.getSchemaName(), name.getTableName()))
.collect(toImmutableMap(ConnectorTableMetadata::getTable, ConnectorTableMetadata::getColumns));
}
private static class InternalTableMetadata
{
private final SchemaTableName tableName;
private final List columnMetadata;
private final Map columnHandles;
public InternalTableMetadata(
SchemaTableName tableName,
List columnMetadata,
Map columnHandles)
{
this.tableName = tableName;
this.columnMetadata = columnMetadata;
this.columnHandles = columnHandles;
}
public SchemaTableName getTableName()
{
return tableName;
}
public List getColumnMetadata()
{
return columnMetadata;
}
public Map getColumnHandles()
{
return columnHandles;
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy