All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.zetasql.PreparedExpression Maven / Gradle / Ivy

/*
 * Copyright 2019 Google LLC
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 */

package com.google.zetasql;

import static com.google.common.base.Verify.verify;

import com.google.common.base.Ascii;
import com.google.common.base.Preconditions;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Queues;
import com.google.common.util.concurrent.ListenableFuture;
import com.google.common.util.concurrent.SettableFuture;
import com.google.errorprone.annotations.CanIgnoreReturnValue;
import com.google.zetasql.LocalService.EvaluateRequest;
import com.google.zetasql.LocalService.EvaluateRequestBatch;
import com.google.zetasql.LocalService.EvaluateResponse;
import com.google.zetasql.LocalService.EvaluateResponseBatch;
import com.google.zetasql.LocalService.PrepareRequest;
import com.google.zetasql.LocalService.PrepareResponse;
import com.google.zetasql.LocalService.PreparedState;
import com.google.zetasql.LocalService.UnprepareRequest;
import io.grpc.Channel;
import io.grpc.ManagedChannel;
import io.grpc.StatusRuntimeException;
import io.grpc.stub.ClientCallStreamObserver;
import io.grpc.stub.ClientResponseObserver;
import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Optional;
import java.util.Queue;
import java.util.concurrent.atomic.AtomicLong;

/**
 * ZetaSQL expression evaluation using Service RPC.
 *
 * 

When evaluating an expression, callers can provide * *

    *
  • A set of expression columns - column names usable in the expression. *
  • A set of parameters - parameters usable in the expression as \@param. *
* *

Columns / Parameters are passed as String:Value Maps. * *

A prepared expression will create server side state, which should be released by calling * close() when the expression is no longer used. Note that the close() method is called in * finalize(), but you should not rely on that because the Java garbage collector has no idea how * much memory is used on C++ side and GC may happen later than necessary. * *

Read the unit tests for examples. * *

This class is not thread-safe. External synchronization is needed when it is shared by * multiple threads. */ public class PreparedExpression implements AutoCloseable { private final String sql; private boolean prepared = false; private boolean closed = false; private Type outputType; private long preparedId; private FileDescriptorSetsBuilder fileDescriptorSetsBuilder; private TypeFactory factory = TypeFactory.nonUniqueNames(); private AnalyzerOptions options; // expected are the fields we expect the user to provide to execute, but not all are required. private Map expectedColumns; private Map expectedParameters; // referenced is the subset of expected that the analyzer determined are actually required. private List referencedColumns; private List referencedParameters; public PreparedExpression(String sql) { this.sql = sql; } /** * Prepare the expression with given options. Throwing SqlException if there's an error (not * necessarily network/server failure). See unit tests for examples how options can be set. * * @param options */ public void prepare(AnalyzerOptions options) { prepareInternal(options, Optional.empty()); } public void prepareWithCatalog(AnalyzerOptions options, SimpleCatalog catalog) { Preconditions.checkNotNull(catalog); prepareInternal(options, Optional.of(catalog)); } private void prepareInternal(AnalyzerOptions options, Optional maybeCatalog) { Preconditions.checkState(!prepared); Preconditions.checkState(!closed); this.options = options; fileDescriptorSetsBuilder = new FileDescriptorSetsBuilder(); fileDescriptorSetsBuilder.addAllFileDescriptors(BuiltinDescriptorPool.getInstance()); PrepareRequest.Builder request = PrepareRequest.newBuilder(); request.setSql(sql); request.setOptions(options.serialize(fileDescriptorSetsBuilder)); Map catalogRegisteredDescriptorPoolIds = Collections.emptyMap(); if (maybeCatalog.isPresent()) { SimpleCatalog catalog = maybeCatalog.get(); if (catalog.isRegistered()) { catalogRegisteredDescriptorPoolIds = catalog.getRegisteredDescriptorPoolIds(); for (DescriptorPool pool : catalogRegisteredDescriptorPoolIds.keySet()) { fileDescriptorSetsBuilder.addAllFileDescriptors(pool); } request.setRegisteredCatalogId(catalog.getRegisteredId()); } else { request.setSimpleCatalog(catalog.serialize(fileDescriptorSetsBuilder)); } } else { // A catalog must be provided, so we request a default initialized catalog with all of // the builtin functions. request .getSimpleCatalogBuilder() .getBuiltinFunctionOptionsBuilder() .setLanguageOptions(request.getOptions().getLanguageOptions()); } request.setDescriptorPoolList( DescriptorPoolSerializer.createDescriptorPoolListWithRegisteredIds( fileDescriptorSetsBuilder, catalogRegisteredDescriptorPoolIds)); PrepareResponse resp; try { resp = Client.getStub().prepare(request.build()); } catch (StatusRuntimeException e) { throw new SqlException(e); } setPrepared(resp.getPrepared()); } private void setPrepared(PreparedState resp) { preparedId = resp.getPreparedExpressionId(); outputType = factory.deserialize(resp.getOutputType(), fileDescriptorSetsBuilder.getDescriptorPools()); expectedColumns = toLower(options.getExpressionColumns()); expectedParameters = toLower(options.getQueryParameters()); referencedColumns = resp.getReferencedColumnsList(); referencedParameters = resp.getReferencedParametersList(); prepared = true; } /** Get the output type of this expression. */ public Type getOutputType() { Preconditions.checkState(prepared); Preconditions.checkState(!closed); return outputType; } /** * Get the list of column names referenced in this expression. * *

The columns will be returned in lower case, as column expressions are case-insensitive when * evaluated. This can be used for efficiency, the list of columns returned from this method are * the minimal set that must be provided to execute(). */ public List getReferencedColumns() { Preconditions.checkState(prepared); Preconditions.checkState(!closed); return referencedColumns; } /** * Get the list of parameters referenced in this expression. * *

This is similar to getReferencedColumns(), but for parameters. */ public List getReferencedParameters() { Preconditions.checkState(prepared); Preconditions.checkState(!closed); return referencedParameters; } /** * Evaluate the sql expression via Service RPC. * * @return The evaluation result. */ @CanIgnoreReturnValue // TODO: consider removing this? public Value execute() { return execute(Collections.emptyMap(), Collections.emptyMap()); } /** * Evaluate the sql expression via Service RPC. * * @param columns Map of column name:value pairs used in the sql expression. * @param parameters Map of parameter name:value pairs. * @return The evaluation result. */ @CanIgnoreReturnValue // TODO: consider removing this? public Value execute(Map columns, Map parameters) { return execute(buildRequest(columns, parameters)); } private Value execute(EvaluateRequest request) { Preconditions.checkState(!closed); final EvaluateResponse resp; try { resp = Client.getStub().evaluate(request); } catch (StatusRuntimeException e) { throw new SqlException(e); } if (!prepared) { setPrepared(resp.getPrepared()); } return Value.deserialize(outputType, resp.getValue()); } private EvaluateRequest buildRequest(Map columns, Map parameters) { Preconditions.checkNotNull(columns); Preconditions.checkNotNull(parameters); EvaluateRequest.Builder request = EvaluateRequest.newBuilder(); if (prepared) { request.setPreparedExpressionId(preparedId); final Map normalizedColumns = normalizeParameters(columns, expectedColumns, "column"); final Map normalizedParameters = normalizeParameters(parameters, expectedParameters, "query"); for (String column : referencedColumns) { Value value = normalizedColumns.get(column); if (value == null) { throw new SqlException("Incomplete column parameters " + column); } request.addColumns(serializeParameter(column, value)); } for (String param : referencedParameters) { Value value = normalizedParameters.get(param); if (value == null) { throw new SqlException("Incomplete query parameters " + param); } request.addParams(serializeParameter(param, value)); } // TODO: Remove once new descriptor pool is the default // Force adding this field, as empty to ensure we use the 'new' local_service // descriptor pool codepath. It is not really needed, as all of the descriptor // pools are already synchronized via prepare. request.getDescriptorPoolListBuilder(); } else { request.setSql(sql); fileDescriptorSetsBuilder = new FileDescriptorSetsBuilder(); fileDescriptorSetsBuilder.addAllFileDescriptors(BuiltinDescriptorPool.getInstance()); ImmutableMap registeredDescriptorPoolIds = ImmutableMap.of(); options = new AnalyzerOptions(); for (Entry column : columns.entrySet()) { options.addExpressionColumn(column.getKey(), column.getValue().getType()); request.addColumns(serializeParameter(column.getKey(), column.getValue())); } for (Entry param : parameters.entrySet()) { options.addQueryParameter(param.getKey(), param.getValue().getType()); request.addParams(serializeParameter(param.getKey(), param.getValue())); } request.setOptions(options.serialize(fileDescriptorSetsBuilder)); request.setDescriptorPoolList( DescriptorPoolSerializer.createDescriptorPoolListWithRegisteredIds( fileDescriptorSetsBuilder, registeredDescriptorPoolIds)); } return request.build(); } private static Map normalizeParameters( Map parameters, Map expected, String kind) { HashMap lower = new HashMap<>(); for (Map.Entry entry : parameters.entrySet()) { String name = Ascii.toLowerCase(entry.getKey()); if (!expected.containsKey(name)) { throw new SqlException("Unexpected " + kind + " parameter '" + name + "'"); } Value value = entry.getValue(); Type type = expected.get(name); if (!type.equals(value.getType())) { throw new SqlException( "Expected " + kind + " parameter '" + name + "' to be of type " + type); } if (lower.putIfAbsent(name, value) != null) { throw new SqlException("Duplicate expression " + kind + " name '" + name + "'"); } } return lower; } private static ImmutableMap toLower(Map parameters) { ImmutableMap.Builder b = new ImmutableMap.Builder<>(); for (Map.Entry entry : parameters.entrySet()) { b.put(Ascii.toLowerCase(entry.getKey()), entry.getValue()); } return b.buildOrThrow(); } /** Opens a handle for streaming execution */ public Stream stream() { Preconditions.checkState(prepared); Preconditions.checkState(!closed); return new Stream(); } /** * ZetaSQL streaming expression evaluation. * *

Streaming evaluation requests are buffered until there is either no outstanding work or an * optimal number of pending requests (tuned by benchmarks) to send as a single batch. This * minimizes the average latency, but increases deviation in request latency. * *

This class is not thread-safe. External synchronization is needed when it is shared by * multiple threads. */ public final class Stream implements AutoCloseable { private final Queue> pending; private final Queue batch; private final AtomicLong batchCount; // eventually consistent private final AtomicLong batchSerializedSize; // eventually consistent private final AtomicLong outstandingCount; private final Channel channel; private final ClientCallStreamObserver requestObserver; private Stream() { pending = Queues.newConcurrentLinkedQueue(); batch = Queues.newConcurrentLinkedQueue(); batchCount = new AtomicLong(); batchSerializedSize = new AtomicLong(); outstandingCount = new AtomicLong(); channel = ClientChannelProvider.loadChannel(); ZetaSqlLocalServiceGrpc.ZetaSqlLocalServiceStub stub = ZetaSqlLocalServiceGrpc.newStub(channel); requestObserver = (ClientCallStreamObserver) stub.evaluateStream(new ResponseObserver()); } /** * Evaluate the sql expression via streaming RPC. * *

This method is not thread-safe. External synchronization is needed when it is shared by * multiple threads. * * @param columns Map of column name:value pairs used in the sql expression. * @param parameters Map of parameter name:value pairs. * @return The evaluation result. */ public ListenableFuture execute( Map columns, Map parameters) { final SettableFuture f = SettableFuture.create(); final EvaluateRequest r = buildRequest(columns, parameters); final int size = r.getSerializedSize(); /* critical block: This block is not thread safe, as documented in the * PreparedExpression class comment, for maximal performance. The order * of these operations is critical to the correctness of this code. */ pending.add(f); batch.add(r); batchCount.getAndIncrement(); batchSerializedSize.getAndAdd(size); // end critical block maybeFlush(); return f; } private void maybeFlush() { /* batchCount and batchSerializedSize are eventually consistent hints. * They may be too low if called concurrently with execute, which will * be mitigated when execute calls this method. They may be too high * if called concurrently with flush, which will result in an unneeded * call to flush. */ final long batchCount = this.batchCount.get(); if (batchCount <= 0) { return; } if (outstandingCount.get() != 0 && batchSerializedSize.get() < 65536 && (batchCount < 16 || !requestObserver.isReady())) { return; } flush(); } /** Flush buffered requests to RPC. */ public synchronized void flush() { try { final EvaluateRequestBatch.Builder b = EvaluateRequestBatch.newBuilder(); for (EvaluateRequest r; (r = batch.poll()) != null; ) { batchSerializedSize.getAndAdd(-r.getSerializedSize()); b.addRequest(r); } if (b.getRequestCount() > 0) { batchCount.getAndAdd(-b.getRequestCount()); outstandingCount.getAndAdd(b.getRequestCount()); requestObserver.onNext(b.build()); } } catch (RuntimeException e) { requestObserver.onError(e); throw e; } } private class ResponseObserver implements ClientResponseObserver { @Override public void onNext(EvaluateResponseBatch respb) { long remain = outstandingCount.addAndGet(-respb.getResponseCount()); verify(remain >= 0); for (EvaluateResponse resp : respb.getResponseList()) { final SettableFuture f = pending.remove(); final Value v; try { v = Value.deserialize(outputType, resp.getValue()); } catch (RuntimeException e) { f.setException(e); continue; } f.set(v); } if (remain == 0) { /* If no outstanding requests remain, flush the current batch. This * avoids a hang if the caller stops calling evaluate but doesn't * call flush and limits the latency of a request to 2T (where T is * the round-trip latency of a single request). This may result in * suboptimal behavior for a time if the request rate slows to * between T and 2T. */ flush(); } } private void setException(Throwable t) { for (SettableFuture f; (f = pending.poll()) != null; ) { f.setException(t); } } @Override public void onError(Throwable t) { if (t instanceof StatusRuntimeException) { setException(new SqlException((StatusRuntimeException) t)); } else { setException(t); } } @Override public void onCompleted() { setException(new RuntimeException("Stream closed")); } @Override public void beforeStart(final ClientCallStreamObserver requestStream) { requestStream.setOnReadyHandler(this::onReady); } private void onReady() { maybeFlush(); } } @Override public void close() { synchronized (this) { requestObserver.onCompleted(); } if (channel instanceof ManagedChannel) { ((ManagedChannel) channel).shutdown(); } } @Override protected void finalize() throws Throwable { super.finalize(); close(); } } /** Release the server side state for this prepared expression. */ @Override public void close() { if (prepared && !closed) { try { Client.getStub() .unprepare(UnprepareRequest.newBuilder().setPreparedExpressionId(preparedId).build()); } catch (StatusRuntimeException e) { // ignore } prepared = false; closed = true; } } @Override protected void finalize() throws Throwable { super.finalize(); close(); } private static EvaluateRequest.Parameter serializeParameter(String name, Value value) { return EvaluateRequest.Parameter.newBuilder() .setName(name) .setValue(value.serialize()) .build(); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy