
io.trino.execution.QueryStateMachine Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.execution;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Ticker;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.collect.Sets;
import com.google.common.util.concurrent.FutureCallback;
import com.google.common.util.concurrent.Futures;
import com.google.common.util.concurrent.ListenableFuture;
import com.google.errorprone.annotations.ThreadSafe;
import com.google.errorprone.annotations.concurrent.GuardedBy;
import io.airlift.log.Logger;
import io.airlift.units.Duration;
import io.opentelemetry.api.common.Attributes;
import io.opentelemetry.api.trace.Span;
import io.opentelemetry.api.trace.StatusCode;
import io.trino.Session;
import io.trino.client.NodeVersion;
import io.trino.exchange.ExchangeInput;
import io.trino.execution.QueryExecution.QueryOutputInfo;
import io.trino.execution.StateMachine.StateChangeListener;
import io.trino.execution.querystats.PlanOptimizersStatsCollector;
import io.trino.execution.warnings.WarningCollector;
import io.trino.metadata.Metadata;
import io.trino.operator.BlockedReason;
import io.trino.operator.OperatorStats;
import io.trino.security.AccessControl;
import io.trino.server.BasicQueryInfo;
import io.trino.server.BasicQueryStats;
import io.trino.spi.ErrorCode;
import io.trino.spi.QueryId;
import io.trino.spi.TrinoException;
import io.trino.spi.eventlistener.RoutineInfo;
import io.trino.spi.eventlistener.StageGcStatistics;
import io.trino.spi.eventlistener.TableInfo;
import io.trino.spi.resourcegroups.QueryType;
import io.trino.spi.resourcegroups.ResourceGroupId;
import io.trino.spi.security.SelectedRole;
import io.trino.spi.type.Type;
import io.trino.sql.analyzer.Output;
import io.trino.sql.planner.PlanFragment;
import io.trino.tracing.TrinoAttributes;
import io.trino.transaction.TransactionId;
import io.trino.transaction.TransactionInfo;
import io.trino.transaction.TransactionManager;
import jakarta.annotation.Nullable;
import org.joda.time.DateTime;
import java.net.URI;
import java.util.ArrayDeque;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.OptionalDouble;
import java.util.Queue;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentLinkedQueue;
import java.util.concurrent.Executor;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.atomic.AtomicLong;
import java.util.concurrent.atomic.AtomicReference;
import java.util.function.Consumer;
import java.util.function.Supplier;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Preconditions.checkState;
import static com.google.common.base.Strings.nullToEmpty;
import static com.google.common.util.concurrent.MoreExecutors.directExecutor;
import static io.airlift.units.DataSize.succinctBytes;
import static io.trino.SystemSessionProperties.getRetryPolicy;
import static io.trino.execution.BasicStageStats.EMPTY_STAGE_STATS;
import static io.trino.execution.QueryState.DISPATCHING;
import static io.trino.execution.QueryState.FAILED;
import static io.trino.execution.QueryState.FINISHED;
import static io.trino.execution.QueryState.FINISHING;
import static io.trino.execution.QueryState.PLANNING;
import static io.trino.execution.QueryState.QUEUED;
import static io.trino.execution.QueryState.RUNNING;
import static io.trino.execution.QueryState.STARTING;
import static io.trino.execution.QueryState.TERMINAL_QUERY_STATES;
import static io.trino.execution.QueryState.WAITING_FOR_RESOURCES;
import static io.trino.execution.StageInfo.getAllStages;
import static io.trino.operator.RetryPolicy.TASK;
import static io.trino.server.DynamicFilterService.DynamicFiltersStats;
import static io.trino.spi.StandardErrorCode.NOT_FOUND;
import static io.trino.spi.StandardErrorCode.USER_CANCELED;
import static io.trino.util.Ciphers.createRandomAesEncryptionKey;
import static io.trino.util.Ciphers.serializeAesEncryptionKey;
import static io.trino.util.Failures.toFailure;
import static java.lang.Math.min;
import static java.util.Objects.requireNonNull;
import static java.util.concurrent.TimeUnit.MILLISECONDS;
import static java.util.concurrent.TimeUnit.NANOSECONDS;
@ThreadSafe
public class QueryStateMachine
{
private static final Logger QUERY_STATE_LOG = Logger.get(QueryStateMachine.class);
private final QueryId queryId;
private final String query;
private final Optional preparedQuery;
private final Session session;
private final URI self;
private final ResourceGroupId resourceGroup;
private final TransactionManager transactionManager;
private final Metadata metadata;
private final QueryOutputManager outputManager;
private final Executor stateMachineExecutor;
private final AtomicLong currentUserMemory = new AtomicLong();
private final AtomicLong peakUserMemory = new AtomicLong();
private final AtomicLong currentRevocableMemory = new AtomicLong();
private final AtomicLong peakRevocableMemory = new AtomicLong();
// peak of the user + system + revocable memory reservation
private final AtomicLong currentTotalMemory = new AtomicLong();
private final AtomicLong peakTotalMemory = new AtomicLong();
private final AtomicLong peakTaskUserMemory = new AtomicLong();
private final AtomicLong peakTaskRevocableMemory = new AtomicLong();
private final AtomicLong peakTaskTotalMemory = new AtomicLong();
private final QueryStateTimer queryStateTimer;
private final StateMachine queryState;
private final AtomicBoolean queryCleanedUp = new AtomicBoolean();
private final AtomicReference setCatalog = new AtomicReference<>();
private final AtomicReference setSchema = new AtomicReference<>();
private final AtomicReference setPath = new AtomicReference<>();
private final AtomicReference setAuthorizationUser = new AtomicReference<>();
private final AtomicBoolean resetAuthorizationUser = new AtomicBoolean();
private final Map setSessionProperties = new ConcurrentHashMap<>();
private final Set resetSessionProperties = Sets.newConcurrentHashSet();
private final Map setRoles = new ConcurrentHashMap<>();
private final Map addedPreparedStatements = new ConcurrentHashMap<>();
private final Set deallocatedPreparedStatements = Sets.newConcurrentHashSet();
private final AtomicReference startedTransactionId = new AtomicReference<>();
private final AtomicBoolean clearTransactionId = new AtomicBoolean();
private final AtomicReference updateType = new AtomicReference<>();
private final AtomicReference failureCause = new AtomicReference<>();
private final AtomicReference> inputs = new AtomicReference<>(ImmutableSet.of());
private final AtomicReference> output = new AtomicReference<>(Optional.empty());
private final AtomicReference> referencedTables = new AtomicReference<>(ImmutableList.of());
private final AtomicReference> routines = new AtomicReference<>(ImmutableList.of());
private final StateMachine> finalQueryInfo;
private final WarningCollector warningCollector;
private final PlanOptimizersStatsCollector planOptimizersStatsCollector;
private final Optional queryType;
@GuardedBy("dynamicFiltersStatsSupplierLock")
private Supplier dynamicFiltersStatsSupplier = () -> DynamicFiltersStats.EMPTY;
private final Object dynamicFiltersStatsSupplierLock = new Object();
private final AtomicBoolean committed = new AtomicBoolean();
private final AtomicBoolean consumed = new AtomicBoolean();
private final NodeVersion version;
private QueryStateMachine(
String query,
Optional preparedQuery,
Session session,
URI self,
ResourceGroupId resourceGroup,
TransactionManager transactionManager,
Executor stateMachineExecutor,
Ticker ticker,
Metadata metadata,
WarningCollector warningCollector,
PlanOptimizersStatsCollector queryStatsCollector,
Optional queryType,
NodeVersion version)
{
this.query = requireNonNull(query, "query is null");
this.preparedQuery = requireNonNull(preparedQuery, "preparedQuery is null");
this.session = requireNonNull(session, "session is null");
this.queryId = session.getQueryId();
this.self = requireNonNull(self, "self is null");
this.resourceGroup = requireNonNull(resourceGroup, "resourceGroup is null");
this.transactionManager = requireNonNull(transactionManager, "transactionManager is null");
this.queryStateTimer = new QueryStateTimer(ticker);
this.metadata = requireNonNull(metadata, "metadata is null");
this.stateMachineExecutor = requireNonNull(stateMachineExecutor, "stateMachineExecutor is null");
this.planOptimizersStatsCollector = requireNonNull(queryStatsCollector, "queryStatsCollector is null");
this.queryState = new StateMachine<>("query " + query, stateMachineExecutor, QUEUED, TERMINAL_QUERY_STATES);
this.finalQueryInfo = new StateMachine<>("finalQueryInfo-" + queryId, stateMachineExecutor, Optional.empty());
this.outputManager = new QueryOutputManager(stateMachineExecutor);
this.warningCollector = requireNonNull(warningCollector, "warningCollector is null");
this.queryType = requireNonNull(queryType, "queryType is null");
this.version = requireNonNull(version, "version is null");
}
/**
* Created QueryStateMachines must be transitioned to terminal states to clean up resources.
*/
public static QueryStateMachine begin(
Optional existingTransactionId,
String query,
Optional preparedQuery,
Session session,
URI self,
ResourceGroupId resourceGroup,
boolean transactionControl,
TransactionManager transactionManager,
AccessControl accessControl,
Executor executor,
Metadata metadata,
WarningCollector warningCollector,
PlanOptimizersStatsCollector queryStatsCollector,
Optional queryType,
boolean faultTolerantExecutionExchangeEncryptionEnabled,
NodeVersion version)
{
return beginWithTicker(
existingTransactionId,
query,
preparedQuery,
session,
self,
resourceGroup,
transactionControl,
transactionManager,
accessControl,
executor,
Ticker.systemTicker(),
metadata,
warningCollector,
queryStatsCollector,
queryType,
faultTolerantExecutionExchangeEncryptionEnabled,
version);
}
static QueryStateMachine beginWithTicker(
Optional existingTransactionId,
String query,
Optional preparedQuery,
Session session,
URI self,
ResourceGroupId resourceGroup,
boolean transactionControl,
TransactionManager transactionManager,
AccessControl accessControl,
Executor executor,
Ticker ticker,
Metadata metadata,
WarningCollector warningCollector,
PlanOptimizersStatsCollector queryStatsCollector,
Optional queryType,
boolean faultTolerantExecutionExchangeEncryptionEnabled,
NodeVersion version)
{
// if there is an existing transaction, activate it
existingTransactionId.ifPresent(transactionId -> {
if (transactionControl) {
transactionManager.trySetActive(transactionId);
}
else {
transactionManager.checkAndSetActive(transactionId);
}
});
// add the session to the existing transaction, or create a new auto commit transaction for the session
// NOTE: for the start transaction command, no transaction is created
if (existingTransactionId.isPresent() || !transactionControl) {
// TODO: make autocommit isolation level a session parameter
TransactionId transactionId = existingTransactionId
.orElseGet(() -> transactionManager.beginTransaction(true));
session = session.beginTransactionId(transactionId, transactionManager, accessControl);
}
if (getRetryPolicy(session) == TASK && faultTolerantExecutionExchangeEncryptionEnabled) {
// encryption is mandatory for fault tolerant execution as it relies on an external storage to store intermediate data generated during an exchange
session = session.withExchangeEncryption(serializeAesEncryptionKey(createRandomAesEncryptionKey()));
}
Span querySpan = session.getQuerySpan();
querySpan.setAttribute(TrinoAttributes.QUERY_TYPE, queryType.map(Enum::name).orElse("UNKNOWN"));
QueryStateMachine queryStateMachine = new QueryStateMachine(
query,
preparedQuery,
session,
self,
resourceGroup,
transactionManager,
executor,
ticker,
metadata,
warningCollector,
queryStatsCollector,
queryType,
version);
queryStateMachine.addStateChangeListener(newState -> {
QUERY_STATE_LOG.debug("Query %s is %s", queryStateMachine.getQueryId(), newState);
if (newState.isDone()) {
queryStateMachine.getSession().getTransactionId().ifPresent(transactionManager::trySetInactive);
queryStateMachine.getOutputManager().setQueryCompleted();
}
});
queryStateMachine.addStateChangeListener(newState -> {
querySpan.addEvent("query_state", Attributes.of(
TrinoAttributes.EVENT_STATE, newState.toString()));
if (newState.isDone()) {
queryStateMachine.getFailureInfo().ifPresentOrElse(
failure -> {
ErrorCode errorCode = requireNonNull(failure.getErrorCode());
querySpan.setStatus(StatusCode.ERROR, nullToEmpty(failure.getMessage()))
.recordException(failure.toException())
.setAttribute(TrinoAttributes.ERROR_CODE, errorCode.getCode())
.setAttribute(TrinoAttributes.ERROR_NAME, errorCode.getName())
.setAttribute(TrinoAttributes.ERROR_TYPE, errorCode.getType().toString());
},
() -> querySpan.setStatus(StatusCode.OK));
querySpan.end();
}
});
metadata.beginQuery(session);
return queryStateMachine;
}
public QueryId getQueryId()
{
return queryId;
}
public Session getSession()
{
return session;
}
public Executor getStateMachineExecutor()
{
return stateMachineExecutor;
}
public long getPeakUserMemoryInBytes()
{
return peakUserMemory.get();
}
public long getPeakRevocableMemoryInBytes()
{
return peakRevocableMemory.get();
}
public long getPeakTotalMemoryInBytes()
{
return peakTotalMemory.get();
}
public long getPeakTaskUserMemory()
{
return peakTaskUserMemory.get();
}
public long getPeakTaskRevocableMemory()
{
return peakTaskRevocableMemory.get();
}
public long getPeakTaskTotalMemory()
{
return peakTaskTotalMemory.get();
}
public WarningCollector getWarningCollector()
{
return warningCollector;
}
public PlanOptimizersStatsCollector getPlanOptimizersStatsCollector()
{
return planOptimizersStatsCollector;
}
public void updateMemoryUsage(
long deltaUserMemoryInBytes,
long deltaRevocableMemoryInBytes,
long deltaTotalMemoryInBytes,
long taskUserMemoryInBytes,
long taskRevocableMemoryInBytes,
long taskTotalMemoryInBytes)
{
currentUserMemory.addAndGet(deltaUserMemoryInBytes);
currentRevocableMemory.addAndGet(deltaRevocableMemoryInBytes);
currentTotalMemory.addAndGet(deltaTotalMemoryInBytes);
peakUserMemory.updateAndGet(currentPeakValue -> Math.max(currentUserMemory.get(), currentPeakValue));
peakRevocableMemory.updateAndGet(currentPeakValue -> Math.max(currentRevocableMemory.get(), currentPeakValue));
peakTotalMemory.updateAndGet(currentPeakValue -> Math.max(currentTotalMemory.get(), currentPeakValue));
peakTaskUserMemory.accumulateAndGet(taskUserMemoryInBytes, Math::max);
peakTaskRevocableMemory.accumulateAndGet(taskRevocableMemoryInBytes, Math::max);
peakTaskTotalMemory.accumulateAndGet(taskTotalMemoryInBytes, Math::max);
}
public BasicQueryInfo getBasicQueryInfo(Optional rootStage)
{
// Query state must be captured first in order to provide a
// correct view of the query. For example, building this
// information, the query could finish, and the task states would
// never be visible.
QueryState state = queryState.get();
ErrorCode errorCode = null;
if (state == FAILED) {
ExecutionFailureInfo failureCause = this.failureCause.get();
if (failureCause != null) {
errorCode = failureCause.getErrorCode();
}
}
BasicStageStats stageStats = rootStage.orElse(EMPTY_STAGE_STATS);
BasicQueryStats queryStats = new BasicQueryStats(
queryStateTimer.getCreateTime(),
getEndTime().orElse(null),
queryStateTimer.getQueuedTime(),
queryStateTimer.getElapsedTime(),
queryStateTimer.getExecutionTime(),
stageStats.getFailedTasks(),
stageStats.getTotalDrivers(),
stageStats.getQueuedDrivers(),
stageStats.getRunningDrivers(),
stageStats.getCompletedDrivers(),
stageStats.getRawInputDataSize(),
stageStats.getRawInputPositions(),
stageStats.getPhysicalInputDataSize(),
stageStats.getCumulativeUserMemory(),
stageStats.getFailedCumulativeUserMemory(),
stageStats.getUserMemoryReservation(),
stageStats.getTotalMemoryReservation(),
succinctBytes(getPeakUserMemoryInBytes()),
succinctBytes(getPeakTotalMemoryInBytes()),
stageStats.getTotalCpuTime(),
stageStats.getFailedCpuTime(),
stageStats.getTotalScheduledTime(),
stageStats.getFailedScheduledTime(),
stageStats.isFullyBlocked(),
stageStats.getBlockedReasons(),
stageStats.getProgressPercentage(),
stageStats.getRunningPercentage());
return new BasicQueryInfo(
queryId,
session.toSessionRepresentation(),
Optional.of(resourceGroup),
state,
stageStats.isScheduled(),
self,
query,
Optional.ofNullable(updateType.get()),
preparedQuery,
queryStats,
errorCode == null ? null : errorCode.getType(),
errorCode,
queryType,
getRetryPolicy(session));
}
@VisibleForTesting
QueryInfo getQueryInfo(Optional rootStage)
{
// Query state must be captured first in order to provide a
// correct view of the query. For example, building this
// information, the query could finish, and the task states would
// never be visible.
QueryState state = queryState.get();
ExecutionFailureInfo failureCause = null;
ErrorCode errorCode = null;
if (state == FAILED) {
failureCause = this.failureCause.get();
if (failureCause != null) {
errorCode = failureCause.getErrorCode();
}
}
List allStages = getAllStages(rootStage);
QueryStats queryStats = getQueryStats(rootStage, allStages);
boolean finalInfo = state.isDone() && allStages.stream().allMatch(StageInfo::isFinalStageInfo);
return new QueryInfo(
queryId,
session.toSessionRepresentation(),
state,
self,
outputManager.getQueryOutputInfo().map(QueryOutputInfo::getColumnNames).orElse(ImmutableList.of()),
query,
preparedQuery,
queryStats,
Optional.ofNullable(setCatalog.get()),
Optional.ofNullable(setSchema.get()),
Optional.ofNullable(setPath.get()),
Optional.ofNullable(setAuthorizationUser.get()),
resetAuthorizationUser.get(),
setSessionProperties,
resetSessionProperties,
setRoles,
addedPreparedStatements,
deallocatedPreparedStatements,
Optional.ofNullable(startedTransactionId.get()),
clearTransactionId.get(),
updateType.get(),
rootStage,
failureCause,
errorCode,
warningCollector.getWarnings(),
inputs.get(),
output.get(),
referencedTables.get(),
routines.get(),
finalInfo,
Optional.of(resourceGroup),
queryType,
getRetryPolicy(session),
false,
version);
}
private QueryStats getQueryStats(Optional rootStage, List allStages)
{
int totalTasks = 0;
int runningTasks = 0;
int completedTasks = 0;
int failedTasks = 0;
int totalDrivers = 0;
int queuedDrivers = 0;
int runningDrivers = 0;
int blockedDrivers = 0;
int completedDrivers = 0;
double cumulativeUserMemory = 0;
double failedCumulativeUserMemory = 0;
long userMemoryReservation = 0;
long revocableMemoryReservation = 0;
long totalMemoryReservation = 0;
long totalScheduledTime = 0;
long failedScheduledTime = 0;
long totalCpuTime = 0;
long failedCpuTime = 0;
long totalBlockedTime = 0;
long physicalInputDataSize = 0;
long failedPhysicalInputDataSize = 0;
long physicalInputPositions = 0;
long failedPhysicalInputPositions = 0;
long physicalInputReadTime = 0;
long failedPhysicalInputReadTime = 0;
long internalNetworkInputDataSize = 0;
long failedInternalNetworkInputDataSize = 0;
long internalNetworkInputPositions = 0;
long failedInternalNetworkInputPositions = 0;
long rawInputDataSize = 0;
long failedRawInputDataSize = 0;
long rawInputPositions = 0;
long failedRawInputPositions = 0;
long processedInputDataSize = 0;
long failedProcessedInputDataSize = 0;
long processedInputPositions = 0;
long failedProcessedInputPositions = 0;
long inputBlockedTime = 0;
long failedInputBlockedTime = 0;
long outputDataSize = 0;
long failedOutputDataSize = 0;
long outputPositions = 0;
long failedOutputPositions = 0;
long outputBlockedTime = 0;
long failedOutputBlockedTime = 0;
long physicalWrittenDataSize = 0;
long failedPhysicalWrittenDataSize = 0;
ImmutableList.Builder stageGcStatistics = ImmutableList.builderWithExpectedSize(allStages.size());
boolean fullyBlocked = rootStage.isPresent();
Set blockedReasons = new HashSet<>();
ImmutableList.Builder operatorStatsSummary = ImmutableList.builder();
for (StageInfo stageInfo : allStages) {
StageStats stageStats = stageInfo.getStageStats();
totalTasks += stageStats.getTotalTasks();
runningTasks += stageStats.getRunningTasks();
completedTasks += stageStats.getCompletedTasks();
failedTasks += stageStats.getFailedTasks();
totalDrivers += stageStats.getTotalDrivers();
queuedDrivers += stageStats.getQueuedDrivers();
runningDrivers += stageStats.getRunningDrivers();
blockedDrivers += stageStats.getBlockedDrivers();
completedDrivers += stageStats.getCompletedDrivers();
cumulativeUserMemory += stageStats.getCumulativeUserMemory();
failedCumulativeUserMemory += stageStats.getFailedCumulativeUserMemory();
userMemoryReservation += stageStats.getUserMemoryReservation().toBytes();
revocableMemoryReservation += stageStats.getRevocableMemoryReservation().toBytes();
totalMemoryReservation += stageStats.getTotalMemoryReservation().toBytes();
totalScheduledTime += stageStats.getTotalScheduledTime().roundTo(MILLISECONDS);
failedScheduledTime += stageStats.getFailedScheduledTime().roundTo(MILLISECONDS);
totalCpuTime += stageStats.getTotalCpuTime().roundTo(MILLISECONDS);
failedCpuTime += stageStats.getFailedCpuTime().roundTo(MILLISECONDS);
totalBlockedTime += stageStats.getTotalBlockedTime().roundTo(MILLISECONDS);
if (!stageInfo.getState().isDone()) {
fullyBlocked &= stageStats.isFullyBlocked();
blockedReasons.addAll(stageStats.getBlockedReasons());
}
physicalInputDataSize += stageStats.getPhysicalInputDataSize().toBytes();
failedPhysicalInputDataSize += stageStats.getFailedPhysicalInputDataSize().toBytes();
physicalInputPositions += stageStats.getPhysicalInputPositions();
failedPhysicalInputPositions += stageStats.getFailedPhysicalInputPositions();
physicalInputReadTime += stageStats.getPhysicalInputReadTime().roundTo(MILLISECONDS);
failedPhysicalInputReadTime += stageStats.getFailedPhysicalInputReadTime().roundTo(MILLISECONDS);
internalNetworkInputDataSize += stageStats.getInternalNetworkInputDataSize().toBytes();
failedInternalNetworkInputDataSize += stageStats.getFailedInternalNetworkInputDataSize().toBytes();
internalNetworkInputPositions += stageStats.getInternalNetworkInputPositions();
failedInternalNetworkInputPositions += stageStats.getFailedInternalNetworkInputPositions();
PlanFragment plan = stageInfo.getPlan();
if (plan != null && plan.containsTableScanNode()) {
rawInputDataSize += stageStats.getRawInputDataSize().toBytes();
failedRawInputDataSize += stageStats.getFailedRawInputDataSize().toBytes();
rawInputPositions += stageStats.getRawInputPositions();
failedRawInputPositions += stageStats.getFailedRawInputPositions();
processedInputDataSize += stageStats.getProcessedInputDataSize().toBytes();
failedProcessedInputDataSize += stageStats.getFailedProcessedInputDataSize().toBytes();
processedInputPositions += stageStats.getProcessedInputPositions();
failedProcessedInputPositions += stageStats.getFailedProcessedInputPositions();
}
inputBlockedTime += stageStats.getInputBlockedTime().roundTo(NANOSECONDS);
failedInputBlockedTime += stageStats.getFailedInputBlockedTime().roundTo(NANOSECONDS);
outputBlockedTime += stageStats.getOutputBlockedTime().roundTo(NANOSECONDS);
failedOutputBlockedTime += stageStats.getFailedOutputBlockedTime().roundTo(NANOSECONDS);
physicalWrittenDataSize += stageStats.getPhysicalWrittenDataSize().toBytes();
failedPhysicalWrittenDataSize += stageStats.getFailedPhysicalWrittenDataSize().toBytes();
stageGcStatistics.add(stageStats.getGcInfo());
operatorStatsSummary.addAll(stageInfo.getStageStats().getOperatorSummaries());
}
if (rootStage.isPresent()) {
StageStats outputStageStats = rootStage.get().getStageStats();
outputDataSize += outputStageStats.getOutputDataSize().toBytes();
failedOutputDataSize += outputStageStats.getFailedOutputDataSize().toBytes();
outputPositions += outputStageStats.getOutputPositions();
failedOutputPositions += outputStageStats.getFailedOutputPositions();
}
boolean scheduled;
OptionalDouble progressPercentage;
OptionalDouble runningPercentage;
if (getRetryPolicy(session).equals(TASK)) {
// Unlike pipelined execution, fault tolerant execution doesn't execute stages all at
// once and some stages will be in PLANNED state in the middle of execution.
scheduled = rootStage.isPresent() && allStages.stream()
.map(StageInfo::getState)
.anyMatch(StageState::isScheduled);
if (!scheduled || totalDrivers == 0) {
progressPercentage = OptionalDouble.empty();
runningPercentage = OptionalDouble.empty();
}
else {
double completedPercentageSum = 0.0;
double runningPercentageSum = 0.0;
int totalStages = 0;
Queue queue = new ArrayDeque<>();
queue.add(rootStage.get());
while (!queue.isEmpty()) {
StageInfo stage = queue.poll();
StageStats stageStats = stage.getStageStats();
totalStages++;
if (stage.getState().isScheduled()) {
completedPercentageSum += 100.0 * stageStats.getCompletedDrivers() / stageStats.getTotalDrivers();
runningPercentageSum += 100.0 * stageStats.getRunningDrivers() / stageStats.getTotalDrivers();
}
queue.addAll(stage.getSubStages());
}
progressPercentage = OptionalDouble.of(min(100, completedPercentageSum / totalStages));
runningPercentage = OptionalDouble.of(min(100, runningPercentageSum / totalStages));
}
}
else {
scheduled = rootStage.isPresent() && allStages.stream()
.map(StageInfo::getState)
.allMatch(StageState::isScheduled);
if (!scheduled || totalDrivers == 0) {
progressPercentage = OptionalDouble.empty();
runningPercentage = OptionalDouble.empty();
}
else {
progressPercentage = OptionalDouble.of(min(100, (completedDrivers * 100.0) / totalDrivers));
runningPercentage = OptionalDouble.of(min(100, (runningDrivers * 100.0) / totalDrivers));
}
}
return new QueryStats(
queryStateTimer.getCreateTime(),
getExecutionStartTime().orElse(null),
getLastHeartbeat(),
getEndTime().orElse(null),
queryStateTimer.getElapsedTime(),
queryStateTimer.getQueuedTime(),
queryStateTimer.getResourceWaitingTime(),
queryStateTimer.getDispatchingTime(),
queryStateTimer.getExecutionTime(),
queryStateTimer.getAnalysisTime(),
queryStateTimer.getPlanningTime(),
queryStateTimer.getPlanningCpuTime(),
queryStateTimer.getFinishingTime(),
totalTasks,
runningTasks,
completedTasks,
failedTasks,
totalDrivers,
queuedDrivers,
runningDrivers,
blockedDrivers,
completedDrivers,
cumulativeUserMemory,
failedCumulativeUserMemory,
succinctBytes(userMemoryReservation),
succinctBytes(revocableMemoryReservation),
succinctBytes(totalMemoryReservation),
succinctBytes(getPeakUserMemoryInBytes()),
succinctBytes(getPeakRevocableMemoryInBytes()),
succinctBytes(getPeakTotalMemoryInBytes()),
succinctBytes(getPeakTaskUserMemory()),
succinctBytes(getPeakTaskRevocableMemory()),
succinctBytes(getPeakTaskTotalMemory()),
scheduled,
progressPercentage,
runningPercentage,
new Duration(totalScheduledTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
new Duration(failedScheduledTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
new Duration(totalCpuTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
new Duration(failedCpuTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
new Duration(totalBlockedTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
fullyBlocked,
blockedReasons,
succinctBytes(physicalInputDataSize),
succinctBytes(failedPhysicalInputDataSize),
physicalInputPositions,
failedPhysicalInputPositions,
new Duration(physicalInputReadTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
new Duration(failedPhysicalInputReadTime, MILLISECONDS).convertToMostSuccinctTimeUnit(),
succinctBytes(internalNetworkInputDataSize),
succinctBytes(failedInternalNetworkInputDataSize),
internalNetworkInputPositions,
failedInternalNetworkInputPositions,
succinctBytes(rawInputDataSize),
succinctBytes(failedRawInputDataSize),
rawInputPositions,
failedRawInputPositions,
succinctBytes(processedInputDataSize),
succinctBytes(failedProcessedInputDataSize),
processedInputPositions,
failedProcessedInputPositions,
new Duration(inputBlockedTime, NANOSECONDS).convertToMostSuccinctTimeUnit(),
new Duration(failedInputBlockedTime, NANOSECONDS).convertToMostSuccinctTimeUnit(),
succinctBytes(outputDataSize),
succinctBytes(failedOutputDataSize),
outputPositions,
failedOutputPositions,
new Duration(outputBlockedTime, NANOSECONDS).convertToMostSuccinctTimeUnit(),
new Duration(failedOutputBlockedTime, NANOSECONDS).convertToMostSuccinctTimeUnit(),
succinctBytes(physicalWrittenDataSize),
succinctBytes(failedPhysicalWrittenDataSize),
stageGcStatistics.build(),
getDynamicFiltersStats(),
operatorStatsSummary.build(),
planOptimizersStatsCollector.getTopRuleStats());
}
public void setOutputInfoListener(Consumer listener)
{
outputManager.setOutputInfoListener(listener);
}
public void addOutputTaskFailureListener(TaskFailureListener listener)
{
outputManager.addOutputTaskFailureListener(listener);
}
public void outputTaskFailed(TaskId taskId, Throwable failure)
{
outputManager.outputTaskFailed(taskId, failure);
}
public void setColumns(List columnNames, List columnTypes)
{
outputManager.setColumns(columnNames, columnTypes);
}
public void updateInputsForQueryResults(List inputs, boolean noMoreInputs)
{
outputManager.updateInputsForQueryResults(inputs, noMoreInputs);
}
public void setInputs(List inputs)
{
requireNonNull(inputs, "inputs is null");
this.inputs.set(ImmutableSet.copyOf(inputs));
}
public void setOutput(Optional
© 2015 - 2025 Weber Informatics LLC | Privacy Policy