// io.trino.memory.TotalReservationOnBlockedNodesQueryLowMemoryKiller
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.memory;
import com.google.common.collect.Maps;
import io.trino.operator.RetryPolicy;
import io.trino.spi.QueryId;
import io.trino.spi.memory.MemoryPoolInfo;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import static java.util.Comparator.comparingLong;
/**
 * {@link LowMemoryKiller} that selects the query holding the largest total memory
 * reservation across all nodes whose memory pool is exhausted.
 *
 * <p>A node is treated as blocked when the sum of its pool's free bytes and reserved
 * revocable bytes is not positive. Only reservations on such nodes are counted.
 */
public class TotalReservationOnBlockedNodesQueryLowMemoryKiller
        implements LowMemoryKiller
{
    /**
     * Picks a whole query to kill based on memory reserved on blocked nodes.
     *
     * @param runningQueries queries currently running; used to look up each query's retry policy
     * @param nodes per-node memory information; nodes without a pool are ignored
     * @return a whole-query kill target for the query with the largest summed reservation on
     *         blocked nodes, or {@link Optional#empty()} when no blocked node reports an
     *         eligible reservation. Ties are broken arbitrarily.
     */
    @Override
    public Optional<KillTarget> chooseTargetToKill(List<RunningQueryInfo> runningQueries, List<MemoryInfo> nodes)
    {
        Map<QueryId, RunningQueryInfo> queriesById = Maps.uniqueIndex(runningQueries, RunningQueryInfo::getQueryId);
        Map<QueryId, Long> memoryReservationOnBlockedNodes = new HashMap<>();

        for (MemoryInfo node : nodes) {
            MemoryPoolInfo memoryPool = node.getPool();
            if (memoryPool == null) {
                continue;
            }
            // A node that still has free or revocable memory is not blocked.
            if (memoryPool.getFreeBytes() + memoryPool.getReservedRevocableBytes() > 0) {
                continue;
            }

            Map<QueryId, Long> queryMemoryReservations = memoryPool.getQueryMemoryReservations();
            for (Map.Entry<QueryId, Long> reservation : queryMemoryReservations.entrySet()) {
                QueryId queryId = reservation.getKey();
                RunningQueryInfo queryMemoryInfo = queriesById.get(queryId);
                if (queryMemoryInfo != null && queryMemoryInfo.getRetryPolicy() == RetryPolicy.TASK) {
                    // Do not kill whole queries which run with task retries enabled.
                    // Most of the time, if a query with task retries enabled is the root cause of a cluster
                    // out-of-memory error, individual tasks should already have been picked for killing by
                    // `chooseTasksToKill`. Yet sometimes there is a discrepancy between the task listing and
                    // the memory pool accounting: the pool may report it is fully reserved by Q while no
                    // running tasks from Q are reported for the given node.
                    continue;
                }
                // Queries missing from runningQueries are still counted; only the TASK retry policy excludes a query.
                memoryReservationOnBlockedNodes.merge(queryId, reservation.getValue(), Long::sum);
            }
        }

        return memoryReservationOnBlockedNodes.entrySet().stream()
                .max(comparingLong(Map.Entry::getValue))
                .map(Map.Entry::getKey)
                .map(KillTarget::wholeQuery);
    }
}