All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.cassandra.index.IndexStatusManager Maven / Gradle / Ivy

Go to download

The Apache Cassandra Project develops a highly scalable second-generation distributed database, bringing together Dynamo's fully distributed design and Bigtable's ColumnFamily-based data model.

There is a newer version: 5.0.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.cassandra.index;

import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;

import javax.annotation.Nonnull;
import javax.annotation.Nullable;

import com.google.common.annotations.VisibleForTesting;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import org.apache.cassandra.concurrent.ExecutorPlus;
import org.apache.cassandra.db.ConsistencyLevel;
import org.apache.cassandra.db.Keyspace;
import org.apache.cassandra.exceptions.ReadFailureException;
import org.apache.cassandra.exceptions.RequestFailureReason;
import org.apache.cassandra.gms.ApplicationState;
import org.apache.cassandra.gms.Gossiper;
import org.apache.cassandra.gms.VersionedValue;
import org.apache.cassandra.locator.Endpoints;
import org.apache.cassandra.locator.InetAddressAndPort;
import org.apache.cassandra.serializers.MarshalException;
import org.apache.cassandra.service.StorageService;
import org.apache.cassandra.utils.FBUtilities;
import org.apache.cassandra.utils.JsonUtils;

import static org.apache.cassandra.concurrent.ExecutorFactory.Global.executorFactory;

/**
 * Handles the status of an index across the ring, updating the status per index and endpoint
 * in a per-endpoint map.
 * 

* Peer status changes are recieved via the {@link StorageService} {@link org.apache.cassandra.gms.IEndpointStateChangeSubscriber}. *

* Local status changes are propagated to the {@link Gossiper} using an async executor. */ public class IndexStatusManager { private static final Logger logger = LoggerFactory.getLogger(IndexStatusManager.class); public static final IndexStatusManager instance = new IndexStatusManager(); // executes index status propagation task asynchronously to avoid potential deadlock on SIM private final ExecutorPlus statusPropagationExecutor = executorFactory().withJmxInternal() .sequential("StatusPropagationExecutor"); /** * A map of per-endpoint index statuses: the key of inner map is the identifier "keyspace.index" */ public final Map> peerIndexStatus = new HashMap<>(); private IndexStatusManager() {} /** * Remove endpoints whose indexes are not queryable for the specified {@link Index.QueryPlan}. * * @param liveEndpoints current live endpoints where non-queryable endpoints will be removed * @param keyspace to be queried * @param indexQueryPlan index query plan used in the read command * @param level consistency level of read command */ public > E filterForQuery(E liveEndpoints, Keyspace keyspace, Index.QueryPlan indexQueryPlan, ConsistencyLevel level) { E queryableEndpoints = liveEndpoints.filter(replica -> { for (Index index : indexQueryPlan.getIndexes()) { Index.Status status = getIndexStatus(replica.endpoint(), keyspace.getName(), index.getIndexMetadata().name); if (!index.isQueryable(status)) return false; } return true; }); int initial = liveEndpoints.size(); int filtered = queryableEndpoints.size(); // Throw ReadFailureException if read request cannot satisfy Consistency Level due to non-queryable indexes. // It is to provide a better UX, compared to throwing UnavailableException when the nodes are actually alive. 
if (initial != filtered) { int required = level.blockFor(keyspace.getReplicationStrategy()); if (required <= initial && required > filtered) { Map failureReasons = new HashMap<>(); liveEndpoints.without(queryableEndpoints.endpoints()) .forEach(replica -> failureReasons.put(replica.endpoint(), RequestFailureReason.INDEX_NOT_AVAILABLE)); throw new ReadFailureException(level, filtered, required, false, failureReasons); } } return queryableEndpoints; } /** * Recieve a new index status map from a peer. This will include the status for all the indexes on the peer. * * @param endpoint the {@link InetAddressAndPort} the index status map is coming from * @param versionedValue the {@link VersionedValue} containing the index status map */ public synchronized void receivePeerIndexStatus(InetAddressAndPort endpoint, VersionedValue versionedValue) { try { if (versionedValue == null) return; if (endpoint.equals(FBUtilities.getBroadcastAddressAndPort())) return; Map peerStatus = JsonUtils.fromJsonMap(versionedValue.value); Map indexStatus = new HashMap<>(); for (Map.Entry e : peerStatus.entrySet()) { String keyspaceIndex = e.getKey(); Index.Status status = Index.Status.valueOf(e.getValue()); indexStatus.put(keyspaceIndex, status); } Map oldStatus = peerIndexStatus.put(endpoint, indexStatus); Map updated = updatedIndexStatuses(oldStatus, indexStatus); Set removed = removedIndexStatuses(oldStatus, indexStatus); if (!updated.isEmpty() || !removed.isEmpty()) logger.debug("Received index status for peer {}:\n Updated: {}\n Removed: {}", endpoint, updated, removed); } catch (MarshalException | IllegalArgumentException e) { logger.warn("Unable to parse index status: {}", e.getMessage()); } } /** * Propagate a new index status to the ring. The new index status is added to the current index status map * and the whole map is sent to the ring as a {@link VersionedValue}. 
* * @param keyspace the keyspace name for the index * @param index the index name * @param status the new {@link Index.Status} */ public synchronized void propagateLocalIndexStatus(String keyspace, String index, Index.Status status) { try { Map states = peerIndexStatus.computeIfAbsent(FBUtilities.getBroadcastAddressAndPort(), k -> new HashMap<>()); String keyspaceIndex = identifier(keyspace, index); if (status == Index.Status.DROPPED) states.remove(keyspaceIndex); else states.put(keyspaceIndex, status); // Don't try and propagate if the gossiper isn't enabled. This is primarily for tests where the // Gossiper has not been started. If we attempt to propagate when not started an exception is // logged and this causes a number of dtests to fail. if (Gossiper.instance.isEnabled()) { String newStatus = JsonUtils.JSON_OBJECT_MAPPER.writeValueAsString(states); statusPropagationExecutor.submit(() -> { // schedule gossiper update asynchronously to avoid potential deadlock when another thread is holding // gossiper taskLock. VersionedValue value = StorageService.instance.valueFactory.indexStatus(newStatus); Gossiper.instance.addLocalApplicationState(ApplicationState.INDEX_STATUS, value); }); } } catch (Throwable e) { logger.warn("Unable to propagate index status: {}", e.getMessage()); } } @VisibleForTesting public synchronized Index.Status getIndexStatus(InetAddressAndPort peer, String keyspace, String index) { return peerIndexStatus.getOrDefault(peer, Collections.emptyMap()) .getOrDefault(identifier(keyspace, index), Index.Status.UNKNOWN); } /** * Returns the names of indexes that are present in oldStatus but absent in newStatus. 
*/ private @Nonnull Set removedIndexStatuses(@Nullable Map oldStatus, @Nonnull Map newStatus) { if (oldStatus == null) return Collections.emptySet(); Set result = new HashSet<>(oldStatus.keySet()); result.removeAll(newStatus.keySet()); return result; } /** * Returns a new map containing only the entries from newStatus that differ from corresponding entries in oldStatus. */ private @Nonnull Map updatedIndexStatuses(@Nullable Map oldStatus, @Nonnull Map newStatus) { Map delta = new HashMap<>(); for (Map.Entry e : newStatus.entrySet()) { if (oldStatus == null || e.getValue() != oldStatus.get(e.getKey())) delta.put(e.getKey(), e.getValue()); } return delta; } private String identifier(String keyspace, String index) { return keyspace + '.' + index; } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy