All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.solr.common.cloud.DocCollection Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.solr.common.cloud;

import static org.apache.solr.common.util.Utils.toJSONString;

import java.io.IOException;
import java.lang.invoke.MethodHandles;
import java.time.Instant;
import java.util.ArrayList;
import java.util.Collection;
import java.util.EnumSet;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Set;
import java.util.concurrent.atomic.AtomicReference;
import java.util.function.BiConsumer;
import java.util.function.BiPredicate;
import java.util.function.Supplier;
import org.apache.solr.common.cloud.Replica.ReplicaStateProps;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * Models a Collection in zookeeper (but that Java name is obviously taken, hence "DocCollection")
 */
public class DocCollection extends ZkNodeProps implements Iterable {

  public static final String COLLECTIONS_ZKNODE = "/collections";
  private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());

  private final int znodeVersion;

  private final String name;
  private final String configName;
  private final Map slices;
  private final Map activeSlices;
  private final Slice[] activeSlicesArr;
  private final Map> nodeNameReplicas;
  private final Map> nodeNameLeaderReplicas;
  private final DocRouter router;
  private final String znode;

  private final Integer replicationFactor;
  private final Integer numNrtReplicas;
  private final Integer numTlogReplicas;
  private final Integer numPullReplicas;
  private final Boolean readOnly;
  private final Instant creationTime;
  private final Boolean perReplicaState;
  private final Map replicaMap = new HashMap<>();
  private AtomicReference perReplicaStatesRef;

  /**
   * @see DocCollection#create(String, Map, Map, DocRouter, int, Instant, PrsSupplier)
   */
  @Deprecated
  public DocCollection(
      String name, Map slices, Map props, DocRouter router) {
    this(name, slices, props, router, Integer.MAX_VALUE, Instant.EPOCH, null);
  }

  /**
   * @see DocCollection#create(String, Map, Map, DocRouter, int, Instant, PrsSupplier)
   */
  @Deprecated
  public DocCollection(
      String name,
      Map slices,
      Map props,
      DocRouter router,
      int zkVersion) {
    this(name, slices, props, router, zkVersion, Instant.EPOCH, null);
  }

  /**
   * @param name The name of the collection
   * @param slices The logical shards of the collection. This is used directly and a copy is not
   *     made.
   * @param props The properties of the slice. This is used directly and a copy is not made.
   * @param zkVersion The version of the Collection node in Zookeeper (used for conditional
   *     updates).
   * @param creationTime The creation time of the collection
   * @see DocCollection#create(String, Map, Map, DocRouter, int, Instant, PrsSupplier)
   */
  private DocCollection(
      String name,
      Map slices,
      Map props,
      DocRouter router,
      int zkVersion,
      Instant creationTime,
      AtomicReference perReplicaStatesRef) {
    super(props);
    // -1 means any version in ZK CAS, so we choose Integer.MAX_VALUE instead to avoid accidental
    // overwrites
    this.znodeVersion = zkVersion == -1 ? Integer.MAX_VALUE : zkVersion;
    this.name = name;
    this.configName = (String) props.get(CollectionStateProps.CONFIGNAME);
    this.slices = slices;
    this.activeSlices = new HashMap<>();
    this.nodeNameLeaderReplicas = new HashMap<>();
    this.nodeNameReplicas = new HashMap<>();
    this.replicationFactor = (Integer) verifyProp(props, CollectionStateProps.REPLICATION_FACTOR);
    this.numNrtReplicas = (Integer) verifyProp(props, CollectionStateProps.NRT_REPLICAS, 0);
    this.numTlogReplicas = (Integer) verifyProp(props, CollectionStateProps.TLOG_REPLICAS, 0);
    this.numPullReplicas = (Integer) verifyProp(props, CollectionStateProps.PULL_REPLICAS, 0);
    this.perReplicaState =
        (Boolean) verifyProp(props, CollectionStateProps.PER_REPLICA_STATE, Boolean.FALSE);
    if (this.perReplicaState) {
      if (perReplicaStatesRef == null || perReplicaStatesRef.get() == null) {
        throw new RuntimeException(
            CollectionStateProps.PER_REPLICA_STATE
                + " = true , but perReplicaStates param is not provided");
      }
      this.perReplicaStatesRef = perReplicaStatesRef;
      for (Slice s : this.slices.values()) { // set the same reference to all slices too
        s.setPerReplicaStatesRef(this.perReplicaStatesRef);
      }
    }
    Boolean readOnly = (Boolean) verifyProp(props, CollectionStateProps.READ_ONLY);
    this.readOnly = readOnly == null ? Boolean.FALSE : readOnly;
    this.creationTime = creationTime;

    Iterator> iter = slices.entrySet().iterator();

    while (iter.hasNext()) {
      Map.Entry slice = iter.next();
      if (slice.getValue().getState() == Slice.State.ACTIVE) {
        this.activeSlices.put(slice.getKey(), slice.getValue());
      }
      for (Replica replica : slice.getValue()) {
        addNodeNameReplica(replica);
        if (perReplicaState) {
          replicaMap.put(replica.getName(), replica);
        }
      }
    }
    this.activeSlicesArr = activeSlices.values().toArray(new Slice[0]);
    this.router = router;
    this.znode = getCollectionPath(name);
    assert name != null && slices != null;
  }

  /**
   * Builds a DocCollection with an optional PrsSupplier
   *
   * @param name The name of the collection
   * @param slices The logical shards of the collection. This is used directly and a copy is not
   *     made.
   * @param props The properties of the slice. This is used directly and a copy is not made.
   * @param router router to partition int range into n ranges
   * @param zkVersion The version of the Collection node in Zookeeper (used for conditional
   *     updates).
   * @param creationTime The creation time of the collection
   * @param prsSupplier optional supplier for PerReplicaStates (PRS) for PRS enabled collections
   * @return a newly constructed DocCollection
   */
  public static DocCollection create(
      String name,
      Map slices,
      Map props,
      DocRouter router,
      int zkVersion,
      Instant creationTime,
      DocCollection.PrsSupplier prsSupplier) {
    boolean perReplicaState =
        (Boolean) verifyProp(props, CollectionStateProps.PER_REPLICA_STATE, Boolean.FALSE);
    PerReplicaStates perReplicaStates;
    if (perReplicaState) {
      if (prsSupplier == null) {
        throw new IllegalArgumentException(
            CollectionStateProps.PER_REPLICA_STATE + " = true , but prsSupplier is not provided");
      }

      if (!hasAnyReplica(
          slices)) { // a special case, if there is no replica, it should not fetch (first PRS
        // collection creation with no replicas). Otherwise, it would trigger exception
        // on fetching a state.json that does not exist yet
        perReplicaStates = PerReplicaStates.empty(name);
      } else {
        perReplicaStates = prsSupplier.get();
      }
    } else {
      perReplicaStates = null;
    }
    return new DocCollection(
        name,
        slices,
        props,
        router,
        zkVersion,
        creationTime,
        perReplicaStates != null ? new AtomicReference<>(perReplicaStates) : null);
  }

  private static boolean hasAnyReplica(Map slices) {
    for (Slice slice : slices.values()) {
      if (!slice.getReplicasMap().isEmpty()) {
        return true;
      }
    }
    return false;
  }

  public static String getCollectionPath(String coll) {
    return getCollectionPathRoot(coll) + "/state.json";
  }

  public static String getCollectionPathRoot(String coll) {
    return COLLECTIONS_ZKNODE + "/" + coll;
  }

  /**
   * Update our state with a state of a {@link PerReplicaStates} which could override states of
   * {@link Replica}.
   *
   * 

Take note that it updates the underlying AtomicReference such that all Slice and Replica * that holds the same AtomicReference will see the same update * *

This does not create a new DocCollection. */ public final DocCollection setPerReplicaStates(PerReplicaStates newPerReplicaStates) { if (this.perReplicaStatesRef != null) { log.debug("In-place update of PRS: {}", newPerReplicaStates); this.perReplicaStatesRef.set(newPerReplicaStates); } return this; } private void addNodeNameReplica(Replica replica) { List replicas = nodeNameReplicas.get(replica.getNodeName()); if (replicas == null) { replicas = new ArrayList<>(); nodeNameReplicas.put(replica.getNodeName(), replicas); } replicas.add(replica); if (replica.getStr(ReplicaStateProps.LEADER) != null) { List leaderReplicas = nodeNameLeaderReplicas.get(replica.getNodeName()); if (leaderReplicas == null) { leaderReplicas = new ArrayList<>(); nodeNameLeaderReplicas.put(replica.getNodeName(), leaderReplicas); } leaderReplicas.add(replica); } } public static Object verifyProp(Map props, String propName) { return verifyProp(props, propName, null); } public static Object verifyProp(Map props, String propName, Object def) { Object o = props.get(propName); if (o == null) return def; switch (propName) { case CollectionStateProps.REPLICATION_FACTOR: case CollectionStateProps.NRT_REPLICAS: case CollectionStateProps.PULL_REPLICAS: case CollectionStateProps.TLOG_REPLICAS: return Integer.parseInt(o.toString()); case CollectionStateProps.PER_REPLICA_STATE: case CollectionStateProps.READ_ONLY: return Boolean.parseBoolean(o.toString()); case "snitch": default: return o; } } /** * Use this to make an exact copy of DocCollection with a new set of Slices and every other * property as is * * @param slices the new set of Slices * @return the resulting DocCollection */ public DocCollection copyWithSlices(Map slices) { DocCollection result = new DocCollection( getName(), slices, propMap, router, znodeVersion, creationTime, perReplicaStatesRef); return result; } /** Return collection name. */ public String getName() { return name; } /** Return non-null config name */ public String getConfigName() { assert configName != null; return configName; } public Slice getSlice(String sliceName) { return slices.get(sliceName); } /** * @param consumer consume shardName vs. replica */ public void forEachReplica(BiConsumer consumer) { slices.forEach( (shard, slice) -> slice.getReplicasMap().forEach((s, replica) -> consumer.accept(shard, replica))); } /** Gets the list of all slices for this collection. */ public Collection getSlices() { return slices.values(); } /** Return the list of active slices for this collection. */ public Collection getActiveSlices() { return activeSlices.values(); } /** Return array of active slices for this collection (performance optimization). */ public Slice[] getActiveSlicesArr() { return activeSlicesArr; } /** Get the map of all slices (sliceName->Slice) for this collection. */ public Map getSlicesMap() { return slices; } /** Get the map of active slices (sliceName->Slice) for this collection. */ public Map getActiveSlicesMap() { return activeSlices; } /** Get the list of replicas hosted on the given node or null if none. */ public List getReplicas(String nodeName) { return nodeNameReplicas.get(nodeName); } /** Get the list of all leaders hosted on the given node or null if none. */ public List getLeaderReplicas(String nodeName) { return nodeNameLeaderReplicas.get(nodeName); } public int getZNodeVersion() { return znodeVersion; } public int getChildNodesVersion() { return perReplicaStatesRef == null ? 0 : perReplicaStatesRef.get().cversion; } public boolean isModified(int dataVersion, int childVersion) { if (dataVersion > znodeVersion) return true; if (childVersion > getChildNodesVersion()) return true; return false; } /** * @return replication factor for this collection or null if no replication factor exists. */ public Integer getReplicationFactor() { return replicationFactor; } public String getZNode() { return znode; } public DocRouter getRouter() { return router; } public boolean isReadOnly() { return readOnly; } /** * The creation time of the Collection. When this collection is read from ZooKeeper, this is the * creation time of the collection node. */ public Instant getCreationTime() { return creationTime; } @Override public String toString() { return "DocCollection(" + name + "/" + getZNode() + "/" + znodeVersion + " " + (perReplicaStatesRef == null ? "" : perReplicaStatesRef.get()) + ")=" + toJSONString(this); } @Override public void writeMap(EntryWriter ew) throws IOException { propMap.forEach(ew.getBiConsumer()); ew.put(CollectionStateProps.SHARDS, slices); } public Replica getReplica(String coreNodeName) { if (perReplicaState) { return replicaMap.get(coreNodeName); } for (Slice slice : slices.values()) { Replica replica = slice.getReplica(coreNodeName); if (replica != null) return replica; } return null; } public Replica getLeader(String sliceName) { Slice slice = getSlice(sliceName); if (slice == null) return null; return slice.getLeader(); } /** * Check that all replicas in a collection are live * * @see CollectionStatePredicate */ public static boolean isFullyActive( Set liveNodes, DocCollection collectionState, int expectedShards, int expectedReplicas) { Objects.requireNonNull(liveNodes); if (collectionState == null) return false; int activeShards = 0; for (Slice slice : collectionState) { int activeReplicas = 0; for (Replica replica : slice) { if (replica.isActive(liveNodes) == false) return false; activeReplicas++; } if (activeReplicas != expectedReplicas) return false; activeShards++; } return activeShards == expectedShards; } @Override public Iterator iterator() { return slices.values().iterator(); } public List getReplicas() { List replicas = new ArrayList<>(); for (Slice slice : this) { replicas.addAll(slice.getReplicas()); } return replicas; } /** * @param predicate test against shardName vs. replica * @return the first replica that matches the predicate */ public Replica getReplica(BiPredicate predicate) { final Replica[] result = new Replica[1]; forEachReplica( (s, replica) -> { if (result[0] != null) return; if (predicate.test(s, replica)) { result[0] = replica; } }); return result[0]; } public List getReplicas(EnumSet s) { List replicas = new ArrayList<>(); for (Slice slice : this) { replicas.addAll(slice.getReplicas(s)); } return replicas; } /** Get the shardId of a core on a specific node */ public String getShardId(String nodeName, String coreName) { for (Slice slice : this) { for (Replica replica : slice) { if (Objects.equals(replica.getNodeName(), nodeName) && Objects.equals(replica.getCoreName(), coreName)) return slice.getName(); } } return null; } @Override public boolean equals(Object that) { if (!(that instanceof DocCollection)) return false; DocCollection other = (DocCollection) that; return super.equals(that) && Objects.equals(this.name, other.name) && this.znodeVersion == other.znodeVersion && this.getChildNodesVersion() == other.getChildNodesVersion(); } @Override public int hashCode() { return Objects.hash(name, znodeVersion, getChildNodesVersion()); } /** * @return the number of replicas of type {@link org.apache.solr.common.cloud.Replica.Type#NRT} * this collection was created with */ public Integer getNumNrtReplicas() { return numNrtReplicas; } /** * @return the number of replicas of type {@link org.apache.solr.common.cloud.Replica.Type#TLOG} * this collection was created with */ public Integer getNumTlogReplicas() { return numTlogReplicas; } /** * @return the number of replicas of type {@link org.apache.solr.common.cloud.Replica.Type#PULL} * this collection was created with */ public Integer getNumPullReplicas() { return numPullReplicas; } public boolean isPerReplicaState() { return Boolean.TRUE.equals(perReplicaState); } public PerReplicaStates getPerReplicaStates() { return perReplicaStatesRef != null ? perReplicaStatesRef.get() : null; } public int getExpectedReplicaCount(Replica.Type type, int def) { Integer result = null; if (type == Replica.Type.NRT) result = numNrtReplicas; if (type == Replica.Type.PULL) result = numPullReplicas; if (type == Replica.Type.TLOG) result = numTlogReplicas; return result == null ? def : result; } /** JSON properties related to a collection's state. */ public interface CollectionStateProps { String NRT_REPLICAS = "nrtReplicas"; String PULL_REPLICAS = "pullReplicas"; String TLOG_REPLICAS = "tlogReplicas"; String REPLICATION_FACTOR = "replicationFactor"; String READ_ONLY = "readOnly"; String CONFIGNAME = "configName"; String DOC_ROUTER = "router"; String SHARDS = "shards"; String PER_REPLICA_STATE = "perReplicaState"; } public interface PrsSupplier extends Supplier {} }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy