All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.accumulo.server.master.balancer.TabletBalancer Maven / Gradle / Ivy

There is a newer version: 3.0.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   https://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.accumulo.server.master.balancer;

import static java.util.stream.Collectors.toList;

import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.SortedMap;

import org.apache.accumulo.core.clientImpl.thrift.ThriftSecurityException;
import org.apache.accumulo.core.conf.Property;
import org.apache.accumulo.core.data.TableId;
import org.apache.accumulo.core.dataImpl.KeyExtent;
import org.apache.accumulo.core.manager.balancer.AssignmentParamsImpl;
import org.apache.accumulo.core.manager.balancer.BalanceParamsImpl;
import org.apache.accumulo.core.master.thrift.TabletServerStatus;
import org.apache.accumulo.core.metadata.TServerInstance;
import org.apache.accumulo.core.rpc.ThriftUtil;
import org.apache.accumulo.core.rpc.clients.ThriftClientTypes;
import org.apache.accumulo.core.spi.balancer.BalancerEnvironment;
import org.apache.accumulo.core.tabletserver.thrift.TabletClientService.Client;
import org.apache.accumulo.core.tabletserver.thrift.TabletStats;
import org.apache.accumulo.core.trace.TraceUtil;
import org.apache.accumulo.server.ServerContext;
import org.apache.accumulo.server.conf.ServerConfigurationFactory;
import org.apache.accumulo.server.manager.balancer.BalancerEnvironmentImpl;
import org.apache.accumulo.server.master.state.TabletMigration;
import org.apache.thrift.TException;
import org.apache.thrift.transport.TTransportException;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import edu.umd.cs.findbugs.annotations.SuppressFBWarnings;

/**
 * This class is responsible for managing the distribution of tablets throughout an Accumulo
 * cluster. In most cases, users will want a balancer implementation which ensures a uniform
 * distribution of tablets, so that no individual tablet server is handling significantly more work
 * than any other.
 *
 * 

* Implementations may wish to store configuration in Accumulo's system configuration using the * {@link Property#GENERAL_ARBITRARY_PROP_PREFIX}. They may also benefit from using per-table * configuration using {@link Property#TABLE_ARBITRARY_PROP_PREFIX}. * * @deprecated since 2.1.0. Use {@link org.apache.accumulo.core.spi.balancer.TabletBalancer} * instead. */ @Deprecated(since = "2.1.0") @SuppressFBWarnings(value = "NM_SAME_SIMPLE_NAME_AS_INTERFACE", justification = "Class is deprecated and will be removed.") public abstract class TabletBalancer implements org.apache.accumulo.core.spi.balancer.TabletBalancer { private static final Logger log = LoggerFactory.getLogger(TabletBalancer.class); protected ServerContext context; @Override public void init(BalancerEnvironment balancerEnvironment) { var bei = (BalancerEnvironmentImpl) balancerEnvironment; init(bei.getContext()); } @Override public void getAssignments(AssignmentParameters params) { AssignmentParamsImpl api = (AssignmentParamsImpl) params; getAssignments(api.thriftCurrentStatus(), api.thriftUnassigned(), api.thriftAssignmentsOut()); } @Override public long balance(BalanceParameters params) { BalanceParamsImpl bpi = (BalanceParamsImpl) params; List migrationsOut = new ArrayList<>(); long result = balance(bpi.thriftCurrentStatus(), bpi.thriftCurrentMigrations(), migrationsOut); migrationsOut.forEach(mo -> bpi.addMigration(mo.tablet, mo.oldServer, mo.newServer)); return result; } /** * Initialize the TabletBalancer. This gives the balancer the opportunity to read the * configuration. * * @deprecated since 2.0.0; use {@link #init(ServerContext)} instead. */ @Deprecated(since = "2.0.0") public void init(ServerConfigurationFactory conf) { init(conf.getServerContext()); } /** * Initialize the TabletBalancer. This gives the balancer the opportunity to read the * configuration. * * @since 2.0.0 */ public void init(ServerContext context) { this.context = context; } /** * Assign tablets to tablet servers. This method is called whenever the manager finds tablets that * are unassigned. * * @param current The current table-summary state of all the online tablet servers. Read-only. The * TabletServerStatus for each server may be null if the tablet server has not yet * responded to a recent request for status. * @param unassigned A map from unassigned tablet to the last known tablet server. Read-only. * @param assignments A map from tablet to assigned server. Write-only. */ public abstract void getAssignments(SortedMap current, Map unassigned, Map assignments); /** * Ask the balancer if any migrations are necessary. * * If the balancer is going to self-abort due to some environmental constraint (e.g. it requires * some minimum number of tservers, or a maximum number of outstanding migrations), it should * issue a log message to alert operators. The message should be at WARN normally and at ERROR if * the balancer knows that the problem can not self correct. It should not issue these messages * more than once a minute. * * @param current The current table-summary state of all the online tablet servers. Read-only. * @param migrations the current set of migrations. Read-only. * @param migrationsOut new migrations to perform; should not contain tablets in the current set * of migrations. Write-only. * @return the time, in milliseconds, to wait before re-balancing. * * This method will not be called when there are unassigned tablets. */ public abstract long balance(SortedMap current, Set migrations, List migrationsOut); private static final long ONE_SECOND = 1000L; private boolean stuck = false; private long stuckNotificationTime = -1L; protected static final long TIME_BETWEEN_BALANCER_WARNINGS = 60 * ONE_SECOND; /** * A deferred call descendent TabletBalancers use to log why they can't continue. The call is * deferred so that TabletBalancer can limit how often messages happen. * * Implementations should be reused as much as possible. * * Be sure to pass in a properly scoped Logger instance so that messages indicate what part of the * system is having trouble. */ protected abstract static class BalancerProblem implements Runnable { protected final Logger balancerLog; public BalancerProblem(Logger logger) { balancerLog = logger; } } /** * If a TabletBalancer requires active tservers, it should use this problem to indicate when there * are none. NoTservers is safe to share with anyone who uses the same Logger. TabletBalancers * should have a single static instance. */ protected static class NoTservers extends BalancerProblem { public NoTservers(Logger logger) { super(logger); } @Override public void run() { balancerLog.warn("Not balancing because we don't have any tservers"); } } /** * If a TabletBalancer only balances when there are no outstanding migrations, it should use this * problem to indicate when they exist. * * Iff a TabletBalancer makes use of the migrations member to provide samples, then * OutstandingMigrations is not thread safe. */ protected static class OutstandingMigrations extends BalancerProblem { public Set migrations = Collections.emptySet(); public OutstandingMigrations(Logger logger) { super(logger); } @Override public void run() { balancerLog.warn("Not balancing due to {} outstanding migrations.", migrations.size()); balancerLog.debug("Sample up to 10 outstanding migrations: {}", migrations.stream().limit(10).collect(toList())); } } /** * Warn that a Balancer can't work because of some external restriction. Will not call the * provided logging handler more often than TIME_BETWEEN_BALANCER_WARNINGS */ protected void constraintNotMet(BalancerProblem cause) { if (stuck) { if ((System.currentTimeMillis() - stuckNotificationTime) > TIME_BETWEEN_BALANCER_WARNINGS) { cause.run(); stuckNotificationTime = System.currentTimeMillis(); } } else { stuck = true; stuckNotificationTime = System.currentTimeMillis(); } } /** * Resets logging about problems meeting an external constraint on balancing. */ protected void resetBalancerErrors() { stuck = false; } /** * Fetch the tablets for the given table by asking the tablet server. Useful if your balance * strategy needs details at the tablet level to decide what tablets to move. * * @param tserver The tablet server to ask. * @param tableId The table id * @return a list of tablet statistics * @throws ThriftSecurityException tablet server disapproves of your internal System password. * @throws TException any other problem */ public List getOnlineTabletsForTable(TServerInstance tserver, TableId tableId) throws ThriftSecurityException, TException { log.debug("Scanning tablet server {} for table {}", tserver, tableId); Client client = ThriftUtil.getClient(ThriftClientTypes.TABLET_SERVER, tserver.getHostAndPort(), context); try { return client.getTabletStats(TraceUtil.traceInfo(), context.rpcCreds(), tableId.canonical()); } catch (TTransportException e) { log.error("Unable to connect to {}: ", tserver, e); } finally { ThriftUtil.returnClient(client, context); } return null; } /** * Utility to ensure that the migrations from balance() are consistent: *

    *
  • Tablet objects are not null *
  • Source and destination tablet servers are not null and current *
* * @return A list of TabletMigration object that passed sanity checks. */ public static List checkMigrationSanity(Set current, List migrations) { List result = new ArrayList<>(migrations.size()); for (TabletMigration m : migrations) { if (m.tablet == null) { log.warn("Balancer gave back a null tablet {}", m); continue; } if (m.newServer == null) { log.warn("Balancer did not set the destination {}", m); continue; } if (m.oldServer == null) { log.warn("Balancer did not set the source {}", m); continue; } if (!current.contains(m.oldServer)) { log.warn("Balancer wants to move a tablet from a server that is not current: {}", m); continue; } if (!current.contains(m.newServer)) { log.warn("Balancer wants to move a tablet to a server that is not current: {}", m); continue; } result.add(m); } return result; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy