All Downloads are FREE. Search and download functionalities are using the official Maven repository.

ai.grakn.engine.task.postprocessing.CountPostProcessor Maven / Gradle / Ivy

There is a newer version: 1.4.3
Show newest version
/*
 * Grakn - A Distributed Semantic Database
 * Copyright (C) 2016-2018 Grakn Labs Limited
 *
 * Grakn is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * Grakn is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with Grakn. If not, see .
 */

package ai.grakn.engine.task.postprocessing;

import ai.grakn.GraknConfigKey;
import ai.grakn.GraknTxType;
import ai.grakn.Keyspace;
import ai.grakn.concept.ConceptId;
import ai.grakn.engine.GraknConfig;
import ai.grakn.engine.factory.EngineGraknTxFactory;
import ai.grakn.engine.lock.LockProvider;
import ai.grakn.kb.internal.EmbeddedGraknTx;
import ai.grakn.kb.log.CommitLog;
import com.codahale.metrics.MetricRegistry;
import com.codahale.metrics.Timer;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.HashSet;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.locks.Lock;

import static com.codahale.metrics.MetricRegistry.name;

/**
 * 

* Class responsible for updating the number of {@link ai.grakn.concept.Thing}s each {@link ai.grakn.concept.Type} * currently has. *

* * @author Filipe Peliz Pinto Teixeira */ public class CountPostProcessor { private final static Logger LOG = LoggerFactory.getLogger(CountPostProcessor.class); private final CountStorage countStorage; private final MetricRegistry metricRegistry; private final EngineGraknTxFactory factory; private final LockProvider lockProvider; private final long shardingThreshold; private CountPostProcessor(GraknConfig engineConfig, EngineGraknTxFactory factory, LockProvider lockProvider, MetricRegistry metricRegistry, CountStorage countStorage) { this.countStorage = countStorage; this.shardingThreshold = engineConfig.getProperty(GraknConfigKey.SHARDING_THRESHOLD); this.metricRegistry = metricRegistry; this.factory = factory; this.lockProvider = lockProvider; } public static CountPostProcessor create(GraknConfig engineConfig, EngineGraknTxFactory factory, LockProvider lockProvider, MetricRegistry metricRegistry, CountStorage countStorage) { return new CountPostProcessor(engineConfig, factory, lockProvider, metricRegistry, countStorage); } /** * Updates the counts of {@link ai.grakn.concept.Type}s based on the commit logs received. * * @param commitLog The commit log containing the details of the job */ public void updateCounts(CommitLog commitLog){ try (Timer.Context context = metricRegistry.timer(name(CountPostProcessor.class, "execution")).time()) { Map jobs = commitLog.instanceCount(); metricRegistry.histogram(name(CountPostProcessor.class, "jobs")) .update(jobs.size()); //We Use countStorage to keep track of counts in order to ensure sharding happens in a centralised manner. //The graph cannot be used because each engine can have it's own snapshot of the graph with caching which makes //values only approximately correct Set conceptToShard = new HashSet<>(); //Update counts jobs.forEach((key, value) -> { metricRegistry .histogram(name(CountPostProcessor.class, "shard-size-increase")) .update(value); Timer.Context contextSingle = metricRegistry .timer(name(CountPostProcessor.class, "execution-single")).time(); try { if (incrementInstanceCountAndCheckIfShardingIsNeeded(countStorage, commitLog.keyspace(), key, value, shardingThreshold)) { conceptToShard.add(key); } } finally { contextSingle.stop(); } }); //Shard anything which requires sharding conceptToShard.forEach(type -> { Timer.Context contextSharding = metricRegistry.timer("sharding").time(); try { shardConcept(countStorage, factory, commitLog.keyspace(), type, shardingThreshold); } finally { contextSharding.stop(); } }); LOG.debug("Updating instance count successful for {} tasks", jobs.size()); } catch(Exception e) { LOG.error("Could not terminate task", e); throw e; } } /** * Updates the type counts in countStorage and checks if sharding is needed. * * @param keyspace The keyspace of the graph which the type comes from * @param conceptId The id of the concept with counts to update * @param value The number of instances which the type has gained/lost * @return true if sharding is needed. */ private static boolean incrementInstanceCountAndCheckIfShardingIsNeeded(CountStorage countStorage, Keyspace keyspace, ConceptId conceptId, long value, long shardingThreshold){ long numShards = countStorage.getShardCount(keyspace, conceptId); if(numShards == 0) numShards = 1; long numInstances = countStorage.incrementInstanceCount(keyspace, conceptId, value); return numInstances > shardingThreshold * numShards; } /** * Performs the high level sharding operation. This includes: * - Acquiring a lock to ensure only one thing can shard * - Checking if sharding is still needed after having the lock * - Actually sharding * - Incrementing the number of shards on each type * * @param keyspace The database containing the {@link ai.grakn.concept.Type} to shard * @param conceptId The id of the concept to shard */ private void shardConcept(CountStorage countStorage, EngineGraknTxFactory factory, Keyspace keyspace, ConceptId conceptId, long shardingThreshold){ Lock engineLock = lockProvider.getLock(getLockingKey(keyspace, conceptId)); engineLock.lock(); //Try to get the lock try { //Check if sharding is still needed. Another engine could have sharded whilst waiting for lock if (incrementInstanceCountAndCheckIfShardingIsNeeded(countStorage, keyspace, conceptId, 0, shardingThreshold)) { try(EmbeddedGraknTx tx = factory.tx(keyspace, GraknTxType.WRITE)) { tx.shard(conceptId); tx.commitSubmitNoLogs(); } //Update number of shards countStorage.incrementShardCount(keyspace, conceptId, 1); } } finally { engineLock.unlock(); } } private static String getLockingKey(Keyspace keyspace, ConceptId conceptId){ return "/updating-instance-count-lock/" + keyspace + "/" + conceptId.getValue(); } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy