All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.languagetool.server.PipelinePool Maven / Gradle / Ivy

There is a newer version: 6.4
Show newest version
/*
 *  LanguageTool, a natural language style checker
 *  * Copyright (C) 2018 Fabian Richter
 *  *
 *  * This library is free software; you can redistribute it and/or
 *  * modify it under the terms of the GNU Lesser General Public
 *  * License as published by the Free Software Foundation; either
 *  * version 2.1 of the License, or (at your option) any later version.
 *  *
 *  * This library is distributed in the hope that it will be useful,
 *  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 *  * Lesser General Public License for more details.
 *  *
 *  * You should have received a copy of the GNU Lesser General Public
 *  * License along with this library; if not, write to the Free Software
 *  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301
 *  * USA
 *
 */

package org.languagetool.server;

import com.google.common.cache.CacheBuilder;
import com.google.common.cache.CacheLoader;
import com.google.common.cache.LoadingCache;
import org.apache.commons.lang3.builder.EqualsBuilder;
import org.apache.commons.lang3.builder.HashCodeBuilder;
import org.apache.commons.lang3.builder.ToStringBuilder;
import org.languagetool.*;
import org.languagetool.gui.Configuration;
import org.languagetool.rules.DictionaryMatchFilter;
import org.languagetool.rules.RemoteRuleConfig;
import org.languagetool.tools.Tools;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.IOException;
import java.util.Collections;
import java.util.HashSet;
import java.util.List;
import java.util.concurrent.ConcurrentLinkedQueue;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.stream.Collectors;

/**
 * Caches pre-configured JLanguageTool instances to avoid costly setup time of rules, etc.
 * TODO: reimplement using apache commons KeyedObjectPool
 */
class PipelinePool {

  private static final Logger logger = LoggerFactory.getLogger(PipelinePool.class);

  static final long PIPELINE_EXPIRE_TIME = 15 * 60 * 1000;

  public static class PipelineSettings {
    private final Language lang;
    private final Language motherTongue;
    private final TextChecker.QueryParams query;
    private final UserConfig userConfig;
    private final GlobalConfig globalConfig;
    
    PipelineSettings(Language lang, Language motherTongue, TextChecker.QueryParams params, GlobalConfig globalConfig, UserConfig userConfig) {
      this.lang = lang;
      this.motherTongue = motherTongue;
      this.query = params;
      this.userConfig = userConfig;
      this.globalConfig = globalConfig;
    }

    @Override
    public int hashCode() {
      return new HashCodeBuilder(17, 31)
        .append(lang)
        .append(motherTongue)
        .append(query)
        .append(globalConfig)
        .append(userConfig)
        .toHashCode();
    }

    @Override
    public boolean equals(Object obj) {
      if (obj == this) return true;
      if (obj == null || getClass() != obj.getClass()) {
        return false;
      }
      PipelineSettings other = (PipelineSettings) obj;
      return new EqualsBuilder()
        .append(lang, other.lang)
        .append(motherTongue, other.motherTongue)
        .append(query, other.query)
        .append(globalConfig, other.globalConfig)
        .append(userConfig, other.userConfig)
        .isEquals();
    }

    @Override
    public String toString() {
      return new ToStringBuilder(this)
        .append("lang", lang)
        .append("motherTongue", motherTongue)
        .append("query", query)
        .append("globalConfig", globalConfig)
        .append("user", userConfig)
        .build();
    }
  }

  private final HTTPServerConfig config;
  private final ResultCache cache;
  private final LoadingCache> pool;
  private final boolean internalServer;

  private long pipelineExpireCheckTimestamp;
  // stats
  private long pipelinesUsed;
  private long requests;

  PipelinePool(HTTPServerConfig config, ResultCache cache, boolean internalServer) {
    this.internalServer = internalServer;
    this.config = config;
    this.cache = cache;
    this.pipelineExpireCheckTimestamp = System.currentTimeMillis();
    int maxPoolSize = config.getMaxPipelinePoolSize();
    int expireTime = config.getPipelineExpireTime();
    if (config.isPipelineCachingEnabled()) {
      this.pool = CacheBuilder.newBuilder()
        .maximumSize(maxPoolSize)
        .expireAfterAccess(expireTime, TimeUnit.SECONDS)
        .build(new CacheLoader>() {
          @Override
          public ConcurrentLinkedQueue load(PipelineSettings key) {
            return new ConcurrentLinkedQueue<>();
          }
        });
    } else {
      this.pool = null;
    }
  }

  Pipeline getPipeline(PipelineSettings settings) throws Exception {
    if (pool != null) {
      // expire old pipelines in queues (where settings may be used, but some of the created pipelines are unused)
      long expireCheckDelta = System.currentTimeMillis() - pipelineExpireCheckTimestamp;
      if (expireCheckDelta > PIPELINE_EXPIRE_TIME) {
        AtomicInteger removed = new AtomicInteger();
        pipelineExpireCheckTimestamp = System.currentTimeMillis();
        //pool.asMap().forEach((s, queue) -> queue.removeIf(Pipeline::isExpired));
        pool.asMap().forEach((s, queue) -> queue.removeIf(pipeline -> {
          if (pipeline.isExpired()) {
            removed.getAndIncrement();
            return true;
          } else {
            return false;
          }
        }));
        ServerTools.print("Removing " + removed.get() + " expired pipelines");
      }

      requests++;
      ConcurrentLinkedQueue pipelines = pool.get(settings);
      if (requests % 1000 == 0) {
        logger.info(String.format("Pipeline cache stats: %f hit rate", (double) pipelinesUsed / requests));
      }
      Pipeline pipeline = pipelines.poll();
      if (pipeline == null) {
        //ServerTools.print(String.format("No prepared pipeline found for %s; creating one.", settings));
        pipeline = createPipeline(settings.lang, settings.motherTongue, settings.query, settings.globalConfig, settings.userConfig, config.getDisabledRuleIds());
      } else {
        pipelinesUsed++;
        //ServerTools.print(String.format("Prepared pipeline found for %s; using it.", settings));
      }
      return pipeline;
    } else {
      return createPipeline(settings.lang, settings.motherTongue, settings.query, settings.globalConfig, settings.userConfig, config.getDisabledRuleIds());
    }
  }

  void returnPipeline(PipelineSettings settings, Pipeline pipeline) throws ExecutionException {
    if (pool == null) return;
    ConcurrentLinkedQueue pipelines = pool.get(settings);
    pipeline.refreshExpireTimer();
    pipelines.add(pipeline);
  }

  /**
   * Create a JLanguageTool instance for a specific language, mother tongue, and rule configuration.
   * Uses Pipeline wrapper to safely share objects
   *  @param lang the language to be used
   * @param motherTongue the user's mother tongue or {@code null}
   */
  Pipeline createPipeline(Language lang, Language motherTongue, TextChecker.QueryParams params, GlobalConfig globalConfig,
                          UserConfig userConfig, List disabledRuleIds)
    throws Exception { // package-private for mocking
    Pipeline lt = new Pipeline(lang, params.altLanguages, motherTongue, cache, globalConfig, userConfig, params.inputLogging);
    lt.setMaxErrorsPerWordRate(config.getMaxErrorsPerWordRate());
    lt.disableRules(disabledRuleIds);
    if (config.getLanguageModelDir() != null) {
      lt.activateLanguageModelRules(config.getLanguageModelDir());
    }
    if (config.getWord2VecModelDir () != null) {
      lt.activateWord2VecModelRules(config.getWord2VecModelDir());
    }
    if (config.getRulesConfigFile() != null) {
      configureFromRulesFile(lt, lang);
    } else {
      configureFromGUI(lt, lang);
    }
    if (params.regressionTestMode) {
      List rules = Collections.emptyList();
      try {
        if (config.getRemoteRulesConfigFile() != null) {
          rules = RemoteRuleConfig.load(config.getRemoteRulesConfigFile());
        }
      } catch (Exception e) {
        logger.error("Could not load remote rule configuration", e);
      }
      // modify remote rule configuration: no timeouts, downtime, ...
      rules = rules.stream().map(c -> {
        return new RemoteRuleConfig(c.getRuleId(), c.getUrl(), c.getPort(),
          0, 0L, 0f,
          0, 0L, c.getOptions());
      }).collect(Collectors.toList());
      lt.activateRemoteRules(rules);
    } else {
      lt.activateRemoteRules(config.getRemoteRulesConfigFile());
    }
    if (params.useQuerySettings) {
      Tools.selectRules(lt, new HashSet<>(params.disabledCategories), new HashSet<>(params.enabledCategories),
        new HashSet<>(params.disabledRules), new HashSet<>(params.enabledRules), params.useEnabledOnly, params.enableTempOffRules);
    }
    if (userConfig.filterDictionaryMatches()) {
      lt.addMatchFilter(new DictionaryMatchFilter(userConfig));
    }
    if (pool != null) {
      lt.setupFinished();
    }
    return lt;
  }

  private void configureFromRulesFile(JLanguageTool langTool, Language lang) throws IOException {
    ServerTools.print("Using options configured in " + config.getRulesConfigFile());
    // If we are explicitly configuring from rules, ignore the useGUIConfig flag
    if (config.getRulesConfigFile() != null) {
      org.languagetool.gui.Tools.configureFromRules(langTool, new Configuration(config.getRulesConfigFile()
        .getCanonicalFile().getParentFile(), config.getRulesConfigFile().getName(), lang));
    } else {
      throw new RuntimeException("config.getRulesConfigFile() is null");
    }
  }

  private void configureFromGUI(JLanguageTool langTool, Language lang) throws IOException {
    Configuration config = new Configuration(lang);
    if (internalServer && config.getUseGUIConfig()) {
      ServerTools.print("Using options configured in the GUI");
      org.languagetool.gui.Tools.configureFromRules(langTool, config);
    }
  }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy