All downloads are free. Search and download functionality uses the official Maven repository.

io.github.ericmedvet.jgea.problem.classification.GrammarBasedTextFlaggingProblem Maven / Gradle / Ivy

The newest version!
/*-
 * ========================LICENSE_START=================================
 * jgea-problem
 * %%
 * Copyright (C) 2018 - 2024 Eric Medvet
 * %%
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * =========================LICENSE_END==================================
 */

package io.github.ericmedvet.jgea.problem.classification;

import io.github.ericmedvet.jgea.core.problem.QualityBasedProblem;
import io.github.ericmedvet.jgea.core.representation.grammar.string.GrammarBasedProblem;
import io.github.ericmedvet.jgea.core.representation.grammar.string.StringGrammar;
import io.github.ericmedvet.jgea.core.representation.tree.Tree;
import io.github.ericmedvet.jgea.problem.extraction.string.RegexGrammar;
import io.github.ericmedvet.jnb.datastructure.Pair;
import java.util.List;
import java.util.Set;
import java.util.function.Function;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.stream.Collectors;

public class GrammarBasedTextFlaggingProblem extends TextFlaggingProblem
    implements GrammarBasedProblem>,
        QualityBasedProblem, List> {

  private final StringGrammar grammar;
  private final Function, Classifier> solutionMapper;

  public GrammarBasedTextFlaggingProblem(
      Set alphabet,
      Set options,
      List> data,
      int folds,
      int i,
      ClassificationFitness.Metric learningErrorMetric,
      ClassificationFitness.Metric validationErrorMetric) {
    super(data, folds, i, learningErrorMetric, validationErrorMetric);
    solutionMapper = (Tree tree) -> {
      String regex = tree.leaves().stream().map(Tree::content).collect(Collectors.joining());
      return (Classifier) s -> {
        Matcher matcher = Pattern.compile(regex).matcher(s);
        return matcher.find() ? Label.FOUND : Label.NOT_FOUND;
      };
    };
    if (alphabet == null) {
      grammar = new RegexGrammar(data.stream().map(Pair::first).toList(), options);
    } else {
      grammar = new RegexGrammar(alphabet, options);
    }
  }

  @Override
  public StringGrammar getGrammar() {
    return grammar;
  }

  @Override
  public Function, Classifier> getSolutionMapper() {
    return solutionMapper;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy