org.sejda.model.parameter.OcrTextParameters Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of sejda-model Show documentation
Show all versions of sejda-model Show documentation
Package containing reusable model for Sejda.
/*
* Created on 06 dic 2016
* Copyright 2015 by Andrea Vacondio ([email protected]).
* This file is part of Sejda.
*
* Sejda is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Sejda is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with Sejda. If not, see <http://www.gnu.org/licenses/>.
*/
package org.sejda.model.parameter;
import java.util.*;
import org.apache.commons.lang3.builder.EqualsBuilder;
import org.apache.commons.lang3.builder.HashCodeBuilder;
import org.sejda.model.input.PdfSource;
import org.sejda.model.output.MultipleTaskOutput;
import org.sejda.model.parameter.base.AbstractParameters;
import org.sejda.model.parameter.base.MultipleOutputTaskParameters;
import org.sejda.model.parameter.base.MultiplePdfSourceTaskParameters;
import org.sejda.model.validation.constraint.NotEmpty;
import javax.validation.Valid;
import javax.validation.constraints.NotNull;
/**
* Parameter class to extract text from multiple documents performing OCR
*
* @author Andrea Vacondio
*/
public class OcrTextParameters extends AbstractParameters
implements MultiplePdfSourceTaskParameters, MultipleOutputTaskParameters {
private String outputPrefix = "";
@Valid
@NotNull
private MultipleTaskOutput output;
@NotEmpty
@Valid
private List> sourceList = new ArrayList>();
@NotEmpty
private String textEncoding = "UTF-8";
private Set languages = new LinkedHashSet<>();
/**
* Adds a language o the list of possible languages of the text found in the documents. This can help the OCR engine to return a more accurate result.
*
* @param language
*/
public void addLanguage(Locale language) {
this.languages.add(language);
}
/**
* @return Languages that can be fed to the OCR engine to return a more accurate result
*/
public Set getLanguages() {
return languages;
}
public String getTextEncoding() {
return textEncoding;
}
public void setTextEncoding(String textEncoding) {
this.textEncoding = textEncoding;
}
@Override
public MultipleTaskOutput getOutput() {
return output;
}
@Override
public void setOutput(MultipleTaskOutput output) {
this.output = output;
}
@Override
public String getOutputPrefix() {
return outputPrefix;
}
@Override
public void setOutputPrefix(String outputPrefix) {
this.outputPrefix = outputPrefix;
}
/**
* adds the input source to the source list.
*
* @param input
*/
@Override
public void addSource(PdfSource> input) {
sourceList.add(input);
}
/**
* @return an unmodifiable view of the source list
*/
@Override
public List> getSourceList() {
return Collections.unmodifiableList(sourceList);
}
@Override
public int hashCode() {
return new HashCodeBuilder().appendSuper(super.hashCode()).append(output).append(sourceList)
.append(textEncoding).append(outputPrefix).append(languages).toHashCode();
}
@Override
public boolean equals(Object other) {
if (this == other) {
return true;
}
if (!(other instanceof OcrTextParameters)) {
return false;
}
OcrTextParameters parameter = (OcrTextParameters) other;
return new EqualsBuilder().appendSuper(super.equals(other)).append(output, parameter.output)
.append(sourceList, parameter.sourceList).append(textEncoding, parameter.textEncoding)
.append(outputPrefix, parameter.outputPrefix)
.append(languages, parameter.languages)
.isEquals();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy