org.languagetool.tools.ContextTools Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of languagetool-core Show documentation
Show all versions of languagetool-core Show documentation
LanguageTool is an Open Source proofreading software for English, French, German, Polish, Romanian, and more than 20 other languages. It finds many errors that a simple spell checker cannot detect, such as mixing up there/their, and it detects some grammar problems.
/* LanguageTool, a natural language style checker
* Copyright (C) 2012 Daniel Naber (http://www.danielnaber.de)
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301
* USA
*/
package org.languagetool.tools;
import org.apache.commons.lang3.StringUtils;
/**
 * Helper class to mark errors in text.
 *
 * <p>Given a character range inside a text, this class cuts out the range together
 * with up to {@code contextSize} characters on either side and marks the range,
 * either by wrapping it in configurable start/end marker strings
 * ({@link #getContext(int, int, String)}) or by placing {@code ^} characters on a
 * second line ({@link #getPlainTextContext(int, int, String)}).
 *
 * <p>Instances are configured through setters that mutate plain fields without any
 * synchronization.
 */
public class ContextTools {

  /** Number of characters kept to the left and to the right of the error. */
  private int contextSize = 40;
  /** Whether {@link #getContext(int, int, String)} HTML-escapes the text it returns. */
  private boolean escapeHtml = true;
  /** Inserted verbatim (never escaped) directly before the error; empty by default. */
  private String errorMarkerStart = "";
  /** Inserted verbatim (never escaped) directly after the error; empty by default. */
  private String errorMarkerEnd = "";

  public ContextTools() {
  }

  /**
   * Get the context of the given region, with the region itself wrapped in the
   * configured error markers.
   *
   * <p>Line feeds in the returned excerpt are replaced by spaces, and {@code "..."} is
   * added on each side where the excerpt does not reach the start or end of
   * {@code contents}. If HTML escaping is enabled (the default), the text before, inside
   * and after the region is escaped with {@code StringTools.escapeHTML} and spaces inside
   * the region are turned into {@code &nbsp;}; the marker strings are inserted as-is.
   *
   * <p>An empty region ({@code fromPos == toPos}) is supported: both markers are then
   * inserted next to each other at that position.
   *
   * @param fromPos start of the error region in {@code contents} (inclusive)
   * @param toPos end of the error region in {@code contents} (exclusive)
   * @param contents the text that contains the error
   * @return the excerpt with the error region marked
   * @throws StringIndexOutOfBoundsException unless
   *         {@code 0 <= fromPos <= toPos <= contents.length()}
   */
  public String getContext(int fromPos, int toPos, String contents) {
    // calculate context region:
    int startContent = fromPos - contextSize;
    String prefix = "...";
    String postfix = "...";
    if (startContent < 0) {
      prefix = "";
      startContent = 0;
    }
    int endContent = toPos + contextSize;
    int textLength = contents.length();
    if (endContent > textLength) {
      postfix = "";
      endContent = textLength;
    }
    String result = prefix + contents.substring(startContent, endContent).replace('\n', ' ') + postfix;
    // Offsets of the error inside 'result'. They are computed directly rather than by
    // searching a '^' marker line, because such a line contains no '^' at all for an
    // empty region, which used to end in substring(-1, 0).
    int startMark = prefix.length() + fromPos - startContent;
    int endMark = startMark + (toPos - fromPos);  // exclusive
    String beforeError = result.substring(0, startMark);
    String errorPart = result.substring(startMark, endMark);
    String afterError = result.substring(endMark);
    if (escapeHtml) {
      beforeError = StringTools.escapeHTML(beforeError);
      // make sure whitespace errors are visible: HTML collapses plain spaces
      errorPart = StringTools.escapeHTML(errorPart).replace(" ", "&nbsp;");
      afterError = StringTools.escapeHTML(afterError);
    }
    return beforeError + errorMarkerStart + errorPart + errorMarkerEnd + afterError;
  }

  /**
   * Get a plain text context that uses {@code ^} characters in a new line as a marker of the
   * given string region. Ignores {@link #setEscapeHtml(boolean)}.
   *
   * <p>Line feeds, carriage returns and tabs in the excerpt are replaced by spaces so
   * that the marker line stays aligned with the text above it.
   *
   * @param fromPos start of the error region in {@code contents} (inclusive)
   * @param toPos end of the error region in {@code contents} (exclusive)
   * @param contents the text that contains the error
   * @return two lines separated by {@code '\n'}: the excerpt and the marker line
   * @since 2.3
   */
  public String getPlainTextContext(int fromPos, int toPos, String contents) {
    // calculate context region:
    int startContent = fromPos - contextSize;
    String prefix = "...";
    String postfix = "...";
    if (startContent < 0) {
      prefix = "";
      startContent = 0;
    }
    int endContent = toPos + contextSize;
    if (endContent > contents.length()) {
      postfix = "";
      endContent = contents.length();
    }
    return prefix +
            contents.substring(startContent, endContent).replace('\n', ' ').replace('\r', ' ').replace('\t', ' ') +
            postfix + '\n' +
            getMarker(fromPos, toPos, startContent, endContent, prefix);
  }

  /**
   * Set the string used to mark the beginning and end of an error, e.g. {@code <span>} and {@code </span>}
   * @since 5.1
   */
  public void setErrorMarker(String start, String end) {
    errorMarkerStart = start;
    errorMarkerEnd = end;
  }

  /**
   * Set the string used to mark the beginning of an error, e.g. {@code <span>}
   */
  public void setErrorMarkerStart(String errorMarkerStart) {
    this.errorMarkerStart = errorMarkerStart;
  }

  /**
   * Set the string used to mark the end of an error, e.g. {@code </span>}
   */
  public void setErrorMarkerEnd(String errorMarkerEnd) {
    this.errorMarkerEnd = errorMarkerEnd;
  }

  /**
   * The context size of the error. This many characters of the original text will be used
   * from the left and from the right context of the error.
   */
  public void setContextSize(int contextSize) {
    this.contextSize = contextSize;
  }

  /**
   * Whether HTML special characters should be escaped.
   */
  public void setEscapeHtml(boolean escapeHtml) {
    this.escapeHtml = escapeHtml;
  }

  /**
   * Build the marker line for the plain text context: spaces up to the error (including
   * room for the prefix), one {@code ^} per error character, then spaces for the
   * remaining context.
   */
  private static String getMarker(int fromPos, int toPos, int startContent, int endContent, String prefix) {
    return StringUtils.repeat(' ', prefix.length() + fromPos - startContent) +
            StringUtils.repeat('^', toPos - fromPos) +
            StringUtils.repeat(' ', endContent - toPos);
  }

}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy