org.liblouis.Translator Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of liblouis-java Show documentation
Show all versions of liblouis-java Show documentation
JNA based Java bindings to liblouis, an open-source braille translator and back-translator.
package org.liblouis;
import java.util.Arrays;
import java.util.HashMap;
import java.util.Map;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.liblouis.Louis.LouisLibrary;
import com.sun.jna.Pointer;
import com.sun.jna.ptr.IntByReference;
/**
 * A braille translator bound to a single liblouis translation table (or table list).
 *
 * <p>All operations are delegated to the native library obtained from
 * {@link Louis#getLibrary()}. The scratch buffers that are handed to the native code are
 * cached in static maps and shared by every instance of this class; this class performs no
 * synchronization of its own, so callers that use it from several threads must serialize
 * the calls themselves.</p>
 */
public class Translator {

    /** Inter-character attribute value that marks a soft hyphen. */
    public static final byte SHY = 1;

    /** Inter-character attribute value that marks a zero-width space. */
    public static final byte ZWSP = 2;

    /*
     * Number by which the input length should be multiplied to calculate
     * the maximum output length. This default will handle the case where
     * every input character is undefined in the translation table.
     */
    private static final int OUTLEN_MULTIPLIER = WideChar.Constants.CHARSIZE * 2 + 4;

    /* A run of letters; lou_hyphenate is called once per such run. */
    private static final Pattern WORD = Pattern.compile("\\p{L}+");

    /* A hard hyphen that sits between two letters/digits. */
    private static final Pattern HARD_HYPHEN = Pattern.compile("[\\p{L}\\p{N}]-(?=[\\p{L}\\p{N}])");

    /* Reusable scratch buffers, keyed by a caller-chosen id and grown on demand. */
    private static final Map<String,WideString> WIDECHAR_BUFFERS = new HashMap<String,WideString>();
    private static final Map<String,byte[]> BYTE_BUFFERS = new HashMap<String,byte[]>();
    private static final Map<String,int[]> INT_BUFFERS = new HashMap<String,int[]>();

    private final String table;

    /**
     * @param table The translation table or table list to compile.
     * @throws CompilationException if the table could not be found or if it
     * could not be compiled.
     */
    public Translator(String table) throws CompilationException {
        if (Louis.getLibrary().lou_getTable(table) == Pointer.NULL) {
            throw new CompilationException("Unable to compile table '" + table + "'");
        }
        this.table = table;
    }

    /**
     * @param query A table query
     * @return A translator for the table that was matched by the query.
     * @throws CompilationException if no match could be found or if the
     * matched table could not be compiled.
     */
    public static Translator find(String query) throws CompilationException {
        String table = Louis.getLibrary().lou_findTable(query);
        if (table == null) {
            throw new CompilationException("No match found for query '" + query + "'");
        }
        return new Translator(table);
    }

    /**
     * @return The table (or table list) this translator was created with.
     */
    public String getTable() {
        return table;
    }

    /**
     * @param text The text to translate.
     * @param typeform Array with typeform information about the text. Must have the same length as
     *                 {@code text}. May be null.
     * @param characterAttributes Array with other information about the text that will be passed on
     *                            to the output. May for example be used for numbering all
     *                            characters in the input text in order to obtain a full mapping
     *                            between input and output. Array must have the same length as
     *                            {@code text}. May be null.
     * @param interCharacterAttributes Array with information about the positions between characters
     *                                 that will be passed on to the output. May for example be used
     *                                 to track hyphenation points (e.g. `0` for no hyphenation
     *                                 point opportunity, `1` for soft hyphen and `2` for zero-width
     *                                 space). Length must be equal to the {@code text} length
     *                                 minus 1. May be null.
     * @return A TranslationResult containing the braille translation, the output character
     *         attributes (or {@code null} if {@code characterAttributes} was
     *         {@code null}), and the output inter-character attributes (or {@code null}
     *         if {@code interCharacterAttributes} was {@code null}).
     * @throws IllegalArgumentException if one of the arrays does not have the required length.
     * @throws TranslationException if the translation could not be completed.
     */
    public TranslationResult translate(String text,
                                       byte[] typeform,
                                       int[] characterAttributes,
                                       int[] interCharacterAttributes)
            throws TranslationException {
        final int length = text.length();
        if (typeform != null && typeform.length != length) {
            throw new IllegalArgumentException("typeform length must be equal to text length");
        }
        if (characterAttributes != null && characterAttributes.length != length) {
            throw new IllegalArgumentException("characterAttributes length must be equal to text length");
        }
        if (interCharacterAttributes != null && interCharacterAttributes.length != length - 1) {
            throw new IllegalArgumentException("interCharacterAttributes length must be equal to text length minus 1");
        }
        WideString inbuf = getWideCharBuffer("text-in", length).write(text);
        WideString outbuf = getWideCharBuffer("text-out", length * OUTLEN_MULTIPLIER);
        IntByReference inlen = new IntByReference(length);
        IntByReference outlen = new IntByReference(outbuf.length());
        int[] inputPos = null;
        if (typeform != null) {
            // Hand a copy that is as long as the output buffer to the native call, so the
            // caller's array is never touched. NOTE(review): presumably liblouis may write
            // up to outlen typeform entries - confirm against the liblouis documentation.
            typeform = Arrays.copyOf(typeform, outbuf.length());
        }
        if (characterAttributes != null || interCharacterAttributes != null) {
            // The input positions are only requested when attributes have to be mapped
            // onto the output.
            inputPos = getIntegerBuffer("inputpos", length * OUTLEN_MULTIPLIER);
        }
        if (Louis.getLibrary().lou_translate(table, inbuf, inlen, outbuf, outlen, typeform,
                                             null, null, inputPos, null, 0) == 0) {
            throw new TranslationException("Unable to complete translation");
        }
        return new TranslationResult(outbuf, outlen, inputPos, characterAttributes, interCharacterAttributes);
    }

    /**
     * @param text The braille to translate back to text.
     * @return The result of {@code lou_backTranslate} for the given input.
     * @throws TranslationException if the back-translation could not be completed.
     */
    public String backTranslate(String text) throws TranslationException {
        final int length = text.length();
        WideString inbuf = getWideCharBuffer("text-in", length).write(text);
        WideString outbuf = getWideCharBuffer("text-out", length * OUTLEN_MULTIPLIER);
        IntByReference inlen = new IntByReference(length);
        IntByReference outlen = new IntByReference(outbuf.length());
        if (Louis.getLibrary().lou_backTranslate(table, inbuf, inlen, outbuf, outlen,
                                                 null, null, null, null, null, 0) == 0) {
            throw new TranslationException("Unable to complete translation");
        }
        return outbuf.read(outlen.getValue());
    }

    /**
     * @param text The text to hyphenate. Can be multiple words.
     * @return The hyphenation points. Possible values are `0` for no hyphenation point, `1` for a
     *         hyphenation point (soft hyphen), or `2` for a zero-width space (which are inserted
     *         after hard hyphens). Length is equal to the {@code text} length minus 1, or 0
     *         if {@code text} is empty.
     * @throws TranslationException if the hyphenation could not be completed.
     */
    public byte[] hyphenate(String text) throws TranslationException {
        final int inlen = text.length();
        if (inlen == 0) {
            // There are no positions between characters; without this guard the result
            // array would be allocated with a negative size.
            return new byte[0];
        }
        WideString inbuf = getWideCharBuffer("text-in", inlen).write(text);
        byte[] hyphens = getByteBuffer("hyphens-out", inlen);
        // The buffer is reused between calls, so reset the part that is read below.
        Arrays.fill(hyphens, 0, inlen, (byte)'0');
        byte[] wordHyphens = getByteBuffer("hyphens-word", inlen);
        LouisLibrary louis = Louis.getLibrary();
        // lou_hyphenate handles single words only
        Matcher matcher = WORD.matcher(text);
        while (matcher.find()) {
            int start = matcher.start();
            int wordLength = matcher.end() - start;
            if (louis.lou_hyphenate(table, inbuf.substring(start), wordLength, wordHyphens, 0) == 0) {
                throw new TranslationException("Unable to complete hyphenation");
            }
            System.arraycopy(wordHyphens, 0, hyphens, start, wordLength);
        }
        byte[] hyphenPositions = readHyphens(new byte[inlen - 1], hyphens);
        // add a zero-width space after hard hyphens
        matcher = HARD_HYPHEN.matcher(text);
        while (matcher.find()) {
            // matcher.start() is the character before the hyphen, so start + 1 is the
            // position between the hyphen and the character that follows it.
            hyphenPositions[matcher.start() + 1] = ZWSP;
        }
        return hyphenPositions;
    }

    /**
     * @param braille The braille (dot patterns) to convert with {@code lou_dotsToChar}.
     * @return The converted string. It has the same length as {@code braille}.
     * @throws TranslationException if the conversion could not be completed.
     */
    public String display(String braille) throws TranslationException {
        final int length = braille.length();
        WideString inbuf = getWideCharBuffer("text-in", length).write(braille);
        WideString outbuf = getWideCharBuffer("text-out", length * OUTLEN_MULTIPLIER);
        if (Louis.getLibrary().lou_dotsToChar(table, inbuf, outbuf, length, 0) == 0) {
            throw new TranslationException("Unable to complete translation");
        }
        return outbuf.read(length);
    }

    /*
     * Return the cached wide character buffer with the given id. When there is none yet,
     * or when it is shorter than minCapacity, a new buffer of twice the requested
     * capacity replaces it.
     */
    private static WideString getWideCharBuffer(String id, int minCapacity) {
        WideString buffer = WIDECHAR_BUFFERS.get(id);
        if (buffer == null || buffer.length() < minCapacity) {
            buffer = new WideString(minCapacity * 2);
            WIDECHAR_BUFFERS.put(id, buffer);
        }
        return buffer;
    }

    /*
     * Return the cached byte buffer with the given id. When there is none yet, or when it
     * is shorter than minCapacity, a new buffer of twice the requested capacity replaces it.
     */
    private static byte[] getByteBuffer(String id, int minCapacity) {
        byte[] buffer = BYTE_BUFFERS.get(id);
        if (buffer == null || buffer.length < minCapacity) {
            buffer = new byte[minCapacity * 2];
            BYTE_BUFFERS.put(id, buffer);
        }
        return buffer;
    }

    /*
     * Return the cached int buffer with the given id. When there is none yet, or when it
     * is shorter than minCapacity, a new buffer of twice the requested capacity replaces it.
     */
    private static int[] getIntegerBuffer(String id, int minCapacity) {
        int[] buffer = INT_BUFFERS.get(id);
        if (buffer == null || buffer.length < minCapacity) {
            buffer = new int[minCapacity * 2];
            INT_BUFFERS.put(id, buffer);
        }
        return buffer;
    }

    /*
     * Convert a hyphen array from the form [0,1,0] to the form ['0','0','1','0']
     */
    @SuppressWarnings("unused")
    private static byte[] writeHyphens(byte[] hyphenPositions, byte[] buffer) {
        buffer[0] = '0';
        for (int i = 0; i < hyphenPositions.length; i++) {
            buffer[i + 1] = (byte)(hyphenPositions[i] + 48);
        }
        return buffer;
    }

    /*
     * Convert a hyphen array from the form ['0','0','1','0'] to the form [0,1,0]
     */
    private static byte[] readHyphens(byte[] hyphenPositions, byte[] buffer) {
        for (int i = 0; i < hyphenPositions.length; i++) {
            hyphenPositions[i] = (byte)(buffer[i + 1] - 48);
        }
        return hyphenPositions;
    }

    @Override
    public String toString() {
        return getClass().getSimpleName() + "{table=" + table + "}";
    }

    @Override
    public int hashCode() {
        final int prime = 31;
        int hash = 1;
        hash = prime * hash + table.hashCode();
        return hash;
    }

    /**
     * Two translators are equal when both are exactly of class {@code Translator} and
     * were created with equal table strings.
     */
    @Override
    public boolean equals(Object object) {
        if (this == object) {
            return true;
        }
        if (object == null) {
            return false;
        }
        if (object.getClass() != Translator.class) {
            return false;
        }
        Translator that = (Translator)object;
        return this.table.equals(that.table);
    }
}