
org.eclipse.rdf4j.rio.languages.RFC3066LanguageHandler Maven / Gradle / Ivy
Show all versions of rdf4j-rio-languages Show documentation
/*******************************************************************************
* Copyright (c) 2015 Eclipse RDF4J contributors, Aduna, and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Distribution License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/org/documents/edl-v10.php.
*******************************************************************************/
package org.eclipse.rdf4j.rio.languages;
import java.util.regex.Pattern;
import org.eclipse.rdf4j.model.Literal;
import org.eclipse.rdf4j.model.ValueFactory;
import org.eclipse.rdf4j.model.util.LiteralUtilException;
import org.eclipse.rdf4j.rio.LanguageHandler;
/**
* A language handler that can verify RFC3066 formatted language tags.
*
* This language handler normalises language tags to lower-case.
*
* @see RFC 3066
* @author Peter Ansell
*/
public class RFC3066LanguageHandler implements LanguageHandler {
/**
* Language tag is RFC3066-conformant if it matches this regex: [a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*
*/
protected final Pattern matcher = Pattern.compile("[a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*");
/**
* Default constructor.
*/
public RFC3066LanguageHandler() {
}
@Override
public boolean isRecognizedLanguage(String languageTag) {
if (languageTag == null) {
throw new NullPointerException("Language tag cannot be null");
}
// language tag is RFC3066-conformant if it matches this regex:
// [a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*
boolean result = matcher.matcher(languageTag).matches();
return result;
}
@Override
public boolean verifyLanguage(String literalValue, String languageTag)
throws LiteralUtilException
{
if (isRecognizedLanguage(languageTag)) {
if (literalValue == null) {
throw new NullPointerException("Literal value cannot be null");
}
return matcher.matcher(languageTag).matches();
}
throw new LiteralUtilException("Could not verify RFC3066 language tag");
}
@Override
public Literal normalizeLanguage(String literalValue, String languageTag, ValueFactory valueFactory)
throws LiteralUtilException
{
if (isRecognizedLanguage(languageTag)) {
if (literalValue == null) {
throw new NullPointerException("Literal value cannot be null");
}
// TODO Implement normalisation more effectively than this
return valueFactory.createLiteral(literalValue, languageTag.toLowerCase().intern());
}
throw new LiteralUtilException("Could not normalize RFC3066 language tag");
}
@Override
public String getKey() {
return LanguageHandler.RFC3066;
}
}