![JAR search and dependency download from the Maven repository](/logo.png)
org.neo4j.importer.CharacterConverter Maven / Gradle / Ivy
/*
* Copyright (c) "Neo4j"
* Neo4j Sweden AB [https://neo4j.com]
*
* This file is part of Neo4j.
*
* Neo4j is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package org.neo4j.importer;
import java.util.Locale;
import java.util.function.Function;
import org.neo4j.csv.reader.Configuration;
import org.neo4j.util.Preconditions;
/**
 * Converts a string expression into a character to be used as delimiter, array delimiter, or quote character.
 *
 * <p>Accepted forms, checked in this order:
 * <ul>
 *   <li>a backslash followed by {@code u}, or {@code U+}, followed by exactly four hexadecimal digits
 *       (prefix is case-insensitive), e.g. {@code U+20AC};</li>
 *   <li>a backslash followed by {@code t}, which yields the delimiter of {@link Configuration#TABS};</li>
 *   <li>a backslash followed by a decimal character code, e.g. a backslash followed by {@code 123};</li>
 *   <li>the literal string {@code TAB}, which also yields the delimiter of {@link Configuration#TABS};</li>
 *   <li>any single character, which is returned as-is.</li>
 * </ul>
 */
public class CharacterConverter implements Function<String, Character> {

    /**
     * Parses {@code value} into the character it denotes.
     *
     * @param value the textual character specification; must not be {@code null}
     * @return the character described by {@code value}
     * @throws IllegalArgumentException if {@code value} matches none of the supported forms, or if the numeric
     *         code it specifies does not fit into a single {@code char}. A non-hexadecimal unicode code surfaces
     *         as {@link NumberFormatException}, which is a subclass of {@code IllegalArgumentException}.
     * @throws NullPointerException if {@code value} is {@code null}
     */
    @Override
    public Character apply(String value) {
        // Lower-casing is only used for the case-insensitive prefix check; the code itself is cut from the
        // original value.
        String lowerCaseValue = value.toLowerCase(Locale.ROOT);
        if (lowerCaseValue.startsWith("\\u") || lowerCaseValue.startsWith("u+")) {
            String code = value.substring(2);
            // NOTE(review): checkState presumably throws IllegalStateException on failure - kept as-is so that
            // callers relying on that exception type are unaffected.
            Preconditions.checkState(
                    code.length() == 4, "Unicode characters should be specified with 4 HEX characters, e.g. 'U+20AC'");
            return toChar(Integer.parseInt(code, 16), value);
        }

        if (value.startsWith("\\") && value.length() > 1) {
            String raw = value.substring(1);
            if (raw.equals("t")) {
                return Configuration.TABS.delimiter();
            }
            int code;
            try {
                code = Integer.parseInt(raw);
            } catch (NumberFormatException e) {
                // Same message as for every other unsupported input, but keep the cause for diagnostics.
                throw new IllegalArgumentException("Unsupported character '" + value + "'", e);
            }
            return toChar(code, value);
        }

        // hard coded TAB --> tab character
        if (value.equals("TAB")) {
            return Configuration.TABS.delimiter();
        }
        // A lone backslash also ends up here and is returned as a normal character.
        if (value.length() == 1) {
            return value.charAt(0);
        }
        throw new IllegalArgumentException("Unsupported character '" + value + "'");
    }

    /**
     * Narrows a parsed character code to {@code char}, rejecting codes that a plain cast would silently truncate.
     *
     * @param code the parsed numeric character code
     * @param value the original user input, used only for the error message
     * @return {@code code} as a {@code char}
     * @throws IllegalArgumentException if {@code code} is outside the range of {@code char}
     */
    private static char toChar(int code, String value) {
        if (code < Character.MIN_VALUE || code > Character.MAX_VALUE) {
            throw new IllegalArgumentException(
                    "Unsupported character '" + value + "': code " + code + " is outside the valid character range");
        }
        return (char) code;
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy