
org.bytedeco.javacpp.tools.Tokenizer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of javacpp Show documentation
Show all versions of javacpp Show documentation
The missing bridge between Java and native C++
/*
* Copyright (C) 2014-2017 Samuel Audet
*
* Licensed either under the Apache License, Version 2.0, or (at your option)
* under the terms of the GNU General Public License as published by
* the Free Software Foundation (subject to the "Classpath" exception),
* either version 2, or any later version (collectively, the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
* http://www.gnu.org/licenses/
* http://www.gnu.org/software/classpath/license.html
*
* or as provided in the LICENSE.txt file that accompanied this code.
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.bytedeco.javacpp.tools;
import java.io.BufferedReader;
import java.io.Closeable;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.Reader;
import java.io.StringReader;
import java.util.ArrayList;
/**
*
* @author Samuel Audet
*/
class Tokenizer implements Closeable {
Tokenizer(Reader reader, File file, int lineNumber) {
this.reader = reader;
this.file = file;
this.lineNumber = lineNumber;
}
Tokenizer(String text, File file, int lineNumber) {
this.text = text;
this.reader = new StringReader(text);
this.file = file;
this.lineNumber = lineNumber;
}
Tokenizer(File file) throws IOException {
this(file, null);
}
Tokenizer(File file, String encoding) throws IOException {
this.file = file;
FileInputStream fis = new FileInputStream(file);
this.reader = new BufferedReader(encoding != null ? new InputStreamReader(fis, encoding) : new InputStreamReader(fis));
}
public void filterLines(String[] patterns, boolean skip) throws IOException {
if (patterns == null) {
return;
}
StringBuilder lines = new StringBuilder();
BufferedReader lineReader = reader instanceof BufferedReader ?
(BufferedReader)reader : new BufferedReader(reader);
String line;
while ((line = lineReader.readLine()) != null) {
int i = 0;
while (i < patterns.length && !line.matches(patterns[i])) {
i += 2;
}
if (i < patterns.length) {
if (!skip) {
lines.append(line + "\n");
}
while (i + 1 < patterns.length && (line = lineReader.readLine()) != null) {
if (!skip) {
lines.append(line + "\n");
}
if (line.matches(patterns[i + 1])) {
break;
}
}
} else if (skip) {
lines.append(line + "\n");
}
}
reader.close();
reader = new StringReader(lines.toString());
}
File file = null;
String text = null;
Reader reader = null;
String lineSeparator = null;
int lastChar = -1, lineNumber = 1;
StringBuilder buffer = new StringBuilder();
@Override public void close() throws IOException {
reader.close();
}
int readChar() throws IOException {
if (lastChar != -1) {
int c = lastChar;
lastChar = -1;
return c;
}
int c = reader.read();
if (c == '\r' || c == '\n') {
if (text == null) {
// assume text is associated with a single line of file
lineNumber++;
}
int c2 = c == '\r' ? reader.read() : -1;
if (lineSeparator == null) {
lineSeparator = c == '\r' && c2 == '\n' ? "\r\n" :
c == '\r' ? "\r" : "\n";
}
if (c2 != '\n') {
lastChar = c2;
}
c = '\n';
}
return c;
}
public Token nextToken() throws IOException {
Token token = new Token();
int c = readChar();
buffer.setLength(0);
if (Character.isWhitespace(c)) {
buffer.append((char)c);
while ((c = readChar()) != -1 && Character.isWhitespace(c)) {
buffer.append((char)c);
}
}
token.file = file;
token.text = text;
token.lineNumber = lineNumber;
token.spacing = buffer.toString();
buffer.setLength(0);
if (Character.isLetter(c) || c == '_') {
token.type = Token.IDENTIFIER;
buffer.append((char)c);
while ((c = readChar()) != -1 && (Character.isDigit(c) || Character.isLetter(c) || c == '_')) {
buffer.append((char)c);
}
token.value = buffer.toString();
lastChar = c;
} else if (Character.isDigit(c) || c == '.' || c == '-' || c == '+') {
if (c == '.') {
int c2 = readChar();
if (c2 == '.') {
int c3 = readChar();
if (c3 == '.') {
token.type = Token.SYMBOL;
token.value = "...";
return token;
} else {
// but we lose c2... does it matter?
lastChar = c3;
}
} else {
lastChar = c2;
}
}
token.type = c == '.' ? Token.FLOAT : Token.INTEGER;
buffer.append((char)c);
int prevc = 0;
boolean exp = false, large = false, unsigned = false, hex = false;
while ((c = readChar()) != -1 && (Character.isDigit(c) || c == '.' || c == '-' || c == '+' ||
(c >= 'a' && c <= 'f') || c == 'i' || c == 'l' || c == 'u' || c == 'x' ||
(c >= 'A' && c <= 'F') || c == 'I' || c == 'L' || c == 'U' || c == 'X')) {
switch (c) {
case '.': token.type = Token.FLOAT; break;
case 'e': case 'E': exp = true; break;
case 'l': case 'L': large = true; break;
case 'u': case 'U': unsigned = true; break;
case 'x': case 'X': hex = true; break;
}
if (c != 'l' && c != 'L' && c != 'u' && c != 'U') {
buffer.append((char)c);
}
prevc = c;
}
if (!hex && (exp || prevc == 'f' || prevc == 'F')) {
token.type = Token.FLOAT;
}
if (token.type == Token.INTEGER && !large) {
try {
long high = Long.decode(buffer.toString()) >> 32;
large = high != 0 && high != -1;
} catch (NumberFormatException e) {
// set as large, for things like 0x8000000000000000L
if (buffer.length() >= 16) {
large = true;
}
}
}
if (buffer.toString().endsWith("i64")) {
buffer.setLength(buffer.length() - 3);
large = true;
}
if (token.type == Token.INTEGER && (large || (unsigned && !hex))) {
buffer.append('L');
}
token.value = buffer.toString();
lastChar = c;
} else if (c == '\'') {
token.type = Token.INTEGER;
buffer.append('\'');
while ((c = readChar()) != -1 && c != '\'') {
buffer.append((char)c);
if (c == '\\') {
c = readChar();
buffer.append((char)c);
}
}
buffer.append('\'');
token.value = buffer.toString();
} else if (c == '"') {
token.type = Token.STRING;
buffer.append('"');
while ((c = readChar()) != -1 && c != '"') {
buffer.append((char)c);
if (c == '\\') {
c = readChar();
buffer.append((char)c);
}
}
buffer.append('"');
token.value = buffer.toString();
} else if (c == '/') {
c = readChar();
if (c == '/') {
token.type = Token.COMMENT;
buffer.append('/').append('/');
int prevc = 0;
while ((c = readChar()) != -1 && (prevc == '\\' || c != '\n')) {
buffer.append((char)c);
prevc = c;
}
token.value = buffer.toString();
lastChar = c;
} else if (c == '*') {
token.type = Token.COMMENT;
buffer.append('/').append('*');
int prevc = 0;
while ((c = readChar()) != -1 && (prevc != '*' || c != '/')) {
buffer.append((char)c);
prevc = c;
}
buffer.append('/');
token.value = buffer.toString();
} else {
lastChar = c;
token.type = '/';
}
} else if (c == ':') {
int c2 = readChar();
if (c2 == ':') {
token.type = Token.SYMBOL;
token.value = "::";
} else {
token.type = c;
lastChar = c2;
}
} else if (c == '&') {
int c2 = readChar();
if (c2 == '&') {
token.type = Token.SYMBOL;
token.value = "&&";
} else {
token.type = c;
lastChar = c2;
}
} else if (c == '#') {
int c2 = readChar();
if (c2 == '#') {
token.type = Token.SYMBOL;
token.value = "##";
} else {
token.type = c;
lastChar = c2;
}
} else {
if (c == '\\') {
int c2 = readChar();
if (c2 == '\n') {
token.type = Token.COMMENT;
token.value = "\n";
return token;
} else {
lastChar = c2;
}
}
token.type = c;
}
return token;
}
Token[] tokenize() {
ArrayList tokens = new ArrayList();
try {
Token token;
while (!(token = nextToken()).isEmpty()) {
tokens.add(token);
}
} catch (IOException ex) {
throw new RuntimeException(ex);
}
return tokens.toArray(new Token[tokens.size()]);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy