org.sonar.python.lexer.StringLiteralsChannel Maven / Gradle / Ivy
/*
* SonarQube Python Plugin
* Copyright (C) 2011-2018 SonarSource SA
* mailto:info AT sonarsource DOT com
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 3 of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program; if not, write to the Free Software Foundation,
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
*/
package org.sonar.python.lexer;
import com.sonar.sslr.api.Token;
import com.sonar.sslr.impl.Lexer;
import java.util.Arrays;
import java.util.Collections;
import java.util.HashSet;
import java.util.Set;
import org.sonar.python.api.PythonTokenType;
import org.sonar.sslr.channel.Channel;
import org.sonar.sslr.channel.CodeReader;
/**
* http://docs.python.org/reference/lexical_analysis.html#string-literals
*/
public class StringLiteralsChannel extends Channel {
private static final char EOF = (char) -1;
private static final Set PREFIX_CHARS = Collections.unmodifiableSet(new HashSet<>(Arrays.asList('R', 'F', 'U', 'B')));
private final StringBuilder sb = new StringBuilder();
private int index;
private char ch;
@Override
public boolean consume(CodeReader code, Lexer output) {
int line = code.getLinePosition();
int column = code.getColumnPosition();
index = 0;
readStringPrefix(code);
if ((ch != '\'') && (ch != '\"')) {
return false;
}
if (!read(code)) {
return false;
}
for (int i = 0; i < index; i++) {
sb.append((char) code.pop());
}
output.addToken(Token.builder()
.setLine(line)
.setColumn(column)
.setURI(output.getURI())
.setValueAndOriginalValue(sb.toString())
.setType(PythonTokenType.STRING)
.build());
sb.setLength(0);
return true;
}
private boolean read(CodeReader code) {
if (isLookingOnLongString(code, ch, index)) {
return readLongString(code);
} else {
return readString(code);
}
}
private boolean readString(CodeReader code) {
index++;
while (code.charAt(index) != ch) {
if (code.charAt(index) == EOF) {
return false;
}
if (code.charAt(index) == '\\') {
// escape
index++;
}
index++;
}
index++;
return true;
}
private boolean readLongString(CodeReader code) {
index += 3;
while (!isLookingOnLongString(code, ch, index)) {
if (code.charAt(index) == EOF) {
return false;
}
if (code.charAt(index) == '\\') {
// escape
index++;
}
index++;
}
index += 3;
return true;
}
private void readStringPrefix(CodeReader code) {
ch = Character.toUpperCase(code.charAt(index));
if (PREFIX_CHARS.contains(ch)) {
index++;
ch = Character.toUpperCase(code.charAt(index));
}
if (PREFIX_CHARS.contains(ch)) {
index++;
ch = code.charAt(index);
}
}
private static boolean isLookingOnLongString(CodeReader code, char ch, int index) {
return (code.charAt(index) == ch) && (code.charAt(index + 1) == ch) && (code.charAt(index + 2) == ch);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy