All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.commons.csv.ExtendedBufferedReader Maven / Gradle / Ivy

Go to download

The Apache Commons CSV library provides a simple interface for reading and writing CSV files of various types.

There is a newer version: 1.12.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.commons.csv;

import static org.apache.commons.csv.Constants.CR;
import static org.apache.commons.csv.Constants.END_OF_STREAM;
import static org.apache.commons.csv.Constants.LF;
import static org.apache.commons.csv.Constants.UNDEFINED;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.Reader;

/**
 * A special buffered reader which supports sophisticated read access.
 * 

* In particular the reader supports a look-ahead option, which allows you to see the next char returned by * {@link #read()}. This reader also tracks how many characters have been read with {@link #getPosition()}. *

*/ final class ExtendedBufferedReader extends BufferedReader { /** The last char returned */ private int lastChar = UNDEFINED; /** The count of EOLs (CR/LF/CRLF) seen so far */ private long eolCounter; /** The position, which is number of characters read so far */ private long position; private boolean closed; /** * Created extended buffered reader using default buffer-size */ ExtendedBufferedReader(final Reader reader) { super(reader); } @Override public int read() throws IOException { final int current = super.read(); if (current == CR || current == LF && lastChar != CR) { eolCounter++; } lastChar = current; this.position++; return lastChar; } /** * Returns the last character that was read as an integer (0 to 65535). This will be the last character returned by * any of the read methods. This will not include a character read using the {@link #lookAhead()} method. If no * character has been read then this will return {@link Constants#UNDEFINED}. If the end of the stream was reached * on the last read then this will return {@link Constants#END_OF_STREAM}. * * @return the last character that was read */ int getLastChar() { return lastChar; } @Override public int read(final char[] buf, final int offset, final int length) throws IOException { if (length == 0) { return 0; } final int len = super.read(buf, offset, length); if (len > 0) { for (int i = offset; i < offset + len; i++) { final char ch = buf[i]; if (ch == LF) { if (CR != (i > 0 ? buf[i - 1] : lastChar)) { eolCounter++; } } else if (ch == CR) { eolCounter++; } } lastChar = buf[offset + len - 1]; } else if (len == -1) { lastChar = END_OF_STREAM; } position += len; return len; } /** * Calls {@link BufferedReader#readLine()} which drops the line terminator(s). This method should only be called * when processing a comment, otherwise information can be lost. *

* Increments {@link #eolCounter} *

* Sets {@link #lastChar} to {@link Constants#END_OF_STREAM} at EOF, otherwise to LF * * @return the line that was read, or null if reached EOF. */ @Override public String readLine() throws IOException { final String line = super.readLine(); if (line != null) { lastChar = LF; // needed for detecting start of line eolCounter++; } else { lastChar = END_OF_STREAM; } return line; } /** * Returns the next character in the current reader without consuming it. So the next call to {@link #read()} will * still return this value. Does not affect line number or last character. * * @return the next character * * @throws IOException * if there is an error in reading */ int lookAhead() throws IOException { super.mark(1); final int c = super.read(); super.reset(); return c; } /** * Returns the current line number * * @return the current line number */ long getCurrentLineNumber() { // Check if we are at EOL or EOF or just starting if (lastChar == CR || lastChar == LF || lastChar == UNDEFINED || lastChar == END_OF_STREAM) { return eolCounter; // counter is accurate } return eolCounter + 1; // Allow for counter being incremented only at EOL } /** * Gets the character position in the reader. * * @return the current position in the reader (counting characters, not bytes since this is a Reader) */ long getPosition() { return this.position; } public boolean isClosed() { return closed; } /** * Closes the stream. * * @throws IOException * If an I/O error occurs */ @Override public void close() throws IOException { // Set ivars before calling super close() in case close() throws an IOException. closed = true; lastChar = END_OF_STREAM; super.close(); } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy