All Downloads are FREE. Search and download functionalities are using the official Maven repository.

src.it.unimi.dsi.io.LineWordReader Maven / Gradle / Ivy

package it.unimi.dsi.io;

/*
 * DSI utilities
 *
 * Copyright (C) 2006-2017 Sebastiano Vigna
 *
 *  This library is free software; you can redistribute it and/or modify it
 *  under the terms of the GNU Lesser General Public License as published by the Free
 *  Software Foundation; either version 3 of the License, or (at your option)
 *  any later version.
 *
 *  This library is distributed in the hope that it will be useful, but
 *  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 *  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License
 *  for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public License
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
 *
 */

import it.unimi.dsi.lang.MutableString;

import java.io.IOException;
import java.io.Reader;
import java.io.Serializable;

/** A trivial {@link it.unimi.dsi.io.WordReader} that considers each line
 * of a document a single word.
 *
 * <p>The intended usage of this class is that of indexing stuff like lists of document
 * identifiers: if the identifiers contain nonalphabetical characters, the default
 * {@link it.unimi.dsi.io.FastBufferedReader} might do a poor job.
 *
 * <p>Note that the non-word returned by {@link #next(MutableString, MutableString)} is
 * always empty.
 */
public class LineWordReader implements WordReader, Serializable {
	private static final long serialVersionUID = 1L;

	/** A fast buffered reader wrapping the underlying reader. */
	private final FastBufferedReader fastBufferedReader = new FastBufferedReader();

	/** Reads the next line into {@code word} and empties {@code nonWord}.
	 *
	 * @param word the mutable string that will receive the next line.
	 * @param nonWord the mutable string whose length is reset to zero on every call.
	 * @return true if the wrapped reader returned a non-{@code null} result for the line
	 * (presumably {@code null} signals the end of the input; confirm against
	 * {@link FastBufferedReader#readLine(MutableString)}).
	 * @throws IOException if the wrapped reader throws it while reading.
	 */
	@Override
	public boolean next(final MutableString word, final MutableString nonWord) throws IOException {
		// The non-word is emptied before reading, so it is empty whatever the outcome of the read.
		nonWord.length(0);
		return fastBufferedReader.readLine(word) != null;
	}

	/** Sets the reader from which subsequent lines will be read.
	 *
	 * @param reader the new underlying reader, passed on to the wrapped {@link FastBufferedReader}.
	 * @return this line word reader.
	 */
	@Override
	public LineWordReader setReader(final Reader reader) {
		fastBufferedReader.setReader(reader);
		return this;
	}

	/** Returns a new line word reader.
	 *
	 * <p>The copy is created with its own wrapped {@link FastBufferedReader}; the reader
	 * set on this instance is not passed to the copy.
	 *
	 * @return a new {@link LineWordReader}.
	 */
	@Override
	public LineWordReader copy() {
		return new LineWordReader();
	}
}





© 2015 - 2024 Weber Informatics LLC | Privacy Policy