All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.lucene.search.spell.PlainTextDictionary Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.search.spell;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.Reader;
import java.nio.charset.StandardCharsets;
import java.nio.file.Files;
import java.nio.file.Path;
import org.apache.lucene.search.suggest.InputIterator;
import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.BytesRefBuilder;
import org.apache.lucene.util.BytesRefIterator;
import org.apache.lucene.util.IOUtils;

/**
 * Dictionary represented by a text file.
 *
 * 

Format allowed: 1 word per line:
* word1
* word2
* word3
*/ public class PlainTextDictionary implements Dictionary { private BufferedReader in; /** * Creates a dictionary based on a Path. * *

NOTE: content is treated as UTF-8 */ public PlainTextDictionary(Path path) throws IOException { in = Files.newBufferedReader(path, StandardCharsets.UTF_8); } /** * Creates a dictionary based on an inputstream. * *

NOTE: content is treated as UTF-8 */ public PlainTextDictionary(InputStream dictFile) { in = new BufferedReader(IOUtils.getDecodingReader(dictFile, StandardCharsets.UTF_8)); } /** Creates a dictionary based on a reader. */ public PlainTextDictionary(Reader reader) { in = new BufferedReader(reader); } @Override public InputIterator getEntryIterator() throws IOException { return new InputIterator.InputIteratorWrapper(new FileIterator()); } final class FileIterator implements BytesRefIterator { private boolean done = false; private final BytesRefBuilder spare = new BytesRefBuilder(); @Override public BytesRef next() throws IOException { if (done) { return null; } boolean success = false; BytesRef result; try { String line; if ((line = in.readLine()) != null) { spare.copyChars(line); result = spare.get(); } else { done = true; IOUtils.close(in); result = null; } success = true; } finally { if (!success) { IOUtils.closeWhileHandlingException(in); } } return result; } } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy