// Source listing of com.uber.hoodie.common.util.collection.LazyFileIterable
// (Maven / Gradle / Ivy artifact page, newest version).
/*
* Copyright (c) 2016 Uber Technologies, Inc. ([email protected])
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.uber.hoodie.common.util.collection;
import com.uber.hoodie.exception.HoodieException;
import java.io.IOException;
import java.io.RandomAccessFile;
import java.util.Iterator;
import java.util.Map;
import java.util.function.Consumer;
import java.util.stream.Collectors;
/**
* Iterable to lazily fetch values spilled to disk. This class uses RandomAccessFile to randomly access the position of
* the latest value for a key spilled to disk and returns the result.
*/
public class LazyFileIterable implements Iterable {
// Used to access the value written at a specific position in the file
private final String filePath;
// Stores the key and corresponding value's latest metadata spilled to disk
private final Map inMemoryMetadataOfSpilledData;
public LazyFileIterable(String filePath, Map map) {
this.filePath = filePath;
this.inMemoryMetadataOfSpilledData = map;
}
@Override
public Iterator iterator() {
try {
return new LazyFileIterator<>(filePath, inMemoryMetadataOfSpilledData);
} catch (IOException io) {
throw new HoodieException("Unable to initialize iterator for file on disk", io);
}
}
/**
* Iterator implementation for the iterable defined above.
*/
public class LazyFileIterator implements Iterator {
private final String filePath;
private RandomAccessFile readOnlyFileHandle;
private final Iterator> metadataIterator;
public LazyFileIterator(String filePath, Map map) throws IOException {
this.filePath = filePath;
this.readOnlyFileHandle = new RandomAccessFile(filePath, "r");
readOnlyFileHandle.seek(0);
// sort the map in increasing order of offset of value so disk seek is only in one(forward) direction
this.metadataIterator = map
.entrySet()
.stream()
.sorted(
(Map.Entry o1, Map.Entry o2) ->
o1.getValue().getOffsetOfValue().compareTo(o2.getValue().getOffsetOfValue()))
.collect(Collectors.toList()).iterator();
this.addShutdownHook();
}
@Override
public boolean hasNext() {
boolean available = this.metadataIterator.hasNext();
if (!available) {
close();
}
return available;
}
@Override
public R next() {
if (!hasNext()) {
throw new IllegalStateException("next() called on EOF'ed stream. File :" + filePath);
}
Map.Entry entry = this.metadataIterator.next();
return DiskBasedMap.get(entry.getValue(), readOnlyFileHandle);
}
@Override
public void remove() {
this.metadataIterator.remove();
}
@Override
public void forEachRemaining(Consumer super R> action) {
action.accept(next());
}
private void close() {
if (readOnlyFileHandle != null) {
try {
readOnlyFileHandle.close();
readOnlyFileHandle = null;
} catch (IOException e) {
throw new RuntimeException(e);
}
}
}
private void addShutdownHook() {
Runtime.getRuntime().addShutdownHook(new Thread() {
public void run() {
close();
}
});
}
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy