// io.druid.segment.data.IntermediateLongSupplierSerializer
/*
* Licensed to Metamarkets Group Inc. (Metamarkets) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. Metamarkets licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package io.druid.segment.data;
import com.google.common.io.ByteSink;
import com.google.common.io.CountingOutputStream;
import com.google.common.math.LongMath;
import com.google.common.primitives.Longs;
import io.druid.common.utils.SerializerUtils;
import io.druid.java.util.common.io.smoosh.FileSmoosher;
import it.unimi.dsi.fastutil.longs.Long2IntMap;
import it.unimi.dsi.fastutil.longs.Long2IntOpenHashMap;
import it.unimi.dsi.fastutil.longs.LongArrayList;
import it.unimi.dsi.fastutil.longs.LongList;
import java.io.BufferedInputStream;
import java.io.DataInputStream;
import java.io.IOException;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
import java.nio.channels.WritableByteChannel;
/**
* Unsafe for concurrent use from multiple threads.
*/
public class IntermediateLongSupplierSerializer implements LongSupplierSerializer
{
private final IOPeon ioPeon;
private final String filenameBase;
private final String tempFile;
private final ByteOrder order;
private final CompressedObjectStrategy.CompressionStrategy compression;
private CountingOutputStream tempOut = null;
private final ByteBuffer helperBuffer = ByteBuffer.allocate(Longs.BYTES);
private int numInserted = 0;
private final Long2IntMap uniqueValues = new Long2IntOpenHashMap();
private final LongList valuesAddedInOrder = new LongArrayList();
private long maxVal = Long.MIN_VALUE;
private long minVal = Long.MAX_VALUE;
private LongSupplierSerializer delegate;
public IntermediateLongSupplierSerializer(
IOPeon ioPeon,
String filenameBase,
ByteOrder order,
CompressedObjectStrategy.CompressionStrategy compression
)
{
this.ioPeon = ioPeon;
this.tempFile = filenameBase + ".temp";
this.filenameBase = filenameBase;
this.order = order;
this.compression = compression;
}
@Override
public void open() throws IOException
{
tempOut = new CountingOutputStream(ioPeon.makeOutputStream(tempFile));
}
@Override
public int size()
{
return numInserted;
}
@Override
public void add(long value) throws IOException
{
SerializerUtils.writeBigEndianLongToOutputStream(tempOut, value, helperBuffer);
++numInserted;
if (uniqueValues.size() <= CompressionFactory.MAX_TABLE_SIZE && !uniqueValues.containsKey(value)) {
uniqueValues.put(value, uniqueValues.size());
valuesAddedInOrder.add(value);
}
if (value > maxVal) {
maxVal = value;
}
if (value < minVal) {
minVal = value;
}
}
private void makeDelegate() throws IOException
{
CompressionFactory.LongEncodingWriter writer;
long delta;
try {
delta = LongMath.checkedSubtract(maxVal, minVal);
}
catch (ArithmeticException e) {
delta = -1;
}
if (uniqueValues.size() <= CompressionFactory.MAX_TABLE_SIZE) {
writer = new TableLongEncodingWriter(uniqueValues, valuesAddedInOrder);
} else if (delta != -1 && delta != Long.MAX_VALUE) {
writer = new DeltaLongEncodingWriter(minVal, delta);
} else {
writer = new LongsLongEncodingWriter(order);
}
if (compression == CompressedObjectStrategy.CompressionStrategy.NONE) {
delegate = new EntireLayoutLongSupplierSerializer(
ioPeon, filenameBase, order, writer
);
} else {
delegate = new BlockLayoutLongSupplierSerializer(
ioPeon, filenameBase, order, writer, compression
);
}
try (DataInputStream tempIn = new DataInputStream(new BufferedInputStream(ioPeon.makeInputStream(tempFile)))) {
delegate.open();
int available = numInserted;
while (available > 0) {
delegate.add(tempIn.readLong());
available--;
}
}
}
@Override
public void closeAndConsolidate(ByteSink consolidatedOut) throws IOException
{
tempOut.close();
makeDelegate();
delegate.closeAndConsolidate(consolidatedOut);
}
@Override
public void close() throws IOException
{
tempOut.close();
makeDelegate();
delegate.close();
}
@Override
public long getSerializedSize()
{
return delegate.getSerializedSize();
}
@Override
public void writeToChannel(WritableByteChannel channel, FileSmoosher smoosher) throws IOException
{
delegate.writeToChannel(channel, smoosher);
}
}