All downloads are free. Search and download functionality uses the official Maven repository.

io.activej.multilog.Multilog Maven / Gradle / Ivy

The newest version!
/*
 * Copyright (C) 2020 ActiveJ LLC.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package io.activej.multilog;

import io.activej.bytebuf.ByteBuf;
import io.activej.common.MemSize;
import io.activej.common.builder.AbstractBuilder;
import io.activej.common.exception.MalformedDataException;
import io.activej.common.exception.TruncatedDataException;
import io.activej.common.ref.RefBoolean;
import io.activej.common.time.Stopwatch;
import io.activej.csp.process.frame.ChannelFrameDecoder;
import io.activej.csp.process.frame.ChannelFrameEncoder;
import io.activej.csp.process.frame.FrameFormat;
import io.activej.csp.supplier.ChannelSuppliers;
import io.activej.datastream.consumer.StreamConsumer;
import io.activej.datastream.consumer.StreamConsumers;
import io.activej.datastream.csp.ChannelDeserializer;
import io.activej.datastream.csp.ChannelSerializer;
import io.activej.datastream.stats.DetailedStreamStats;
import io.activej.datastream.stats.StreamRegistry;
import io.activej.datastream.stats.StreamStats;
import io.activej.datastream.supplier.StreamSupplier;
import io.activej.datastream.supplier.StreamSupplierWithResult;
import io.activej.datastream.supplier.StreamSuppliers;
import io.activej.fs.IFileSystem;
import io.activej.fs.exception.IllegalOffsetException;
import io.activej.jmx.api.attribute.JmxAttribute;
import io.activej.promise.Promise;
import io.activej.promise.SettablePromise;
import io.activej.reactor.AbstractReactive;
import io.activej.reactor.Reactor;
import io.activej.reactor.jmx.ReactiveJmxBeanWithStats;
import io.activej.serializer.BinarySerializer;
import org.jetbrains.annotations.Nullable;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.time.Duration;
import java.util.Iterator;
import java.util.List;
import java.util.Objects;

import static io.activej.common.Checks.checkArgument;
import static io.activej.common.function.FunctionEx.identity;
import static io.activej.datastream.stats.StreamStatsSizeCounter.forByteBufs;
import static io.activej.reactor.Reactive.checkInReactorThread;
import static java.util.concurrent.TimeUnit.SECONDS;
import static java.util.stream.Collectors.toList;

public final class Multilog extends AbstractReactive
	implements IMultilog, ReactiveJmxBeanWithStats {
	private static final Logger logger = LoggerFactory.getLogger(Multilog.class);

	public static final MemSize DEFAULT_BUFFER_SIZE = MemSize.kilobytes(256);

	private final IFileSystem fileSystem;
	private final LogNamingScheme namingScheme;
	private final BinarySerializer serializer;

	private MemSize bufferSize = DEFAULT_BUFFER_SIZE;
	private Duration autoFlushInterval = null;
	private boolean ignoreMalformedLogs;
	private final FrameFormat frameFormat;

	private final StreamRegistry streamReads = StreamRegistry.create();
	private final StreamRegistry streamWrites = StreamRegistry.create();

	private final DetailedStreamStats streamReadStats = StreamStats.detailedBuilder()
		.withSizeCounter(forByteBufs())
		.build();
	private final DetailedStreamStats streamWriteStats = StreamStats.detailedBuilder()
		.withSizeCounter(forByteBufs())
		.build();

	private Multilog(
		Reactor reactor, IFileSystem fileSystem, FrameFormat frameFormat, BinarySerializer serializer,
		LogNamingScheme namingScheme
	) {
		super(reactor);
		this.fileSystem = fileSystem;
		this.frameFormat = frameFormat;
		this.serializer = serializer;
		this.namingScheme = namingScheme;
	}

	public static  Multilog create(
		Reactor reactor, IFileSystem fileSystem, FrameFormat frameFormat, BinarySerializer serializer,
		LogNamingScheme namingScheme
	) {
		return builder(reactor, fileSystem, frameFormat, serializer, namingScheme).build();
	}

	public static  Multilog.Builder builder(
		Reactor reactor, IFileSystem fileSystem, FrameFormat frameFormat, BinarySerializer serializer,
		LogNamingScheme namingScheme
	) {
		return new Multilog<>(reactor, fileSystem, frameFormat, serializer, namingScheme).new Builder();
	}

	public final class Builder extends AbstractBuilder> {
		private Builder() {}

		public Builder withBufferSize(int bufferSize) {
			checkNotBuilt(this);
			Multilog.this.bufferSize = MemSize.of(bufferSize);
			return this;
		}

		public Builder withBufferSize(MemSize bufferSize) {
			checkNotBuilt(this);
			Multilog.this.bufferSize = bufferSize;
			return this;
		}

		public Builder withAutoFlushInterval(Duration autoFlushInterval) {
			checkNotBuilt(this);
			Multilog.this.autoFlushInterval = autoFlushInterval;
			return this;
		}

		public Builder withIgnoreMalformedLogs(boolean ignore) {
			checkNotBuilt(this);
			Multilog.this.ignoreMalformedLogs = ignore;
			return this;
		}

		@Override
		protected Multilog doBuild() {
			return Multilog.this;
		}
	}

	@Override
	public Promise> write(String logPartition) {
		checkInReactorThread(this);
		validateLogPartition(logPartition);

		return Promise.of(StreamConsumers.ofSupplier(
				supplier -> supplier
					.transformWith(ChannelSerializer.builder(serializer)
						.withAutoFlushInterval(autoFlushInterval)
						.withInitialBufferSize(bufferSize)
						.withSkipSerializationErrors()
						.build())
					.transformWith(streamWrites.register(logPartition))
					.transformWith(streamWriteStats)
					.bindTo(new LogStreamChunker(reactor, fileSystem, namingScheme, logPartition,
						consumer -> consumer.transformWith(
							ChannelFrameEncoder.builder(frameFormat)
								.withEncoderResets()
								.build()))))
			.withAcknowledgement(ack -> ack
				.mapException(e -> new MultilogException("Failed to write logs to partition '" + logPartition + '\'', e))));
	}

	@Override
	public Promise> read(
		String logPartition, LogFile startLogFile, long startOffset, @Nullable LogFile endLogFile
	) {
		checkInReactorThread(this);
		validateLogPartition(logPartition);
		LogPosition startPosition = LogPosition.create(startLogFile, startOffset);
		return fileSystem.list(namingScheme.getListGlob(logPartition))
			.map(files ->
				files.keySet().stream()
					.map(namingScheme::parse)
					.filter(Objects::nonNull)
					.filter(partitionAndFile -> partitionAndFile.logPartition().equals(logPartition))
					.map(PartitionAndFile::logFile)
					.collect(toList()))
			.map(logFiles -> {
				RefBoolean lastFileRef = new RefBoolean(true);
				return readLogFiles(logPartition, startPosition, logFiles.stream()
					.filter(logFile -> {
						if (logFile.compareTo(startPosition.getLogFile()) < 0)
							return false;

						if (endLogFile == null || logFile.compareTo(endLogFile) <= 0) {
							return true;
						}

						lastFileRef.set(false);
						return false;
					})
					.map(logFile -> logFile.equals(startPosition.getLogFile()) ?
						startPosition : LogPosition.create(logFile, 0)
					)
					.sorted()
					.collect(toList()), lastFileRef.get());
			})
			.mapException(e -> new MultilogException("Failed to read logs from partition '" + logPartition + '\'', e));
	}

	private StreamSupplierWithResult readLogFiles(String logPartition, LogPosition startPosition, List logFiles, boolean lastFile) {
		SettablePromise positionPromise = new SettablePromise<>();

		Iterator> logFileStreams = new Iterator>() {
			final Stopwatch sw = Stopwatch.createUnstarted();

			final Iterator it = logFiles.iterator();
			final CountingFrameFormat countingFormat = new CountingFrameFormat(frameFormat);
			LogPosition currentPosition;

			@Override
			public boolean hasNext() {
				if (it.hasNext()) return true;
				positionPromise.trySet(getLogPosition());
				return false;
			}

			LogPosition getLogPosition() {
				if (currentPosition == null)
					return startPosition;

				return LogPosition.create(currentPosition.getLogFile(), currentPosition.getPosition() + countingFormat.getCount());
			}

			@Override
			public StreamSupplier next() {
				currentPosition = it.next();
				long position = currentPosition.getPosition();
				LogFile currentLogFile = currentPosition.getLogFile();
				if (logger.isTraceEnabled())
					logger.trace("Read log file `{}` from: {}", currentLogFile, position);

				return StreamSuppliers.ofPromise(
					fileSystem.download(namingScheme.path(logPartition, currentLogFile), position, Long.MAX_VALUE)
						.then(Promise::of,
							e -> {
								if (ignoreMalformedLogs && e instanceof IllegalOffsetException) {
									if (logger.isWarnEnabled()) {
										logger.warn(
											"Ignoring log file whose size is less than log position {} {}:`{}` in {}, " +
											"previous position: {}",
											position, fileSystem,
											namingScheme.path(logPartition, currentPosition.getLogFile()), sw,
											countingFormat.getCount(),
											e);
									}
									return Promise.of(ChannelSuppliers.empty());
								}
								return Promise.ofException(e);
							})
						.map(fileStream -> {
							countingFormat.resetCount();
							sw.reset().start();
							return fileStream
								.transformWith(streamReads.register(
									logPartition + ":" + currentLogFile +
									"@" + position))
								.transformWith(streamReadStats)
								.transformWith(
									ChannelFrameDecoder.builder(countingFormat)
										.withDecoderResets()
										.build())
								.transformWith(supplier ->
									supplier.withEndOfStream(eos ->
										eos.map(identity(),
											e -> {
												if (e instanceof TruncatedDataException && !it.hasNext() && lastFile) {
													return null;
												}
												if (ignoreMalformedLogs && e instanceof MalformedDataException) {
													if (!logger.isWarnEnabled()) return null;

													logger.warn(
														"Ignoring malformed log file {}:`{}` in {}, " +
														"previous position: {}",
														fileSystem,
														namingScheme.path(logPartition, currentPosition.getLogFile()),
														sw, countingFormat.getCount(),
														e);
													return null;
												} else {
													throw e;
												}
											})))
								.transformWith(ChannelDeserializer.create(serializer))
								.withEndOfStream(eos ->
									eos.whenComplete(($, e) -> log(e)));
						}));
			}

			private void log(Exception e) {
				if (e == null && logger.isTraceEnabled()) {
					logger.trace("Finish log file {}:`{}` in {}, compressed bytes: {} ({} bytes/s)",
						fileSystem, namingScheme.path(logPartition, currentPosition.getLogFile()),
						sw, countingFormat.getCount(), countingFormat.getCount() / Math.max(sw.elapsed(SECONDS), 1));
				} else if (e != null && logger.isErrorEnabled()) {
					logger.error("Error on log file {}:`{}` in {}, compressed bytes: {} ({} bytes/s)",
						fileSystem, namingScheme.path(logPartition, currentPosition.getLogFile()),
						sw, countingFormat.getCount(), countingFormat.getCount() / Math.max(sw.elapsed(SECONDS), 1), e);
				}
			}
		};

		return StreamSupplierWithResult.of(StreamSuppliers.concat(logFileStreams), positionPromise);
	}

	private static void validateLogPartition(String logPartition) {
		checkArgument(!logPartition.contains("-"), "Using dash (-) in log partition name is not allowed");
	}

	@JmxAttribute
	public boolean isIgnoreMalformedLogs() {
		return ignoreMalformedLogs;
	}

	@JmxAttribute
	public MemSize getBufferSize() {
		return bufferSize;
	}

	@JmxAttribute
	public Duration getAutoFlushInterval() {
		return autoFlushInterval;
	}

	@SuppressWarnings("rawtypes")
	@JmxAttribute
	public StreamRegistry getStreamReads() {
		return streamReads;
	}

	@SuppressWarnings("rawtypes")
	@JmxAttribute
	public StreamRegistry getStreamWrites() {
		return streamWrites;
	}

	@SuppressWarnings("rawtypes")
	@JmxAttribute
	public DetailedStreamStats getStreamReadStats() {
		return streamReadStats;
	}

	@SuppressWarnings("rawtypes")
	@JmxAttribute
	public DetailedStreamStats getStreamWriteStats() {
		return streamWriteStats;
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy