All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.common.flogger.backend.MetadataProcessor Maven / Gradle / Ivy

There is a newer version: 2.0.31
Show newest version
/*
 * Copyright (C) 2020 The Flogger Authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.google.common.flogger.backend;

import static com.google.common.flogger.util.Checks.checkArgument;
import static com.google.common.flogger.util.Checks.checkNotNull;

import com.google.common.flogger.MetadataKey;
import java.util.AbstractSet;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Map;
import java.util.Set;

/**
 * Processor combining scope and log-site metadata into a single view. This is necessary when
 * backends wish to combine metadata without incurring the cost of building maps etc. While it is
 * not strictly necessary to use this processor when handling metadata, it is recommended.
 *
 * 

The expected usage pattern for this class is that: * *

    *
  1. The logger backend creates one or more stateless {@link MetadataHandler} instances as * static constants. These should be immutable and thread safe since they include only code. *
  2. When handling a log statement, the logger backend generates a {@link MetadataProcessor} in * the logging thread for the current scope and log-site metadata. *
  3. The processor can then be repeatedly used to dispatch calls to one or more of the handlers, * potentially with different mutable context instances. *
* *

By splitting the various life-cycles (handler, processor, contexts) this approach should help * minimize the cost of processing metadata per log statement. * *

Instances of MetadataProcessor are reusable, but not thread safe. All metadata processing must * be done in the logging thread. */ public abstract class MetadataProcessor { // Immutable empty processor which never handles any metadata. private static final MetadataProcessor EMPTY_PROCESSOR = new MetadataProcessor() { @Override public void process(MetadataHandler handler, C context) {} @Override public void handle(MetadataKey key, MetadataHandler handler, C context) {} @Override public T getSingleValue(MetadataKey key) { return null; } @Override public int keyCount() { return 0; } @Override public Set> keySet() { return Collections.emptySet(); } }; /** * Returns a new processor for the combined scope and log-site metadata. Note that this returned * instance may read directly from the supplied metadata during processing, so the supplied * metadata must not be modified while the processor instance is being used. * * @param scopeMetadata Metadata for the current scope (i.e. from {@code ScopedLoggingContext}) * @param logMetadata Metadata extracted from the current log statement (i.e. from {@code * LogData}) * @return a processor to handle a unified view of the data */ public static MetadataProcessor forScopeAndLogSite(Metadata scopeMetadata, Metadata logMetadata) { int totalSize = scopeMetadata.size() + logMetadata.size(); if (totalSize == 0) { return EMPTY_PROCESSOR; } else if (totalSize <= LightweightProcessor.MAX_LIGHTWEIGHT_ELEMENTS) { return getLightweightProcessor(scopeMetadata, logMetadata); } else { return getSimpleProcessor(scopeMetadata, logMetadata); } } // Visible for testing static MetadataProcessor getLightweightProcessor(Metadata scope, Metadata logged) { return new LightweightProcessor(scope, logged); } // Visible for testing static MetadataProcessor getSimpleProcessor(Metadata scope, Metadata logged) { return new SimpleProcessor(scope, logged); } private MetadataProcessor() {} /** * Processes a combined view of the scope and log-site metadata in this processor by invoking the * given handler for each distinct metadata key. The handler method invoked depends on whether the * key is single valued or repeated. * *

Rules for merging scope and log-site metadata are as follows: * *

    *
  • Distinct keys are iterated in the order they were first declared, with scope keys * preceding log-site keys. *
  • For singleton keys, a log-site value replaces any value supplied in the scope. *
  • For repeated keys, all values are collected in declaration order, with scope values * preceding log-site values. *
* *

Note that equal or identical repeated values are permitted, and no "deduplication" is * performed. This is very much in contrast to the {@link com.google.common.flogger.context.Tags * Tags} mechanism, which de-duplicates mappings and reorders keys and values to generate a * minimal, canonical representation. * *

Furthermore, scope-supplied tags will be a single value in the scope metadata, keyed with * the {@link com.google.common.flogger.LogContext.Key#TAGS TAGS} key. * * @param handler the metadata handler to be called back * @param context arbitrary context instance to be passed into each callback. */ public abstract void process(MetadataHandler handler, C context); /** * Invokes the given handler for the combined scope and log-site metadata for a specified key. The * handler method invoked depends on whether the key is single valued or repeated. If no metadata * is present for the given key, the handler is not invoked. */ public abstract void handle(MetadataKey key, MetadataHandler handler, C context); /** * Returns the unique value for a single valued key, or {@code null} if not present. * * @throws IllegalArgumentException if passed a repeatable key (even if that key has one value). */ public abstract T getSingleValue(MetadataKey key); /** * Returns the number of unique keys represented by this processor. This is the same as the size * of {@link #keySet()}, but a separate method to avoid needing to allocate anything just to know * the number of keys. */ public abstract int keyCount(); /** * Returns the set of {@link MetadataKey}s known to this processor, in the order in which they * will be processed. Note that this implementation is lightweight, but not necessarily performant * for things like containment testing. */ public abstract Set> keySet(); /* * The values in the keyMap array are structured as: * [ bits 31-5 : bitmap of additional repeated indices | bits 4-0 first value index ] * * There are 27 additional bits for the mask, but since index 0 could never be an "additional" * value, the bit-mask indices only need to start from 1, giving a maximum of: * 1 (first value index) + 27 (additional repeated indices in mask) * indices in total. * * Obviously this could be extended to a "long", but the bloom filter is only efficient up to * about 10-15 elements (and that's a super rare case anyway). At some point it's just not worth * trying to squeeze anymore value from this class and the "SimpleProcessor" should be used * instead (we might even want to switch before hitting 28 elements depending on performance). */ private static final class LightweightProcessor extends MetadataProcessor { private static final int MAX_LIGHTWEIGHT_ELEMENTS = 28; private final Metadata scope; private final Metadata logged; // Mapping of key/value indices for distinct keys (kept in key "encounter" order). private final int[] keyMap; // Count of unique keys in the keyMap. private final int keyCount; private LightweightProcessor(Metadata scope, Metadata logged) { this.scope = checkNotNull(scope, "scope metadata"); this.logged = checkNotNull(logged, "logged metadata"); // We can never have more distinct keys, so this never needs resizing. This should be the // only variable sized allocation required by this algorithm. When duplicate keys exist some // elements at the end of the array will be unused, but the array is typically small and it is // common for all keys to be distinct, so "right sizing" the array wouldn't be worth it. int maxKeyCount = scope.size() + logged.size(); // This should be impossible (outside of tests). checkArgument(maxKeyCount <= MAX_LIGHTWEIGHT_ELEMENTS, "metadata size too large"); this.keyMap = new int[maxKeyCount]; this.keyCount = prepareKeyMap(keyMap); } @Override public void process(MetadataHandler handler, C context) { for (int i = 0; i < keyCount; i++) { int n = keyMap[i]; dispatch(getKey(n & 0x1F), n, handler, context); } } @Override public void handle(MetadataKey key, MetadataHandler handler, C context) { int index = indexOf(key, keyMap, keyCount); if (index >= 0) { dispatch(key, keyMap[index], handler, context); } } @Override public T getSingleValue(MetadataKey key) { checkArgument(!key.canRepeat(), "key must be single valued"); int index = indexOf(key, keyMap, keyCount); // For single keys, the keyMap values are just the value index. return (index >= 0) ? key.cast(getValue(keyMap[index])) : null; } @Override public int keyCount() { return keyCount; } @Override public Set> keySet() { // We may want to cache this, since it's effectively immutable, but it's also a small and // likely short lived instance, so quite possibly not worth it for the cost of another field. return new AbstractSet>() { @Override public int size() { return keyCount; } @Override public Iterator> iterator() { return new Iterator>() { private int i = 0; @Override public boolean hasNext() { return i < keyCount; } @Override public MetadataKey next() { return getKey(keyMap[i++] & 0x1F); } @Override // in case we are on an earlier Java version with no default method for this public void remove() { throw new UnsupportedOperationException(); } }; } }; } // Separate method to re-capture the value type. private void dispatch(MetadataKey key, int n, MetadataHandler handler, C context) { if (!key.canRepeat()) { // For single keys, the keyMap values are just the value index. handler.handle(key, key.cast(getValue(n)), context); } else { handler.handleRepeated(key, new ValueIterator(key, n), context); } } // Note that this could be made a reusable instance (reset between callbacks) if we wanted to // same a little on allocations. However this is a fixed size instance and repeated keys are // a fairly unusual use case. private final class ValueIterator implements Iterator { private final MetadataKey key; private int nextIndex; // For repeated keys, the bits 5-32 contain a mask of additional indices (where bit 5 // implies index 1, since index 0 cannot apply to an additional repeated value). private int mask; private ValueIterator(MetadataKey key, int valueIndices) { this.key = key; // Get the first element index (lowest 5 bits, 0-27). this.nextIndex = valueIndices & 0x1F; // Adjust keymap indices mask so bit-0 represents the index *after* the first element. // This adjustment is 5 (rather than the 4 with which indices are encoded) because we are // shifting past the first index. this.mask = valueIndices >>> (5 + nextIndex); } @Override public boolean hasNext() { return nextIndex >= 0; } @Override public T next() { T next = key.cast(getValue(nextIndex)); if (mask != 0) { // Skip the previous value and any "gaps" in the mask to find the new next index. int skip = 1 + Integer.numberOfTrailingZeros(mask); mask >>>= skip; nextIndex += skip; } else { // After returning the current value we're done. nextIndex = -1; } return next; } @Override // in case we are on an earlier Java version with no default method for this public void remove() { throw new UnsupportedOperationException(); } } // Fill the keyMap array and return the count of distinct keys found. private int prepareKeyMap(int[] keyMap) { long bloomFilterMask = 0L; int count = 0; for (int n = 0; n < keyMap.length; n++) { MetadataKey key = getKey(n); // Use the bloom filter mask to get a quick true-negative test for whether we've seen this // key before. Most keys are distinct and this test is very reliable up to 10-15 keys, so // it saves building a HashSet or similar to track the set of unique keys. long oldMask = bloomFilterMask; bloomFilterMask |= key.getBloomFilterMask(); if (bloomFilterMask == oldMask) { // Very probably a duplicate key. This is rare compared to distinct keys, but will happen // (e.g. for repeated keys with several values). Now we find the index of the key (since // we need to update that element in the keyMap array). This is a linear search but in // normal usage should happen once or twice over a small set (e.g. 5 distinct elements). // It is still expected to be faster/cheaper than creating and populating a HashSet. // // NOTE: It is impossible to get here if (n == 0) because the key's bloom filter must have // at least one bit set so can never equal the initial mask first time round the loop. int i = indexOf(key, keyMap, count); // If the index is -1, it wasn't actually in the set and this was a false-positive. if (i != -1) { // Definitely duplicate key. The key could still be non-repeating though since it might // appear in both scope and logged metadata exactly once: // * For non-repeating keys, just replace the existing map value with the new index. // * For repeated keys, keep the index in the low 5-bits and set a new bit in the mask. // // Since we can never see (n == 0) here, we encode index 1 at bit 5 (hence "n + 4", not // "n + 5" below). This trick just gives us the ability to store one more index. keyMap[i] = key.canRepeat() ? keyMap[i] | (1 << (n + 4)) : n; continue; } } // This key is definitely not already in the keyMap, so add it and increment the count. keyMap[count++] = n; } return count; } // Returns the (unique) index into the keyMap array for the given key. private int indexOf(MetadataKey key, int[] keyMap, int count) { for (int i = 0; i < count; i++) { // Low 5 bits of keyMap values are *always* an index to a valid metadata key. if (key.equals(getKey(keyMap[i] & 0x1F))) { return i; } } return -1; } private MetadataKey getKey(int n) { int scopeSize = scope.size(); return n >= scopeSize ? logged.getKey(n - scopeSize) : scope.getKey(n); } private Object getValue(int n) { int scopeSize = scope.size(); return n >= scopeSize ? logged.getValue(n - scopeSize) : scope.getValue(n); } } /** * Simple version of a metadata processor which allocates "large" data structures. This is needed * when a large number of metadata elements need processing. It should behave exactly the same as * the "lightweight" processor if the supplied Metadata is correctly behaved and not modified * during processing. */ private static final class SimpleProcessor extends MetadataProcessor { private final Map, Object> map; private SimpleProcessor(Metadata scope, Metadata logged) { LinkedHashMap, Object> map = new LinkedHashMap, Object>(); addTo(map, scope); addTo(map, logged); // Wrap any repeated value lists to make them unmodifiable (required for correctness). for (Map.Entry, Object> e : map.entrySet()) { if (e.getKey().canRepeat()) { e.setValue(Collections.unmodifiableList((List) e.getValue())); } } this.map = Collections.unmodifiableMap(map); } // Unlike the LightweightProcessor, we copy references from the Metadata eagerly, so can "cast" // values to their key-types early, ensuring safe casting when dispatching. private static void addTo(Map, Object> map, Metadata metadata) { for (int i = 0; i < metadata.size(); i++) { MetadataKey key = metadata.getKey(i); Object value = map.get(key); if (key.canRepeat()) { @SuppressWarnings("unchecked") List list = (List) value; if (list == null) { list = new ArrayList(); map.put(key, list); } // Cast value to ensure that "repeated key is MetadataKey" implies "value is List" list.add(key.cast(metadata.getValue(i))); } else { // Cast value to ensure that "singleton key is MetadataKey" implies "value is T". map.put(key, key.cast(metadata.getValue(i))); } } } @Override public void process(MetadataHandler handler, C context) { for (Map.Entry, Object> e : map.entrySet()) { dispatch(e.getKey(), e.getValue(), handler, context); } } @Override public void handle(MetadataKey key, MetadataHandler handler, C context) { Object value = map.get(key); if (value != null) { dispatch(key, value, handler, context); } } // It's safe to ignore warnings since single keys are only ever 'T' when added to the map. @Override @SuppressWarnings("unchecked") public T getSingleValue(MetadataKey key) { checkArgument(!key.canRepeat(), "key must be single valued"); Object value = map.get(key); return (value != null) ? (T) value : null; } @Override public int keyCount() { return map.size(); } @Override public Set> keySet() { return map.keySet(); } // It's safe to ignore warnings here since we know that repeated keys only ever get 'List' // and single keys are only ever 'T' when added to the map. @SuppressWarnings("unchecked") private static void dispatch( MetadataKey key, Object value, MetadataHandler handler, C context) { if (key.canRepeat()) { handler.handleRepeated(key, ((List) value).iterator(), context); } else { handler.handle(key, (T) value, context); } } } }