com.google.common.flogger.backend.MetadataProcessor Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of runtime-impl-jetty12 Show documentation
There is a newer version: 2.0.31
/*
 * Copyright (C) 2020 The Flogger Authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.google.common.flogger.backend;

import static com.google.common.flogger.util.Checks.checkArgument;
import static com.google.common.flogger.util.Checks.checkNotNull;

import com.google.common.flogger.MetadataKey;
import java.util.AbstractSet;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Map;
import java.util.NoSuchElementException;
import java.util.Set;

/**
 * Processor combining scope and log-site metadata into a single view. This is necessary when
 * backends wish to combine metadata without incurring the cost of building maps etc. While it is
 * not strictly necessary to use this processor when handling metadata, it is recommended.
 *
 * <p>The expected usage pattern for this class is that:
 *
 * <ol>
 *   <li>The logger backend creates one or more stateless {@link MetadataHandler} instances as
 *       static constants. These should be immutable and thread safe since they include only code.
 *   <li>When handling a log statement, the logger backend generates a {@link MetadataProcessor} in
 *       the logging thread for the current scope and log-site metadata.
 *   <li>The processor can then be repeatedly used to dispatch calls to one or more of the handlers,
 *       potentially with different mutable context instances.
 * </ol>
 *
 * <p>By splitting the various life-cycles (handler, processor, contexts) this approach should help
 * minimize the cost of processing metadata per log statement.
 *
 * <p>Instances of MetadataProcessor are reusable, but not thread safe. All metadata processing must
 * be done in the logging thread.
 */
public abstract class MetadataProcessor {
  // Immutable empty processor which never handles any metadata.
  private static final MetadataProcessor EMPTY_PROCESSOR = new MetadataProcessor() {
    @Override
    public  void process(MetadataHandler handler, C context) {}

    @Override
    public  void handle(MetadataKey key, MetadataHandler handler, C context) {}

    @Override
    public  T getSingleValue(MetadataKey key) {
      return null;
    }

    @Override
    public int keyCount() {
      return 0;
    }

    @Override
    public Set> keySet() {
      return Collections.emptySet();
    }
  };

  /**
   * Creates a processor presenting scope and log-site metadata as one combined view. The returned
   * instance may read directly from the supplied metadata while processing, so neither argument
   * may be modified for as long as the processor is in use.
   *
   * @param scopeMetadata Metadata for the current scope (i.e. from {@code ScopedLoggingContext})
   * @param logMetadata Metadata extracted from the current log statement (i.e. from {@code
   *     LogData})
   * @return a processor to handle a unified view of the data
   */
  public static MetadataProcessor forScopeAndLogSite(Metadata scopeMetadata, Metadata logMetadata) {
    int combinedSize = scopeMetadata.size() + logMetadata.size();
    // Nothing to process: hand back the shared no-op instance instead of allocating.
    if (combinedSize == 0) {
      return EMPTY_PROCESSOR;
    }
    // Small inputs fit the bit-packed implementation; anything larger uses the map-based one.
    return (combinedSize <= LightweightProcessor.MAX_LIGHTWEIGHT_ELEMENTS)
        ? getLightweightProcessor(scopeMetadata, logMetadata)
        : getSimpleProcessor(scopeMetadata, logMetadata);
  }

  // Visible for testing: lets a test construct the lightweight implementation directly rather
  // than going through the size-based selection in forScopeAndLogSite().
  static MetadataProcessor getLightweightProcessor(Metadata scope, Metadata logged) {
    MetadataProcessor lightweight = new LightweightProcessor(scope, logged);
    return lightweight;
  }

  // Visible for testing: lets a test construct the map-based implementation directly rather
  // than going through the size-based selection in forScopeAndLogSite().
  static MetadataProcessor getSimpleProcessor(Metadata scope, Metadata logged) {
    MetadataProcessor simple = new SimpleProcessor(scope, logged);
    return simple;
  }

  private MetadataProcessor() {
    // Private so that only the implementations nested inside this class can extend it.
  }

  /**
   * Processes a combined view of the scope and log-site metadata in this processor by invoking the
   * given handler for each distinct metadata key. The handler method invoked depends on whether the
   * key is single valued or repeated.
   *
   * <p>Rules for merging scope and log-site metadata are as follows:
   *
   * <ul>
   *   <li>Distinct keys are iterated in the order they were first declared, with scope keys
   *       preceding log-site keys.
   *   <li>For singleton keys, a log-site value replaces any value supplied in the scope.
   *   <li>For repeated keys, all values are collected in declaration order, with scope values
   *       preceding log-site values.
   * </ul>
   *
   * <p>Note that equal or identical repeated values are permitted, and no "deduplication" is
   * performed. This is very much in contrast to the {@link com.google.common.flogger.context.Tags
   * Tags} mechanism, which de-duplicates mappings and reorders keys and values to generate a
   * minimal, canonical representation.
   *
   * <p>Furthermore, scope-supplied tags will be a single value in the scope metadata, keyed with
   * the {@link com.google.common.flogger.LogContext.Key#TAGS TAGS} key.
   *
   * @param <C> the type of the context instance passed through to the handler
   * @param handler the metadata handler to be called back
   * @param context arbitrary context instance to be passed into each callback.
   */
  public abstract <C> void process(MetadataHandler<C> handler, C context);

  /**
   * Invokes the given handler for the combined scope and log-site metadata for a specified key. The
   * handler method invoked depends on whether the key is single valued or repeated. If no metadata
   * is present for the given key, the handler is not invoked.
   *
   * @param <C> the type of the context instance passed through to the handler
   * @param key the metadata key whose value(s) should be dispatched
   * @param handler the metadata handler to be called back
   * @param context arbitrary context instance to be passed into the callback
   */
  public abstract <C> void handle(MetadataKey<?> key, MetadataHandler<C> handler, C context);

  /**
   * Returns the unique value for a single valued key, or {@code null} if not present.
   *
   * @param <T> the value type of the key
   * @param key the single valued key to look up
   * @return the value associated with the key, or {@code null} if the key is not present
   * @throws IllegalArgumentException if passed a repeatable key (even if that key has one value).
   */
  public abstract <T> T getSingleValue(MetadataKey<T> key);

  /**
   * Returns the number of unique keys represented by this processor. This is the same as the size
   * of {@link #keySet()}, but a separate method to avoid needing to allocate anything just to know
   * the number of keys.
   *
   * @return the number of distinct metadata keys (zero for a processor with no metadata)
   */
  public abstract int keyCount();

  /**
   * Returns the set of {@link MetadataKey}s known to this processor, in the order in which they
   * will be processed. Note that this implementation is lightweight, but not necessarily performant
   * for things like containment testing.
   */
  public abstract Set> keySet();

  /*
   * The values in the keyMap array are structured as:
   *     [ bits 31-5 : bitmap of additional repeated indices | bits 4-0 first value index ]
   *
   * There are 27 additional bits for the mask, but since index 0 could never be an "additional"
   * value, the bit-mask indices only need to start from 1, giving a maximum of:
   *    1 (first value index) + 27 (additional repeated indices in mask)
   * indices in total.
   *
   * Obviously this could be extended to a "long", but the bloom filter is only efficient up to
   * about 10-15 elements (and that's a super rare case anyway). At some point it's just not worth
   * trying to squeeze anymore value from this class and the "SimpleProcessor" should be used
   * instead (we might even want to switch before hitting 28 elements depending on performance).
   */
  private static final class LightweightProcessor extends MetadataProcessor {
    private static final int MAX_LIGHTWEIGHT_ELEMENTS = 28;

    private final Metadata scope;
    private final Metadata logged;
    // Mapping of key/value indices for distinct keys (kept in key "encounter" order).
    private final int[] keyMap;
    // Count of unique keys in the keyMap.
    private final int keyCount;

    private LightweightProcessor(Metadata scope, Metadata logged) {
      this.scope = checkNotNull(scope, "scope metadata");
      this.logged = checkNotNull(logged, "logged metadata");
      // We can never have more distinct keys, so this never needs resizing. This should be the
      // only variable sized allocation required by this algorithm. When duplicate keys exist some
      // elements at the end of the array will be unused, but the array is typically small and it is
      // common for all keys to be distinct, so "right sizing" the array wouldn't be worth it.
      int maxKeyCount = scope.size() + logged.size();
      // This should be impossible (outside of tests).
      checkArgument(maxKeyCount <= MAX_LIGHTWEIGHT_ELEMENTS, "metadata size too large");
      this.keyMap = new int[maxKeyCount];
      this.keyCount = prepareKeyMap(keyMap);
    }

    @Override
    public  void process(MetadataHandler handler, C context) {
      for (int i = 0; i < keyCount; i++) {
        int n = keyMap[i];
        dispatch(getKey(n & 0x1F), n, handler, context);
      }
    }

    @Override
    public  void handle(MetadataKey key, MetadataHandler handler, C context) {
      int index = indexOf(key, keyMap, keyCount);
      if (index >= 0) {
        dispatch(key, keyMap[index], handler, context);
      }
    }

    @Override
    public  T getSingleValue(MetadataKey key) {
      checkArgument(!key.canRepeat(), "key must be single valued");
      int index = indexOf(key, keyMap, keyCount);
      // For single keys, the keyMap values are just the value index.
      return (index >= 0) ? key.cast(getValue(keyMap[index])) : null;
    }

    @Override
    public int keyCount() {
      return keyCount;
    }

    @Override
    public Set> keySet() {
      // We may want to cache this, since it's effectively immutable, but it's also a small and
      // likely short lived instance, so quite possibly not worth it for the cost of another field.
      return new AbstractSet>() {
        @Override
        public int size() {
          return keyCount;
        }

        @Override
        public Iterator> iterator() {
          return new Iterator>() {
            private int i = 0;

            @Override
            public boolean hasNext() {
              return i < keyCount;
            }

            @Override
            public MetadataKey next() {
              return getKey(keyMap[i++] & 0x1F);
            }

            @Override // in case we are on an earlier Java version with no default method for this
            public void remove() {
              throw new UnsupportedOperationException();
            }
          };
        }
      };
    }

    // Separate method to re-capture the value type.
    private  void dispatch(MetadataKey key, int n, MetadataHandler handler, C context) {
      if (!key.canRepeat()) {
        // For single keys, the keyMap values are just the value index.
        handler.handle(key, key.cast(getValue(n)), context);
      } else {
        handler.handleRepeated(key, new ValueIterator(key, n), context);
      }
    }

    // Note that this could be made a reusable instance (reset between callbacks) if we wanted to
    // same a little on allocations. However this is a fixed size instance and repeated keys are
    // a fairly unusual use case.
    private final class ValueIterator implements Iterator {
      private final MetadataKey key;
      private int nextIndex;
      // For repeated keys, the bits 5-32 contain a mask of additional indices (where bit 5
      // implies index 1, since index 0 cannot apply to an additional repeated value).
      private int mask;

      private ValueIterator(MetadataKey key, int valueIndices) {
        this.key = key;
        // Get the first element index (lowest 5 bits, 0-27).
        this.nextIndex = valueIndices & 0x1F;
        // Adjust keymap indices mask so bit-0 represents the index *after* the first element.
        // This adjustment is 5 (rather than the 4 with which indices are encoded) because we are
        // shifting past the first index.
        this.mask = valueIndices >>> (5 + nextIndex);
      }

      @Override
      public boolean hasNext() {
        return nextIndex >= 0;
      }

      @Override
      public T next() {
        T next = key.cast(getValue(nextIndex));
        if (mask != 0) {
          // Skip the previous value and any "gaps" in the mask to find the new next index.
          int skip = 1 + Integer.numberOfTrailingZeros(mask);
          mask >>>= skip;
          nextIndex += skip;
        } else {
          // After returning the current value we're done.
          nextIndex = -1;
        }
        return next;
      }

      @Override // in case we are on an earlier Java version with no default method for this
      public void remove() {
        throw new UnsupportedOperationException();
      }
    }

    // Fill the keyMap array and return the count of distinct keys found.
    private int prepareKeyMap(int[] keyMap) {
      long bloomFilterMask = 0L;
      int count = 0;
      for (int n = 0; n < keyMap.length; n++) {
        MetadataKey key = getKey(n);
        // Use the bloom filter mask to get a quick true-negative test for whether we've seen this
        // key before. Most keys are distinct and this test is very reliable up to 10-15 keys, so
        // it saves building a HashSet or similar to track the set of unique keys.
        long oldMask = bloomFilterMask;
        bloomFilterMask |= key.getBloomFilterMask();
        if (bloomFilterMask == oldMask) {
          // Very probably a duplicate key. This is rare compared to distinct keys, but will happen
          // (e.g. for repeated keys with several values). Now we find the index of the key (since
          // we need to update that element in the keyMap array). This is a linear search but in
          // normal usage should happen once or twice over a small set (e.g. 5 distinct elements).
          // It is still expected to be faster/cheaper than creating and populating a HashSet.
          //
          // NOTE: It is impossible to get here if (n == 0) because the key's bloom filter must have
          // at least one bit set so can never equal the initial mask first time round the loop.
          int i = indexOf(key, keyMap, count);
          // If the index is -1, it wasn't actually in the set and this was a false-positive.
          if (i != -1) {
            // Definitely duplicate key. The key could still be non-repeating though since it might
            // appear in both scope and logged metadata exactly once:
            // * For non-repeating keys, just replace the existing map value with the new index.
            // * For repeated keys, keep the index in the low 5-bits and set a new bit in the mask.
            //
            // Since we can never see (n == 0) here, we encode index 1 at bit 5 (hence "n + 4", not
            // "n + 5" below). This trick just gives us the ability to store one more index.
            keyMap[i] = key.canRepeat() ? keyMap[i] | (1 << (n + 4)) : n;
            continue;
          }
        }
        // This key is definitely not already in the keyMap, so add it and increment the count.
        keyMap[count++] = n;
      }
      return count;
    }

    // Returns the (unique) index into the keyMap array for the given key.
    private int indexOf(MetadataKey key, int[] keyMap, int count) {
      for (int i = 0; i < count; i++) {
        // Low 5 bits of keyMap values are *always* an index to a valid metadata key.
        if (key.equals(getKey(keyMap[i] & 0x1F))) {
          return i;
        }
      }
      return -1;
    }

    private MetadataKey getKey(int n) {
      int scopeSize = scope.size();
      return n >= scopeSize ? logged.getKey(n - scopeSize) : scope.getKey(n);
    }

    private Object getValue(int n) {
      int scopeSize = scope.size();
      return n >= scopeSize ? logged.getValue(n - scopeSize) : scope.getValue(n);
    }
  }

  /**
   * Simple version of a metadata processor which allocates "large" data structures. This is needed
   * when a large number of metadata elements need processing. It should behave exactly the same as
   * the "lightweight" processor if the supplied Metadata is correctly behaved and not modified
   * during processing.
   */
  private static final class SimpleProcessor extends MetadataProcessor {
    private final Map, Object> map;

    private SimpleProcessor(Metadata scope, Metadata logged) {
      LinkedHashMap, Object> map = new LinkedHashMap, Object>();
      addTo(map, scope);
      addTo(map, logged);
      // Wrap any repeated value lists to make them unmodifiable (required for correctness).
      for (Map.Entry, Object> e : map.entrySet()) {
        if (e.getKey().canRepeat()) {
          e.setValue(Collections.unmodifiableList((List) e.getValue()));
        }
      }
      this.map = Collections.unmodifiableMap(map);
    }

    // Unlike the LightweightProcessor, we copy references from the Metadata eagerly, so can "cast"
    // values to their key-types early, ensuring safe casting when dispatching.
    private static void addTo(Map, Object> map, Metadata metadata) {
      for (int i = 0; i < metadata.size(); i++) {
        MetadataKey key = metadata.getKey(i);
        Object value = map.get(key);
        if (key.canRepeat()) {
          @SuppressWarnings("unchecked")
          List