All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.protobuf.DescriptorMessageInfoFactory Maven / Gradle / Ivy

Go to download

Core Protocol Buffers library. Protocol Buffers are a way of encoding structured data in an efficient yet extensible format.

There is a newer version: 4.29.2
Show newest version
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd

package com.google.protobuf;

import static com.google.protobuf.FieldInfo.forExplicitPresenceField;
import static com.google.protobuf.FieldInfo.forField;
import static com.google.protobuf.FieldInfo.forFieldWithEnumVerifier;
import static com.google.protobuf.FieldInfo.forLegacyRequiredField;
import static com.google.protobuf.FieldInfo.forMapField;
import static com.google.protobuf.FieldInfo.forOneofMemberField;
import static com.google.protobuf.FieldInfo.forPackedField;
import static com.google.protobuf.FieldInfo.forPackedFieldWithEnumVerifier;
import static com.google.protobuf.FieldInfo.forRepeatedMessageField;

import com.google.protobuf.Descriptors.Descriptor;
import com.google.protobuf.Descriptors.FieldDescriptor;
import com.google.protobuf.Descriptors.FieldDescriptor.Type;
import com.google.protobuf.Descriptors.OneofDescriptor;
import java.lang.reflect.Field;
import java.lang.reflect.Method;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.Stack;
import java.util.concurrent.ConcurrentHashMap;

/** A factory for message info based on protobuf descriptors for a {@link GeneratedMessage}. */
@ExperimentalApi
final class DescriptorMessageInfoFactory implements MessageInfoFactory {
  private static final String GET_DEFAULT_INSTANCE_METHOD_NAME = "getDefaultInstance";
  private static final DescriptorMessageInfoFactory instance = new DescriptorMessageInfoFactory();

  /**
   * Names that should be avoided (in UpperCamelCase format). Using them causes the compiler to
   * generate accessors whose names collide with methods defined in base classes.
   *
   * 

Keep this list in sync with kForbiddenWordList in * src/google/protobuf/compiler/java/java_helpers.cc */ private static final Set specialFieldNames = new HashSet<>( Arrays.asList( // java.lang.Object: "Class", // com.google.protobuf.MessageLiteOrBuilder: "DefaultInstanceForType", // com.google.protobuf.MessageLite: "ParserForType", "SerializedSize", // com.google.protobuf.MessageOrBuilder: "AllFields", "DescriptorForType", "InitializationErrorString", "UnknownFields", // obsolete. kept for backwards compatibility of generated code "CachedSize")); // Disallow construction - it's a singleton. private DescriptorMessageInfoFactory() {} public static DescriptorMessageInfoFactory getInstance() { return instance; } @Override public boolean isSupported(Class messageType) { return GeneratedMessage.class.isAssignableFrom(messageType); } @Override public MessageInfo messageInfoFor(Class messageType) { if (!GeneratedMessage.class.isAssignableFrom(messageType)) { throw new IllegalArgumentException("Unsupported message type: " + messageType.getName()); } return convert(messageType, descriptorForType(messageType)); } private static Message getDefaultInstance(Class messageType) { try { Method method = messageType.getDeclaredMethod(GET_DEFAULT_INSTANCE_METHOD_NAME); return (Message) method.invoke(null); } catch (Exception e) { throw new IllegalArgumentException( "Unable to get default instance for message class " + messageType.getName(), e); } } private static Descriptor descriptorForType(Class messageType) { return getDefaultInstance(messageType).getDescriptorForType(); } private static ProtoSyntax convertSyntax(DescriptorProtos.Edition edition) { switch (edition) { case EDITION_PROTO2: return ProtoSyntax.PROTO2; case EDITION_PROTO3: return ProtoSyntax.PROTO3; default: return ProtoSyntax.EDITIONS; } } private static MessageInfo convert(Class messageType, Descriptor messageDescriptor) { List fieldDescriptors = messageDescriptor.getFields(); StructuralMessageInfo.Builder builder = StructuralMessageInfo.newBuilder(fieldDescriptors.size()); builder.withDefaultInstance(getDefaultInstance(messageType)); builder.withSyntax(convertSyntax(messageDescriptor.getFile().getEdition())); builder.withMessageSetWireFormat(messageDescriptor.getOptions().getMessageSetWireFormat()); OneofState oneofState = new OneofState(); // Performance optimization to cache presence bits across field iterations. int bitFieldIndex = 0; int presenceMask = 1; Field bitField = null; // Fields in the descriptor are ordered by the index position in which they appear in the // proto file. This is the same order used to determine the presence mask used in the // bitFields. So to determine the appropriate presence mask to be used for a field, we simply // need to shift the presence mask whenever a presence-checked field is encountered. for (int i = 0; i < fieldDescriptors.size(); ++i) { final FieldDescriptor fd = fieldDescriptors.get(i); boolean enforceUtf8 = fd.needsUtf8Check(); Internal.EnumVerifier enumVerifier = null; // Enum verifier for closed enums. if (fd.getJavaType() == Descriptors.FieldDescriptor.JavaType.ENUM && fd.legacyEnumFieldTreatedAsClosed()) { enumVerifier = new Internal.EnumVerifier() { @Override public boolean isInRange(int number) { return fd.getEnumType().findValueByNumber(number) != null; } }; } if (fd.getRealContainingOneof() != null) { // Build a oneof member field for non-synthetic oneofs. builder.withField(buildOneofMember(messageType, fd, oneofState, enforceUtf8, enumVerifier)); continue; } Field field = field(messageType, fd); int number = fd.getNumber(); FieldType type = getFieldType(fd); // Handle field with implicit presence. if (!fd.hasPresence()) { FieldInfo fieldImplicitPresence; if (fd.isMapField()) { // Map field points to an auto-generated message entry type with the definition: // message MapEntry { // K key = 1; // V value = 2; // } final FieldDescriptor valueField = fd.getMessageType().findFieldByNumber(2); if (valueField.getJavaType() == Descriptors.FieldDescriptor.JavaType.ENUM && valueField.legacyEnumFieldTreatedAsClosed()) { enumVerifier = new Internal.EnumVerifier() { @Override public boolean isInRange(int number) { return valueField.getEnumType().findValueByNumber(number) != null; } }; } fieldImplicitPresence = forMapField( field, number, SchemaUtil.getMapDefaultEntry(messageType, fd.getName()), enumVerifier); } else if (fd.isRepeated() && fd.getJavaType() == FieldDescriptor.JavaType.MESSAGE) { fieldImplicitPresence = forRepeatedMessageField( field, number, type, getTypeForRepeatedMessageField(messageType, fd)); } else if (fd.isPacked()) { if (enumVerifier != null) { fieldImplicitPresence = forPackedFieldWithEnumVerifier( field, number, type, enumVerifier, cachedSizeField(messageType, fd)); } else { fieldImplicitPresence = forPackedField(field, number, type, cachedSizeField(messageType, fd)); } } else { if (enumVerifier != null) { fieldImplicitPresence = forFieldWithEnumVerifier(field, number, type, enumVerifier); } else { fieldImplicitPresence = forField(field, number, type, enforceUtf8); } } builder.withField(fieldImplicitPresence); continue; } // Handle field with explicit presence. FieldInfo fieldExplicitPresence; if (bitField == null) { // Lazy-create the next bitfield since we know it must exist. bitField = bitField(messageType, bitFieldIndex); } if (fd.isRequired()) { fieldExplicitPresence = forLegacyRequiredField( field, number, type, bitField, presenceMask, enforceUtf8, enumVerifier); } else { fieldExplicitPresence = forExplicitPresenceField( field, number, type, bitField, presenceMask, enforceUtf8, enumVerifier); } builder.withField(fieldExplicitPresence); // Update the presence mask for the next iteration. If the shift clears out the mask, we // will go to the next bitField. presenceMask <<= 1; if (presenceMask == 0) { bitField = null; presenceMask = 1; bitFieldIndex++; } } List fieldsToCheckIsInitialized = new ArrayList<>(); for (int i = 0; i < fieldDescriptors.size(); ++i) { FieldDescriptor fd = fieldDescriptors.get(i); if (fd.isRequired() || (fd.getJavaType() == FieldDescriptor.JavaType.MESSAGE && needsIsInitializedCheck(fd.getMessageType()))) { fieldsToCheckIsInitialized.add(fd.getNumber()); } } int[] numbers = new int[fieldsToCheckIsInitialized.size()]; for (int i = 0; i < fieldsToCheckIsInitialized.size(); i++) { numbers[i] = fieldsToCheckIsInitialized.get(i); } if (numbers.length > 0) { builder.withCheckInitialized(numbers); } return builder.build(); } /** * A helper class to determine whether a message type needs to implement {@code isInitialized()}. * *

If a message type doesn't have any required fields or extensions (directly and * transitively), it doesn't need to implement isInitialized() and can always return true there. * It's a bit tricky to determine whether a type has transitive required fields because protobuf * allows cycle references within the same .proto file (e.g., message Foo has a Bar field, and * message Bar has a Foo field). For that we use Tarjan's strongly connected components algorithm * to classify messages into strongly connected groups. Messages in the same group are * transitively including each other, so they should either all have transitive required fields * (or extensions), or none have. * *

This class is thread-safe. */ //

The code is adapted from the C++ implementation: // https://github.com/protocolbuffers/protobuf/blob/main/src/google/protobuf/compiler/java/java_helpers.h static class IsInitializedCheckAnalyzer { private final Map resultCache = new ConcurrentHashMap(); // The following data members are part of Tarjan's SCC algorithm. See: // https://en.wikipedia.org/wiki/Tarjan%27s_strongly_connected_components_algorithm private int index = 0; private final Stack stack = new Stack(); private final Map nodeCache = new HashMap(); public boolean needsIsInitializedCheck(Descriptor descriptor) { Boolean cachedValue = resultCache.get(descriptor); if (cachedValue != null) { return cachedValue; } synchronized (this) { // Double-check the cache because some other thread may have updated it while we // were acquiring the lock. cachedValue = resultCache.get(descriptor); if (cachedValue != null) { return cachedValue; } return dfs(descriptor).component.needsIsInitializedCheck; } } private static class Node { final Descriptor descriptor; final int index; int lowLink; StronglyConnectedComponent component; // null if the node is still on stack. Node(Descriptor descriptor, int index) { this.descriptor = descriptor; this.index = index; this.lowLink = index; this.component = null; } } private static class StronglyConnectedComponent { final List messages = new ArrayList(); boolean needsIsInitializedCheck = false; } private Node dfs(Descriptor descriptor) { Node result = new Node(descriptor, index++); stack.push(result); nodeCache.put(descriptor, result); // Recurse the fields / nodes in graph for (FieldDescriptor field : descriptor.getFields()) { if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) { Node child = nodeCache.get(field.getMessageType()); if (child == null) { // Unexplored node child = dfs(field.getMessageType()); result.lowLink = Math.min(result.lowLink, child.lowLink); } else { if (child.component == null) { // Still in the stack so we found a back edge. result.lowLink = Math.min(result.lowLink, child.lowLink); } } } } if (result.index == result.lowLink) { // This is the root of a strongly connected component. StronglyConnectedComponent component = new StronglyConnectedComponent(); while (true) { Node node = stack.pop(); node.component = component; component.messages.add(node.descriptor); if (node == result) { break; } } analyze(component); } return result; } // Determine whether messages in this SCC needs isInitialized check. private void analyze(StronglyConnectedComponent component) { boolean needsIsInitializedCheck = false; loop: for (Descriptor descriptor : component.messages) { if (descriptor.isExtendable()) { needsIsInitializedCheck = true; break; } for (FieldDescriptor field : descriptor.getFields()) { if (field.isRequired()) { needsIsInitializedCheck = true; break loop; } if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) { // Since we are analyzing the graph bottom-up, all referenced fields should either be // in this same component or in a different already-analyzed component. Node node = nodeCache.get(field.getMessageType()); if (node.component != component) { if (node.component.needsIsInitializedCheck) { needsIsInitializedCheck = true; break loop; } } } } } component.needsIsInitializedCheck = needsIsInitializedCheck; for (Descriptor descriptor : component.messages) { resultCache.put(descriptor, component.needsIsInitializedCheck); } } } private static IsInitializedCheckAnalyzer isInitializedCheckAnalyzer = new IsInitializedCheckAnalyzer(); private static boolean needsIsInitializedCheck(Descriptor descriptor) { return isInitializedCheckAnalyzer.needsIsInitializedCheck(descriptor); } /** Builds info for a oneof member field. */ private static FieldInfo buildOneofMember( Class messageType, FieldDescriptor fd, OneofState oneofState, boolean enforceUtf8, Internal.EnumVerifier enumVerifier) { OneofInfo oneof = oneofState.getOneof(messageType, fd.getContainingOneof()); FieldType type = getFieldType(fd); Class oneofStoredType = getOneofStoredType(messageType, fd, type); return forOneofMemberField( fd.getNumber(), type, oneof, oneofStoredType, enforceUtf8, enumVerifier); } private static Class getOneofStoredType( Class messageType, FieldDescriptor fd, FieldType type) { switch (type.getJavaType()) { case BOOLEAN: return Boolean.class; case BYTE_STRING: return ByteString.class; case DOUBLE: return Double.class; case FLOAT: return Float.class; case ENUM: case INT: return Integer.class; case LONG: return Long.class; case STRING: return String.class; case MESSAGE: return getOneofStoredTypeForMessage(messageType, fd); default: throw new IllegalArgumentException("Invalid type for oneof: " + type); } } private static FieldType getFieldType(FieldDescriptor fd) { switch (fd.getType()) { case BOOL: if (!fd.isRepeated()) { return FieldType.BOOL; } return fd.isPacked() ? FieldType.BOOL_LIST_PACKED : FieldType.BOOL_LIST; case BYTES: return fd.isRepeated() ? FieldType.BYTES_LIST : FieldType.BYTES; case DOUBLE: if (!fd.isRepeated()) { return FieldType.DOUBLE; } return fd.isPacked() ? FieldType.DOUBLE_LIST_PACKED : FieldType.DOUBLE_LIST; case ENUM: if (!fd.isRepeated()) { return FieldType.ENUM; } return fd.isPacked() ? FieldType.ENUM_LIST_PACKED : FieldType.ENUM_LIST; case FIXED32: if (!fd.isRepeated()) { return FieldType.FIXED32; } return fd.isPacked() ? FieldType.FIXED32_LIST_PACKED : FieldType.FIXED32_LIST; case FIXED64: if (!fd.isRepeated()) { return FieldType.FIXED64; } return fd.isPacked() ? FieldType.FIXED64_LIST_PACKED : FieldType.FIXED64_LIST; case FLOAT: if (!fd.isRepeated()) { return FieldType.FLOAT; } return fd.isPacked() ? FieldType.FLOAT_LIST_PACKED : FieldType.FLOAT_LIST; case GROUP: return fd.isRepeated() ? FieldType.GROUP_LIST : FieldType.GROUP; case INT32: if (!fd.isRepeated()) { return FieldType.INT32; } return fd.isPacked() ? FieldType.INT32_LIST_PACKED : FieldType.INT32_LIST; case INT64: if (!fd.isRepeated()) { return FieldType.INT64; } return fd.isPacked() ? FieldType.INT64_LIST_PACKED : FieldType.INT64_LIST; case MESSAGE: if (fd.isMapField()) { return FieldType.MAP; } return fd.isRepeated() ? FieldType.MESSAGE_LIST : FieldType.MESSAGE; case SFIXED32: if (!fd.isRepeated()) { return FieldType.SFIXED32; } return fd.isPacked() ? FieldType.SFIXED32_LIST_PACKED : FieldType.SFIXED32_LIST; case SFIXED64: if (!fd.isRepeated()) { return FieldType.SFIXED64; } return fd.isPacked() ? FieldType.SFIXED64_LIST_PACKED : FieldType.SFIXED64_LIST; case SINT32: if (!fd.isRepeated()) { return FieldType.SINT32; } return fd.isPacked() ? FieldType.SINT32_LIST_PACKED : FieldType.SINT32_LIST; case SINT64: if (!fd.isRepeated()) { return FieldType.SINT64; } return fd.isPacked() ? FieldType.SINT64_LIST_PACKED : FieldType.SINT64_LIST; case STRING: return fd.isRepeated() ? FieldType.STRING_LIST : FieldType.STRING; case UINT32: if (!fd.isRepeated()) { return FieldType.UINT32; } return fd.isPacked() ? FieldType.UINT32_LIST_PACKED : FieldType.UINT32_LIST; case UINT64: if (!fd.isRepeated()) { return FieldType.UINT64; } return fd.isPacked() ? FieldType.UINT64_LIST_PACKED : FieldType.UINT64_LIST; default: throw new IllegalArgumentException("Unsupported field type: " + fd.getType()); } } private static Field bitField(Class messageType, int index) { return field(messageType, "bitField" + index + "_"); } private static Field field(Class messageType, FieldDescriptor fd) { return field(messageType, getFieldName(fd)); } private static Field cachedSizeField(Class messageType, FieldDescriptor fd) { return field(messageType, getCachedSizeFieldName(fd)); } private static Field field(Class messageType, String fieldName) { try { return messageType.getDeclaredField(fieldName); } catch (Exception e) { throw new IllegalArgumentException( "Unable to find field " + fieldName + " in message class " + messageType.getName()); } } static String getFieldName(FieldDescriptor fd) { String name = (fd.getType() == FieldDescriptor.Type.GROUP) ? fd.getMessageType().getName() : fd.getName(); // convert to UpperCamelCase for comparison to the specialFieldNames // (which are in UpperCamelCase) String upperCamelCaseName = snakeCaseToUpperCamelCase(name); // Append underscores to match the behavior of the protoc java compiler final String suffix; if (specialFieldNames.contains(upperCamelCaseName)) { // For proto field names that match the specialFieldNames, // the protoc java compiler appends "__" to the java field name // to prevent the field's accessor method names from clashing with other methods. // For example: // proto field name = "class" // java field name = "class__" // accessor method name = "getClass_()" (so that it does not clash with // Object.getClass()) suffix = "__"; } else { // For other proto field names, // the protoc java compiler appends "_" to the java field name // to prevent field names from clashing with java keywords. // For example: // proto field name = "int" // java field name = "int_" (so that it does not clash with int keyword) // accessor method name = "getInt()" suffix = "_"; } return snakeCaseToLowerCamelCase(name) + suffix; } private static String getCachedSizeFieldName(FieldDescriptor fd) { return snakeCaseToLowerCamelCase(fd.getName()) + "MemoizedSerializedSize"; } /** * Converts a snake case string into lower camel case. * *

Some examples: * *

   *     snakeCaseToLowerCamelCase("foo_bar") => "fooBar"
   *     snakeCaseToLowerCamelCase("foo") => "foo"
   * 
* * @param snakeCase the string in snake case to convert * @return the string converted to camel case, with a lowercase first character */ private static String snakeCaseToLowerCamelCase(String snakeCase) { return snakeCaseToCamelCase(snakeCase, false); } /** * Converts a snake case string into upper camel case. * *

Some examples: * *

   *     snakeCaseToUpperCamelCase("foo_bar") => "FooBar"
   *     snakeCaseToUpperCamelCase("foo") => "Foo"
   * 
* * @param snakeCase the string in snake case to convert * @return the string converted to camel case, with an uppercase first character */ private static String snakeCaseToUpperCamelCase(String snakeCase) { return snakeCaseToCamelCase(snakeCase, true); } /** * Converts a snake case string into camel case. * *

For better readability, prefer calling either {@link #snakeCaseToLowerCamelCase(String)} or * {@link #snakeCaseToUpperCamelCase(String)}. * *

Some examples: * *

   *     snakeCaseToCamelCase("foo_bar", false) => "fooBar"
   *     snakeCaseToCamelCase("foo_bar", true) => "FooBar"
   *     snakeCaseToCamelCase("foo", false) => "foo"
   *     snakeCaseToCamelCase("foo", true) => "Foo"
   *     snakeCaseToCamelCase("Foo", false) => "foo"
   *     snakeCaseToCamelCase("fooBar", false) => "fooBar"
   * 
* *

This implementation of this method must exactly match the corresponding function in the * protocol compiler. Specifically, the {@code UnderscoresToCamelCase} function in {@code * src/google/protobuf/compiler/java/java_helpers.cc}. * * @param snakeCase the string in snake case to convert * @param capFirst true if the first letter of the returned string should be uppercase. false if * the first letter of the returned string should be lowercase. * @return the string converted to camel case, with an uppercase or lowercase first character * depending on if {@code capFirst} is true or false, respectively */ private static String snakeCaseToCamelCase(String snakeCase, boolean capFirst) { StringBuilder sb = new StringBuilder(snakeCase.length() + 1); boolean capNext = capFirst; for (int ctr = 0; ctr < snakeCase.length(); ctr++) { char next = snakeCase.charAt(ctr); if (next == '_') { capNext = true; } else if (Character.isDigit(next)) { sb.append(next); capNext = true; } else if (capNext) { sb.append(Character.toUpperCase(next)); capNext = false; } else if (ctr == 0) { sb.append(Character.toLowerCase(next)); } else { sb.append(next); } } return sb.toString(); } /** * Inspects the message to identify the stored type for a message field that is part of a oneof. */ private static Class getOneofStoredTypeForMessage(Class messageType, FieldDescriptor fd) { try { String name = fd.getType() == Type.GROUP ? fd.getMessageType().getName() : fd.getName(); Method getter = messageType.getDeclaredMethod(getterForField(name)); return getter.getReturnType(); } catch (Exception e) { throw new RuntimeException(e); } } /** Inspects the message to identify the message type of a repeated message field. */ private static Class getTypeForRepeatedMessageField(Class messageType, FieldDescriptor fd) { try { String name = fd.getType() == Type.GROUP ? fd.getMessageType().getName() : fd.getName(); Method getter = messageType.getDeclaredMethod(getterForField(name), int.class); return getter.getReturnType(); } catch (Exception e) { throw new RuntimeException(e); } } /** Constructs the name of the get method for the given field in the proto. */ private static String getterForField(String snakeCase) { String camelCase = snakeCaseToLowerCamelCase(snakeCase); StringBuilder builder = new StringBuilder("get"); // Capitalize the first character in the field name. builder.append(Character.toUpperCase(camelCase.charAt(0))); builder.append(camelCase.substring(1, camelCase.length())); return builder.toString(); } private static final class OneofState { private OneofInfo[] oneofs = new OneofInfo[2]; OneofInfo getOneof(Class messageType, OneofDescriptor desc) { int index = desc.getIndex(); if (index >= oneofs.length) { // Grow the array. oneofs = Arrays.copyOf(oneofs, index * 2); } OneofInfo info = oneofs[index]; if (info == null) { info = newInfo(messageType, desc); oneofs[index] = info; } return info; } private static OneofInfo newInfo(Class messageType, OneofDescriptor desc) { String camelCase = snakeCaseToLowerCamelCase(desc.getName()); String valueFieldName = camelCase + "_"; String caseFieldName = camelCase + "Case_"; return new OneofInfo( desc.getIndex(), field(messageType, caseFieldName), field(messageType, valueFieldName)); } } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy