# Copyright 2018 Google LLC # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # https://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import abc import enum from google.protobuf import message from google.protobuf import duration_pb2 from google.protobuf import timestamp_pb2 from google.protobuf import field_mask_pb2 from google.protobuf import struct_pb2 from google.protobuf import wrappers_pb2 from proto.marshal import compat from proto.marshal.collections import MapComposite from proto.marshal.collections import Repeated from proto.marshal.collections import RepeatedComposite from proto.marshal.rules import bytes as pb_bytes from proto.marshal.rules import stringy_numbers from proto.marshal.rules import dates from proto.marshal.rules import struct from proto.marshal.rules import wrappers from proto.marshal.rules import field_mask from proto.primitives import ProtoType class Rule(abc.ABC): """Abstract class definition for marshal rules.""" @classmethod def __subclasshook__(cls, C): if hasattr(C, "to_python") and hasattr(C, "to_proto"): return True return NotImplemented class BaseMarshal: """The base class to translate between protobuf and Python classes. Protocol buffers defines many common types (e.g. Timestamp, Duration) which also exist in the Python standard library. The marshal essentially translates between these: it keeps a registry of common protocol buffers and their Python representations, and translates back and forth. The protocol buffer class is always the "key" in this relationship; when presenting a message, the declared field types are used to determine whether a value should be transformed into another class. Similarly, when accepting a Python value (when setting a field, for example), the declared field type is still used. This means that, if appropriate, multiple protocol buffer types may use the same Python type. The primary implementation of this is :class:`Marshal`, which should usually be used instead of this class directly. """ def __init__(self): self._rules = {} self._noop = NoopRule() self.reset() def register(self, proto_type: type, rule: Rule = None): """Register a rule against the given ``proto_type``. This function expects a ``proto_type`` (the descriptor class) and a ``rule``; an object with a ``to_python`` and ``to_proto`` method. Each method should return the appropriate Python or protocol buffer type, and be idempotent (e.g. accept either type as input). This function can also be used as a decorator:: @marshal.register(timestamp_pb2.Timestamp) class TimestampRule: ... In this case, the class will be initialized for you with zero arguments. Args: proto_type (type): A protocol buffer message type. rule: A marshal object """ # If a rule was provided, register it and be done. if rule: # Ensure the rule implements Rule. if not isinstance(rule, Rule): raise TypeError( "Marshal rule instances must implement " "`to_proto` and `to_python` methods." ) # Register the rule. self._rules[proto_type] = rule return # Create an inner function that will register an instance of the # marshal class to this object's registry, and return it. def register_rule_class(rule_class: type): # Ensure the rule class is a valid rule. if not issubclass(rule_class, Rule): raise TypeError( "Marshal rule subclasses must implement " "`to_proto` and `to_python` methods." ) # Register the rule class. self._rules[proto_type] = rule_class() return rule_class return register_rule_class def reset(self): """Reset the registry to its initial state.""" self._rules.clear() # Register date and time wrappers. self.register(timestamp_pb2.Timestamp, dates.TimestampRule()) self.register(duration_pb2.Duration, dates.DurationRule()) # Register FieldMask wrappers. self.register(field_mask_pb2.FieldMask, field_mask.FieldMaskRule()) # Register nullable primitive wrappers. self.register(wrappers_pb2.BoolValue, wrappers.BoolValueRule()) self.register(wrappers_pb2.BytesValue, wrappers.BytesValueRule()) self.register(wrappers_pb2.DoubleValue, wrappers.DoubleValueRule()) self.register(wrappers_pb2.FloatValue, wrappers.FloatValueRule()) self.register(wrappers_pb2.Int32Value, wrappers.Int32ValueRule()) self.register(wrappers_pb2.Int64Value, wrappers.Int64ValueRule()) self.register(wrappers_pb2.StringValue, wrappers.StringValueRule()) self.register(wrappers_pb2.UInt32Value, wrappers.UInt32ValueRule()) self.register(wrappers_pb2.UInt64Value, wrappers.UInt64ValueRule()) # Register the google.protobuf.Struct wrappers. # # These are aware of the marshal that created them, because they # create RepeatedComposite and MapComposite instances directly and # need to pass the marshal to them. self.register(struct_pb2.Value, struct.ValueRule(marshal=self)) self.register(struct_pb2.ListValue, struct.ListValueRule(marshal=self)) self.register(struct_pb2.Struct, struct.StructRule(marshal=self)) # Special case for bytes to allow base64 encode/decode self.register(ProtoType.BYTES, pb_bytes.BytesRule()) # Special case for int64 from strings because of dict round trip. # See https://github.com/protocolbuffers/protobuf/issues/2679 for rule_class in stringy_numbers.STRINGY_NUMBER_RULES: self.register(rule_class._proto_type, rule_class()) def get_rule(self, proto_type): # Rules are needed to convert values between proto-plus and pb. # Retrieve the rule for the specified proto type. # The NoopRule will be used when a rule is not found. rule = self._rules.get(proto_type, self._noop) # If we don't find a rule, also check under `_instances` # in case there is a rule in another package. # See https://github.com/googleapis/proto-plus-python/issues/349 if rule == self._noop and hasattr(self, "_instances"): for _, instance in self._instances.items(): rule = instance._rules.get(proto_type, self._noop) if rule != self._noop: break return rule def to_python(self, proto_type, value, *, absent: bool = None): # Internal protobuf has its own special type for lists of values. # Return a view around it that implements MutableSequence. value_type = type(value) # Minor performance boost over isinstance if value_type in compat.repeated_composite_types: return RepeatedComposite(value, marshal=self) if value_type in compat.repeated_scalar_types: if isinstance(proto_type, type): return RepeatedComposite(value, marshal=self, proto_type=proto_type) else: return Repeated(value, marshal=self) # Same thing for maps of messages. # See https://github.com/protocolbuffers/protobuf/issues/16596 # We need to look up the name of the type in compat.map_composite_type_names # as class `MessageMapContainer` is no longer exposed # This is done to avoid taking a breaking change in proto-plus. if ( value_type in compat.map_composite_types or value_type.__name__ in compat.map_composite_type_names ): return MapComposite(value, marshal=self) return self.get_rule(proto_type=proto_type).to_python(value, absent=absent) def to_proto(self, proto_type, value, *, strict: bool = False): # The protos in google/protobuf/struct.proto are exceptional cases, # because they can and should represent themselves as lists and dicts. # These cases are handled in their rule classes. if proto_type not in ( struct_pb2.Value, struct_pb2.ListValue, struct_pb2.Struct, ): # For our repeated and map view objects, simply return the # underlying pb. if isinstance(value, (Repeated, MapComposite)): return value.pb # Convert lists and tuples recursively. if isinstance(value, (list, tuple)): return type(value)(self.to_proto(proto_type, i) for i in value) # Convert dictionaries recursively when the proto type is a map. # This is slightly more complicated than converting a list or tuple # because we have to step through the magic that protocol buffers does. # # Essentially, a type of map will show up here as # a FoosEntry with a `key` field, `value` field, and a `map_entry` # annotation. We need to do the conversion based on the `value` # field's type. if isinstance(value, dict) and ( proto_type.DESCRIPTOR.has_options and proto_type.DESCRIPTOR.GetOptions().map_entry ): recursive_type = type(proto_type().value) return {k: self.to_proto(recursive_type, v) for k, v in value.items()} pb_value = self.get_rule(proto_type=proto_type).to_proto(value) # Sanity check: If we are in strict mode, did we get the value we want? if strict and not isinstance(pb_value, proto_type): raise TypeError( "Parameter must be instance of the same class; " "expected {expected}, got {got}".format( expected=proto_type.__name__, got=pb_value.__class__.__name__, ), ) # Return the final value. return pb_value class Marshal(BaseMarshal): """The translator between protocol buffer and Python instances. The bulk of the implementation is in :class:`BaseMarshal`. This class adds identity tracking: multiple instantiations of :class:`Marshal` with the same name will provide the same instance. """ _instances = {} def __new__(cls, *, name: str): """Create a marshal instance. Args: name (str): The name of the marshal. Instantiating multiple marshals with the same ``name`` argument will provide the same marshal each time. """ klass = cls._instances.get(name) if klass is None: klass = cls._instances[name] = super().__new__(cls) return klass def __init__(self, *, name: str): """Instantiate a marshal. Args: name (str): The name of the marshal. Instantiating multiple marshals with the same ``name`` argument will provide the same marshal each time. """ self._name = name if not hasattr(self, "_rules"): super().__init__() class NoopRule: """A catch-all rule that does nothing.""" def to_python(self, pb_value, *, absent: bool = None): return pb_value def to_proto(self, value): return value __all__ = ("Marshal",)