예제 #1
0
def GroupDecoder(field_number, is_repeated, is_packed, key, new_default):
    """Returns a decoder for a group field.

    Args:
      field_number: field number used to build the group's start/end tags.
      is_repeated: when true, the returned decoder calls ``value.add()`` for
        each group it reads; otherwise it parses into a single sub-message.
      is_packed: must be false (asserted).
      key: key under which the field's value lives in ``field_dict``.
      new_default: callable invoked as ``new_default(message)`` to create the
        value stored under ``key`` when the field is not present yet.

    Returns:
      A function ``(buffer, pos, end, message, field_dict)`` that returns the
      position just past the data it consumed and raises ``_DecodeError``
      when a group's end tag is missing.
    """

    end_tag_bytes = encoder.TagBytes(field_number,
                                     wire_format.WIRETYPE_END_GROUP)
    end_tag_len = len(end_tag_bytes)

    assert not is_packed
    if is_repeated:
        tag_bytes = encoder.TagBytes(field_number,
                                     wire_format.WIRETYPE_START_GROUP)
        tag_len = len(tag_bytes)

        def DecodeRepeatedField(buffer, pos, end, message, field_dict):
            # The container is looked up (or created) once; it does not need
            # to be fetched again on every loop iteration.
            value = field_dict.get(key)
            if value is None:
                value = field_dict.setdefault(key, new_default(message))
            while 1:
                # Read sub-message.
                pos = value.add()._InternalParse(buffer, pos, end)
                # Read end tag.
                new_pos = pos + end_tag_len
                if buffer[pos:new_pos] != end_tag_bytes or new_pos > end:
                    raise _DecodeError('Missing group end tag.')
                # Predict that the next tag is another copy of the same repeated field.
                pos = new_pos + tag_len
                if buffer[new_pos:pos] != tag_bytes or new_pos == end:
                    # Prediction failed.  Return.
                    return new_pos

        return DecodeRepeatedField
    else:

        def DecodeField(buffer, pos, end, message, field_dict):
            value = field_dict.get(key)
            if value is None:
                value = field_dict.setdefault(key, new_default(message))
            # Read sub-message.
            pos = value._InternalParse(buffer, pos, end)
            # Read end tag.
            new_pos = pos + end_tag_len
            if buffer[pos:new_pos] != end_tag_bytes or new_pos > end:
                raise _DecodeError('Missing group end tag.')
            return new_pos

        return DecodeField
예제 #2
0
        def DecodeField(buffer, pos, end, message, field_dict):
            """Decode one serialized enum value and return the new position.

            A number present in ``enum_type.values_by_number`` is stored in
            ``field_dict[key]``.  Any other number is recorded on ``message``
            instead: its raw bytes go to ``_unknown_fields`` and the decoded
            number goes to ``_unknown_field_set``.

            Args:
              buffer: memoryview of the serialized bytes.
              pos: int, position in the memory view to start at.
              end: int, end position of serialized data
              message: Message object to store unknown fields in
              field_dict: Map[Descriptor, Any] to store decoded values in.

            Returns:
              int, new position in serialized data.

            Raises:
              _DecodeError: if the varint runs past ``end``.
            """
            start = pos
            (number, pos) = _DecodeSignedVarint32(buffer, pos)
            if end < pos:
                raise _DecodeError('Truncated message.')
            # pylint: disable=protected-access
            if number in enum_type.values_by_number:
                field_dict[key] = number
                return pos

            # Unrecognized number: keep it as an unknown field.
            if not message._unknown_fields:
                message._unknown_fields = []
            varint_tag = encoder.TagBytes(field_number,
                                          wire_format.WIRETYPE_VARINT)
            raw_value = buffer[start:pos].tobytes()
            message._unknown_fields.append((varint_tag, raw_value))
            if message._unknown_field_set is None:
                message._unknown_field_set = containers.UnknownFieldSet()
            message._unknown_field_set._add(
                field_number, wire_format.WIRETYPE_VARINT, number)
            # pylint: enable=protected-access
            return pos
예제 #3
0
    def SpecificDecoder(field_number, is_repeated, is_packed, key,
                        new_default):
        """Build the decoder closure matching the field's cardinality.

        ``decode_value`` and ``wire_type`` are taken from the enclosing scope,
        which is not part of this block.

        Args:
          field_number: field number used to build the repeated-field tag.
          is_repeated: select the unpacked repeated decoder.
          is_packed: select the packed decoder (checked before is_repeated).
          key: key under which the value is stored in ``field_dict``.
          new_default: callable invoked as ``new_default(message)`` to create
            the container when ``key`` is absent from ``field_dict``.

        Returns:
          A function ``(buffer, pos, end, message, field_dict)`` returning the
          position after the decoded data.
        """
        if is_packed:
            read_varint = _DecodeVarint

            def DecodePackedField(buffer, pos, end, message, field_dict):
                elements = field_dict.get(key)
                if elements is None:
                    elements = field_dict.setdefault(key,
                                                     new_default(message))
                # The payload starts with its length as a varint.
                (length, pos) = read_varint(buffer, pos)
                limit = length + pos
                if limit > end:
                    raise _DecodeError('Truncated message.')
                while pos < limit:
                    (item, pos) = decode_value(buffer, pos)
                    elements.append(item)
                if pos > limit:
                    # The last element ran past the payload; drop it.
                    del elements[-1]
                    raise _DecodeError('Packed element was truncated.')
                return pos

            return DecodePackedField

        if is_repeated:
            tag_bytes = encoder.TagBytes(field_number, wire_type)
            tag_len = len(tag_bytes)

            def DecodeRepeatedField(buffer, pos, end, message, field_dict):
                elements = field_dict.get(key)
                if elements is None:
                    elements = field_dict.setdefault(key,
                                                     new_default(message))
                while True:
                    (item, after) = decode_value(buffer, pos)
                    elements.append(item)
                    # Guess that the same field's tag follows immediately.
                    pos = after + tag_len
                    next_tag = buffer[after:pos]
                    if next_tag != tag_bytes or after >= end:
                        # Guess was wrong (or input exhausted): stop here.
                        if after > end:
                            raise _DecodeError('Truncated message.')
                        return after

            return DecodeRepeatedField

        def DecodeField(buffer, pos, end, message, field_dict):
            (decoded, pos) = decode_value(buffer, pos)
            field_dict[key] = decoded
            if pos > end:
                # The value ran past the end of the data; do not keep it.
                del field_dict[key]
                raise _DecodeError('Truncated message.')
            return pos

        return DecodeField
예제 #4
0
def MessageDecoder(field_number, is_repeated, is_packed, key, new_default):
    """Returns a decoder for a message field.

    The returned function has the signature
    ``(buffer, pos, end, message, field_dict)``; it reads a varint length,
    parses that many bytes as a sub-message and returns the position after it.
    ``is_packed`` must be false.
    """

    read_varint = _DecodeVarint

    assert not is_packed
    if not is_repeated:

        def DecodeField(buffer, pos, end, message, field_dict):
            submessage = field_dict.get(key)
            if submessage is None:
                submessage = field_dict.setdefault(key, new_default(message))
            # Length prefix first.
            (size, pos) = read_varint(buffer, pos)
            limit = pos + size
            if limit > end:
                raise _DecodeError('Truncated message.')
            # Then the sub-message body.
            stopped_at = submessage._InternalParse(buffer, pos, limit)
            if stopped_at != limit:
                # _InternalParse only stops early when it meets an end-group
                # tag.
                raise _DecodeError('Unexpected end-group tag.')
            return limit

        return DecodeField

    tag_bytes = encoder.TagBytes(field_number,
                                 wire_format.WIRETYPE_LENGTH_DELIMITED)
    tag_len = len(tag_bytes)

    def DecodeRepeatedField(buffer, pos, end, message, field_dict):
        container = field_dict.get(key)
        if container is None:
            container = field_dict.setdefault(key, new_default(message))
        while True:
            # Length prefix first.
            (size, pos) = read_varint(buffer, pos)
            limit = pos + size
            if limit > end:
                raise _DecodeError('Truncated message.')
            # Then the sub-message body, parsed into a freshly added element.
            stopped_at = container.add()._InternalParse(buffer, pos, limit)
            if stopped_at != limit:
                # _InternalParse only stops early when it meets an end-group
                # tag.
                raise _DecodeError('Unexpected end-group tag.')
            # Guess that the same field's tag follows immediately.
            pos = limit + tag_len
            if buffer[limit:pos] != tag_bytes or limit == end:
                # Guess was wrong: hand control back to the caller.
                return limit

    return DecodeRepeatedField
예제 #5
0
        def DecodePackedField(buffer, pos, end, message, field_dict):
            """Decode a packed run of enum values and return the new position.

            Numbers present in ``enum_type.values_by_number`` are appended to
            the container stored under ``key``; other numbers are recorded in
            the message's unknown-field containers.

            Args:
              buffer: memoryview of the serialized bytes.
              pos: int, position in the memory view to start at.
              end: int, end position of serialized data
              message: Message object to store unknown fields in
              field_dict: Map[Descriptor, Any] to store decoded values in.

            Returns:
              int, new position in serialized data.

            Raises:
              _DecodeError: if the payload extends past ``end`` or the last
                element extends past the payload.
            """
            known_values = field_dict.get(key)
            if known_values is None:
                known_values = field_dict.setdefault(key,
                                                     new_default(message))
            (payload_len, pos) = local_DecodeVarint(buffer, pos)
            limit = payload_len + pos
            if limit > end:
                raise _DecodeError('Truncated message.')
            # pylint: disable=protected-access
            while pos < limit:
                start = pos
                (number, pos) = _DecodeSignedVarint32(buffer, pos)
                if number in enum_type.values_by_number:
                    known_values.append(number)
                    continue
                # Unrecognized number: keep it as an unknown field.
                if not message._unknown_fields:
                    message._unknown_fields = []
                varint_tag = encoder.TagBytes(field_number,
                                              wire_format.WIRETYPE_VARINT)
                message._unknown_fields.append(
                    (varint_tag, buffer[start:pos].tobytes()))
                if message._unknown_field_set is None:
                    message._unknown_field_set = containers.UnknownFieldSet()
                message._unknown_field_set._add(
                    field_number, wire_format.WIRETYPE_VARINT, number)
            if pos <= limit:
                return pos
            # The last element ran past the payload: undo whichever record
            # was made for it before reporting the error.
            if number in enum_type.values_by_number:
                del known_values[-1]
            else:
                del message._unknown_fields[-1]
                del message._unknown_field_set._values[-1]
            # pylint: enable=protected-access
            raise _DecodeError('Packed element was truncated.')
예제 #6
0
def MapDecoder(field_descriptor, new_default, is_message_map):
    """Returns a decoder for a map field.

    Each entry is read as a length-delimited sub-message exposing ``key`` and
    ``value``; the pair is then written into the map stored in ``field_dict``
    under ``field_descriptor``.  When ``is_message_map`` is true the value is
    copied into the map slot with ``CopyFrom`` instead of being assigned.
    """

    key = field_descriptor
    read_varint = _DecodeVarint
    entry_tag = encoder.TagBytes(field_descriptor.number,
                                 wire_format.WIRETYPE_LENGTH_DELIMITED)
    entry_tag_len = len(entry_tag)
    # Keep only the descriptor for now: _concrete_class might not be
    # initialized yet, so it is read when decoding starts.
    message_type = field_descriptor.message_type

    def DecodeMap(buffer, pos, end, message, field_dict):
        # One scratch entry message is reused for every entry in this run.
        entry = message_type._concrete_class()
        mapping = field_dict.get(key)
        if mapping is None:
            mapping = field_dict.setdefault(key, new_default(message))
        while True:
            # Length prefix first.
            (size, pos) = read_varint(buffer, pos)
            entry_end = pos + size
            if entry_end > end:
                raise _DecodeError('Truncated message.')
            # Then the entry body.
            entry.Clear()
            stopped_at = entry._InternalParse(buffer, pos, entry_end)
            if stopped_at != entry_end:
                # _InternalParse only stops early when it meets an end-group
                # tag.
                raise _DecodeError('Unexpected end-group tag.')

            if is_message_map:
                mapping[entry.key].CopyFrom(entry.value)
            else:
                mapping[entry.key] = entry.value

            # Guess that another entry of the same field follows immediately.
            pos = entry_end + entry_tag_len
            if buffer[entry_end:pos] != entry_tag or entry_end == end:
                # Guess was wrong: hand control back to the caller.
                return entry_end

    return DecodeMap
예제 #7
0
def BytesDecoder(field_number, is_repeated, is_packed, key, new_default):
    """Returns a decoder for a bytes field.

    The returned function has the signature
    ``(buffer, pos, end, message, field_dict)``; it reads a varint length,
    copies that many bytes out of ``buffer`` and returns the position after
    them.  ``is_packed`` must be false.
    """

    read_varint = _DecodeVarint

    assert not is_packed
    if not is_repeated:

        def DecodeField(buffer, pos, end, message, field_dict):
            (size, pos) = read_varint(buffer, pos)
            limit = pos + size
            if limit > end:
                raise _DecodeError('Truncated string.')
            payload = buffer[pos:limit]
            field_dict[key] = payload.tobytes()
            return limit

        return DecodeField

    tag_bytes = encoder.TagBytes(field_number,
                                 wire_format.WIRETYPE_LENGTH_DELIMITED)
    tag_len = len(tag_bytes)

    def DecodeRepeatedField(buffer, pos, end, message, field_dict):
        chunks = field_dict.get(key)
        if chunks is None:
            chunks = field_dict.setdefault(key, new_default(message))
        while True:
            (size, pos) = read_varint(buffer, pos)
            limit = pos + size
            if limit > end:
                raise _DecodeError('Truncated string.')
            payload = buffer[pos:limit]
            chunks.append(payload.tobytes())
            # Guess that the same field's tag follows immediately.
            pos = limit + tag_len
            if buffer[limit:pos] != tag_bytes or limit == end:
                # Guess was wrong: hand control back to the caller.
                return limit

    return DecodeRepeatedField
예제 #8
0
def MessageSetItemDecoder(descriptor):
    """Returns a decoder for a MessageSet item.

    The parameter is the message Descriptor (it is not read by this
    function).

    The message set message looks like this:
      message MessageSet {
        repeated group Item = 1 {
          required int32 type_id = 2;
          required string message = 3;
        }
      }

    Returns:
      A function ``(buffer, pos, end, message, field_dict)`` that consumes one
      item up to and including its end-group tag and returns the new position.
    """

    type_id_tag_bytes = encoder.TagBytes(2, wire_format.WIRETYPE_VARINT)
    message_tag_bytes = encoder.TagBytes(3,
                                         wire_format.WIRETYPE_LENGTH_DELIMITED)
    item_end_tag_bytes = encoder.TagBytes(1, wire_format.WIRETYPE_END_GROUP)

    # Bound to locals so the decoding loop below uses closure lookups.
    local_ReadTag = ReadTag
    local_DecodeVarint = _DecodeVarint
    local_SkipField = SkipField

    def DecodeItem(buffer, pos, end, message, field_dict):
        """Decode serialized message set to its value and new position.

        Args:
          buffer: memoryview of the serialized bytes.
          pos: int, position in the memory view to start at.
          end: int, end position of serialized data
          message: Message object to store unknown fields in
          field_dict: Map[Descriptor, Any] to store decoded values in.

        Returns:
          int, new position in serialized data.

        Raises:
          _DecodeError: if the item is truncated, lacks its type_id or
            message, lacks its group end tag, or the embedded message stops
            parsing before its declared end.
        """
        message_set_item_start = pos
        # -1 marks "not seen yet" for the three values collected by the loop.
        type_id = -1
        message_start = -1
        message_end = -1

        # Technically, type_id and message can appear in any order, so we need
        # a little loop here.
        while 1:
            (tag_bytes, pos) = local_ReadTag(buffer, pos)
            if tag_bytes == type_id_tag_bytes:
                (type_id, pos) = local_DecodeVarint(buffer, pos)
            elif tag_bytes == message_tag_bytes:
                # Remember where the payload sits; it is parsed after the
                # loop, once the type_id is known.
                (size, message_start) = local_DecodeVarint(buffer, pos)
                pos = message_end = message_start + size
            elif tag_bytes == item_end_tag_bytes:
                break
            else:
                pos = local_SkipField(buffer, pos, end, tag_bytes)
                if pos == -1:
                    raise _DecodeError('Missing group end tag.')

        if pos > end:
            raise _DecodeError('Truncated message.')

        if type_id == -1:
            raise _DecodeError('MessageSet item missing type_id.')
        if message_start == -1:
            raise _DecodeError('MessageSet item missing message.')

        extension = message.Extensions._FindExtensionByNumber(type_id)
        # pylint: disable=protected-access
        if extension is not None:
            value = field_dict.get(extension)
            if value is None:
                value = field_dict.setdefault(
                    extension, extension.message_type._concrete_class())
            if value._InternalParse(buffer, message_start,
                                    message_end) != message_end:
                # The only reason _InternalParse would return early is if it encountered
                # an end-group tag.
                raise _DecodeError('Unexpected end-group tag.')
        else:
            # No extension is registered for this type_id: keep the raw item
            # bytes and the payload as unknown fields.
            if not message._unknown_fields:
                message._unknown_fields = []
            message._unknown_fields.append(
                (MESSAGE_SET_ITEM_TAG,
                 buffer[message_set_item_start:pos].tobytes()))
            if message._unknown_field_set is None:
                message._unknown_field_set = containers.UnknownFieldSet()
            message._unknown_field_set._add(
                type_id, wire_format.WIRETYPE_LENGTH_DELIMITED,
                buffer[message_start:message_end].tobytes())
            # pylint: enable=protected-access

        return pos

    return DecodeItem
예제 #9
0
def StringDecoder(field_number,
                  is_repeated,
                  is_packed,
                  key,
                  new_default,
                  is_strict_utf8=False):
    """Returns a decoder for a string field.

    Args:
      field_number: field number used to build the repeated-field tag.
      is_repeated: select the repeated decoder instead of the singular one.
      is_packed: must be false (asserted).
      key: key under which the value is stored in ``field_dict``; its
        ``full_name`` is used in error messages.
      new_default: callable invoked as ``new_default(message)`` to create the
        container when ``key`` is absent from ``field_dict``.
      is_strict_utf8: when true, also reject surrogates; the check only runs
        on Python 2 builds whose ``sys.maxunicode`` exceeds
        ``_UCS2_MAXUNICODE``.

    Returns:
      A function ``(buffer, pos, end, message, field_dict)`` returning the
      position after the decoded string.
    """

    local_DecodeVarint = _DecodeVarint
    local_unicode = six.text_type

    def _ConvertToUnicode(memview):
        """Convert byte to unicode."""
        byte_str = memview.tobytes()
        try:
            value = local_unicode(byte_str, 'utf-8')
        except UnicodeDecodeError as e:
            # add more information to the error message and re-raise it.
            e.reason = '%s in field: %s' % (e, key.full_name)
            raise

        if is_strict_utf8 and six.PY2 and sys.maxunicode > _UCS2_MAXUNICODE:
            # Only do the check for python2 ucs4 when is_strict_utf8 enabled
            if _SURROGATE_PATTERN.search(value):
                # Adjacent literals are joined with nothing in between, so
                # each piece carries its own trailing space.
                reason = (
                    'String field %s contains invalid UTF-8 data when parsing '
                    'a protocol buffer: surrogates not allowed. Use '
                    'the bytes type if you intend to send raw bytes.') % (
                        key.full_name)
                # NOTE(review): `message` is not a local of this closure, so
                # it presumably resolves to a module-level `message` import
                # -- confirm.
                raise message.DecodeError(reason)

        return value

    assert not is_packed
    if is_repeated:
        tag_bytes = encoder.TagBytes(field_number,
                                     wire_format.WIRETYPE_LENGTH_DELIMITED)
        tag_len = len(tag_bytes)

        def DecodeRepeatedField(buffer, pos, end, message, field_dict):
            value = field_dict.get(key)
            if value is None:
                value = field_dict.setdefault(key, new_default(message))
            while 1:
                (size, pos) = local_DecodeVarint(buffer, pos)
                new_pos = pos + size
                if new_pos > end:
                    raise _DecodeError('Truncated string.')
                value.append(_ConvertToUnicode(buffer[pos:new_pos]))
                # Predict that the next tag is another copy of the same repeated field.
                pos = new_pos + tag_len
                if buffer[new_pos:pos] != tag_bytes or new_pos == end:
                    # Prediction failed.  Return.
                    return new_pos

        return DecodeRepeatedField
    else:

        def DecodeField(buffer, pos, end, message, field_dict):
            (size, pos) = local_DecodeVarint(buffer, pos)
            new_pos = pos + size
            if new_pos > end:
                raise _DecodeError('Truncated string.')
            field_dict[key] = _ConvertToUnicode(buffer[pos:new_pos])
            return new_pos

        return DecodeField
예제 #10
0
def EnumDecoder(field_number, is_repeated, is_packed, key, new_default):
    """Returns a decoder for an enum field.

    Numbers present in ``key.enum_type.values_by_number`` are stored as field
    values.  Any other number is recorded on the message instead: its raw
    bytes go to ``_unknown_fields`` and the decoded number goes to
    ``_unknown_field_set``.

    Args:
      field_number: field number used to build the varint tag.
      is_repeated: select the unpacked repeated decoder.
      is_packed: select the packed decoder (checked before is_repeated).
      key: field key for ``field_dict``; must expose ``enum_type``.
      new_default: callable invoked as ``new_default(message)`` to create the
        container when ``key`` is absent from ``field_dict``.

    Returns:
      A function ``(buffer, pos, end, message, field_dict)`` returning the
      position after the decoded data.
    """
    enum_type = key.enum_type
    # The tag depends only on the field number, so it is built once here
    # rather than for every unknown value encountered while decoding.
    tag_bytes = encoder.TagBytes(field_number, wire_format.WIRETYPE_VARINT)
    if is_packed:
        local_DecodeVarint = _DecodeVarint

        def DecodePackedField(buffer, pos, end, message, field_dict):
            """Decode serialized packed enum to its value and a new position.

            Args:
              buffer: memoryview of the serialized bytes.
              pos: int, position in the memory view to start at.
              end: int, end position of serialized data
              message: Message object to store unknown fields in
              field_dict: Map[Descriptor, Any] to store decoded values in.

            Returns:
              int, new position in serialized data.
            """
            value = field_dict.get(key)
            if value is None:
                value = field_dict.setdefault(key, new_default(message))
            (endpoint, pos) = local_DecodeVarint(buffer, pos)
            endpoint += pos
            if endpoint > end:
                raise _DecodeError('Truncated message.')
            while pos < endpoint:
                value_start_pos = pos
                (element, pos) = _DecodeSignedVarint32(buffer, pos)
                # pylint: disable=protected-access
                if element in enum_type.values_by_number:
                    value.append(element)
                else:
                    if not message._unknown_fields:
                        message._unknown_fields = []
                    message._unknown_fields.append(
                        (tag_bytes, buffer[value_start_pos:pos].tobytes()))
                    if message._unknown_field_set is None:
                        message._unknown_field_set = containers.UnknownFieldSet(
                        )
                    message._unknown_field_set._add(
                        field_number, wire_format.WIRETYPE_VARINT, element)
                    # pylint: enable=protected-access
            if pos > endpoint:
                # The last element ran past the packed payload: undo whichever
                # record was made for it before reporting the error.
                if element in enum_type.values_by_number:
                    del value[-1]  # Discard corrupt value.
                else:
                    del message._unknown_fields[-1]
                    # pylint: disable=protected-access
                    del message._unknown_field_set._values[-1]
                    # pylint: enable=protected-access
                raise _DecodeError('Packed element was truncated.')
            return pos

        return DecodePackedField
    elif is_repeated:
        tag_len = len(tag_bytes)

        def DecodeRepeatedField(buffer, pos, end, message, field_dict):
            """Decode serialized repeated enum to its value and a new position.

            Args:
              buffer: memoryview of the serialized bytes.
              pos: int, position in the memory view to start at.
              end: int, end position of serialized data
              message: Message object to store unknown fields in
              field_dict: Map[Descriptor, Any] to store decoded values in.

            Returns:
              int, new position in serialized data.
            """
            value = field_dict.get(key)
            if value is None:
                value = field_dict.setdefault(key, new_default(message))
            while 1:
                (element, new_pos) = _DecodeSignedVarint32(buffer, pos)
                # pylint: disable=protected-access
                if element in enum_type.values_by_number:
                    value.append(element)
                else:
                    if not message._unknown_fields:
                        message._unknown_fields = []
                    message._unknown_fields.append(
                        (tag_bytes, buffer[pos:new_pos].tobytes()))
                    if message._unknown_field_set is None:
                        message._unknown_field_set = containers.UnknownFieldSet(
                        )
                    message._unknown_field_set._add(
                        field_number, wire_format.WIRETYPE_VARINT, element)
                # pylint: enable=protected-access
                # Predict that the next tag is another copy of the same repeated
                # field.
                pos = new_pos + tag_len
                if buffer[new_pos:pos] != tag_bytes or new_pos >= end:
                    # Prediction failed.  Return.
                    if new_pos > end:
                        raise _DecodeError('Truncated message.')
                    return new_pos

        return DecodeRepeatedField
    else:

        def DecodeField(buffer, pos, end, message, field_dict):
            """Decode serialized singular enum to its value and a new position.

            Args:
              buffer: memoryview of the serialized bytes.
              pos: int, position in the memory view to start at.
              end: int, end position of serialized data
              message: Message object to store unknown fields in
              field_dict: Map[Descriptor, Any] to store decoded values in.

            Returns:
              int, new position in serialized data.
            """
            value_start_pos = pos
            (enum_value, pos) = _DecodeSignedVarint32(buffer, pos)
            if pos > end:
                raise _DecodeError('Truncated message.')
            # pylint: disable=protected-access
            if enum_value in enum_type.values_by_number:
                field_dict[key] = enum_value
            else:
                if not message._unknown_fields:
                    message._unknown_fields = []
                message._unknown_fields.append(
                    (tag_bytes, buffer[value_start_pos:pos].tobytes()))
                if message._unknown_field_set is None:
                    message._unknown_field_set = containers.UnknownFieldSet()
                message._unknown_field_set._add(field_number,
                                                wire_format.WIRETYPE_VARINT,
                                                enum_value)
                # pylint: enable=protected-access
            return pos

        return DecodeField
예제 #11
0
            new_pos = pos + size
            if new_pos > end:
                raise _DecodeError('Truncated message.')
            # Read sub-message.
            if value._InternalParse(buffer, pos, new_pos) != new_pos:
                # The only reason _InternalParse would return early is if it encountered
                # an end-group tag.
                raise _DecodeError('Unexpected end-group tag.')
            return new_pos

        return DecodeField


# --------------------------------------------------------------------

# Pre-encoded tag for field number 1 with the START_GROUP wire type, i.e. the
# tag of `repeated group Item = 1` in the MessageSet layout described in the
# MessageSetItemDecoder docstring.
MESSAGE_SET_ITEM_TAG = encoder.TagBytes(1, wire_format.WIRETYPE_START_GROUP)


def MessageSetItemDecoder(descriptor):
    """Returns a decoder for a MessageSet item.

  The parameter is the message Descriptor.

  The message set message looks like this:
    message MessageSet {
      repeated group Item = 1 {
        required int32 type_id = 2;
        required string message = 3;
      }
    }
  """