python/google/protobuf/internal/input_stream.py - platform/external/protobuf - Git at Google

 # Protocol Buffers - Google's data interchange format
 # Copyright 2008 Google Inc.  All rights reserved.
 # http://code.google.com/p/protobuf/
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google Inc. nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 """InputStream is the primitive interface for reading bits from the wire.

 All protocol buffer deserialization can be expressed in terms of
 the InputStream primitives provided here.
 """

 __author__ = 'robinson@google.com (Will Robinson)'

 import array
 import struct
 from google.protobuf import message
 from google.protobuf.internal import wire_format


 # Note that much of this code is ported from //net/proto/ProtocolBuffer, and
 # that the interface is strongly inspired by CodedInputStream from the C++
 # proto2 implementation.


 class InputStreamBuffer(object):

   """Contains all logic for reading bits, and dealing with stream position.

   If an InputStream method ever raises an exception, the stream is left
   in an indeterminate state and is not safe for further use.
   """

   def __init__(self, s):
     # What we really want is something like array('B', s), where elements we
     # read from the array are already given to us as one-byte integers.  BUT
     # using array() instead of buffer() would force full string copies to result
     # from each GetSubBuffer() call.
     #
     # So, if the N serialized bytes of a single protocol buffer object are
     # split evenly between 2 child messages, and so on recursively, using
     # array('B', s) instead of buffer() would incur an additional N*logN bytes
     # copied during deserialization.
     #
     # The higher constant overhead of having to ord() for every byte we read
     # from the buffer in _ReadVarintHelper() could definitely lead to worse
     # performance in many real-world scenarios, even if the asymptotic
     # complexity is better.  However, our real answer is that the mythical
     # Python/C extension module output mode for the protocol compiler will
     # be blazing-fast and will eliminate most use of this class anyway.
     self._buffer = buffer(s)
     self._pos = 0

   def EndOfStream(self):
     """Returns true iff we're at the end of the stream.
     If this returns true, then a call to any other InputStream method
     will raise an exception.
     """
     return self._pos >= len(self._buffer)

   def Position(self):
     """Returns the current position in the stream, or equivalently, the
     number of bytes read so far.
     """
     return self._pos

   def GetSubBuffer(self, size=None):
     """Returns a sequence-like object that represents a portion of our
     underlying sequence.

     Position 0 in the returned object corresponds to self.Position()
     in this stream.

     If size is specified, then the returned object ends after the
     next "size" bytes in this stream.  If size is not specified,
     then the returned object ends at the end of this stream.

     We guarantee that the returned object R supports the Python buffer
     interface (and thus that the call buffer(R) will work).

     Note that the returned buffer is read-only.

     The intended use for this method is for nested-message and nested-group
     deserialization, where we want to make a recursive MergeFromString()
     call on the portion of the original sequence that contains the serialized
     nested message.  (And we'd like to do so without making unnecessary string
     copies).

     REQUIRES: size is nonnegative.
     """
     # Note that buffer() doesn't perform any actual string copy.
     if size is None:
       return buffer(self._buffer, self._pos)
     else:
       if size < 0:
         raise message.DecodeError('Negative size %d' % size)
       return buffer(self._buffer, self._pos, size)

   def SkipBytes(self, num_bytes):
     """Skip num_bytes bytes ahead, or go to the end of the stream, whichever
     comes first.

     REQUIRES: num_bytes is nonnegative.
     """
     if num_bytes < 0:
       raise message.DecodeError('Negative num_bytes %d' % num_bytes)
     self._pos += num_bytes
     self._pos = min(self._pos, len(self._buffer))

   def ReadBytes(self, size):
     """Reads up to 'size' bytes from the stream, stopping early
     only if we reach the end of the stream.  Returns the bytes read
     as a string.
     """
     if size < 0:
       raise message.DecodeError('Negative size %d' % size)
     s = (self._buffer[self._pos : self._pos + size])
     self._pos += len(s)  # Only advance by the number of bytes actually read.
     return s

   def ReadLittleEndian32(self):
     """Interprets the next 4 bytes of the stream as a little-endian
     encoded, unsiged 32-bit integer, and returns that integer.
     """
     try:
       i = struct.unpack(wire_format.FORMAT_UINT32_LITTLE_ENDIAN,
                         self._buffer[self._pos : self._pos + 4])
       self._pos += 4
       return i[0]  # unpack() result is a 1-element tuple.
     except struct.error, e:
       raise message.DecodeError(e)

   def ReadLittleEndian64(self):
     """Interprets the next 8 bytes of the stream as a little-endian
     encoded, unsiged 64-bit integer, and returns that integer.
     """
     try:
       i = struct.unpack(wire_format.FORMAT_UINT64_LITTLE_ENDIAN,
                         self._buffer[self._pos : self._pos + 8])
       self._pos += 8
       return i[0]  # unpack() result is a 1-element tuple.
     except struct.error, e:
       raise message.DecodeError(e)

   def ReadVarint32(self):
     """Reads a varint from the stream, interprets this varint
     as a signed, 32-bit integer, and returns the integer.
     """
     i = self.ReadVarint64()
     if not wire_format.INT32_MIN <= i <= wire_format.INT32_MAX:
       raise message.DecodeError('Value out of range for int32: %d' % i)
     return int(i)

   def ReadVarUInt32(self):
     """Reads a varint from the stream, interprets this varint
     as an unsigned, 32-bit integer, and returns the integer.
     """
     i = self.ReadVarUInt64()
     if i > wire_format.UINT32_MAX:
       raise message.DecodeError('Value out of range for uint32: %d' % i)
     return i

   def ReadVarint64(self):
     """Reads a varint from the stream, interprets this varint
     as a signed, 64-bit integer, and returns the integer.
     """
     i = self.ReadVarUInt64()
     if i > wire_format.INT64_MAX:
       i -= (1 << 64)
     return i

   def ReadVarUInt64(self):
     """Reads a varint from the stream, interprets this varint
     as an unsigned, 64-bit integer, and returns the integer.
     """
     i = self._ReadVarintHelper()
     if not 0 <= i <= wire_format.UINT64_MAX:
       raise message.DecodeError('Value out of range for uint64: %d' % i)
     return i

   def _ReadVarintHelper(self):
     """Helper for the various varint-reading methods above.
     Reads an unsigned, varint-encoded integer from the stream and
     returns this integer.

     Does no bounds checking except to ensure that we read at most as many bytes
     as could possibly be present in a varint-encoded 64-bit number.
     """
     result = 0
     shift = 0
     while 1:
       if shift >= 64:
         raise message.DecodeError('Too many bytes when decoding varint.')
       try:
         b = ord(self._buffer[self._pos])
       except IndexError:
         raise message.DecodeError('Truncated varint.')
       self._pos += 1
       result |= ((b & 0x7f) << shift)
       shift += 7
       if not (b & 0x80):
         return result


 class InputStreamArray(object):

   """Contains all logic for reading bits, and dealing with stream position.

   If an InputStream method ever raises an exception, the stream is left
   in an indeterminate state and is not safe for further use.

   This alternative to InputStreamBuffer is used in environments where buffer()
   is unavailble, such as Google App Engine.
   """

   def __init__(self, s):
     self._buffer = array.array('B', s)
     self._pos = 0

   def EndOfStream(self):
     return self._pos >= len(self._buffer)

   def Position(self):
     return self._pos

   def GetSubBuffer(self, size=None):
     if size is None:
       return self._buffer[self._pos : ].tostring()
     else:
       if size < 0:
         raise message.DecodeError('Negative size %d' % size)
       return self._buffer[self._pos : self._pos + size].tostring()

   def SkipBytes(self, num_bytes):
     if num_bytes < 0:
       raise message.DecodeError('Negative num_bytes %d' % num_bytes)
     self._pos += num_bytes
     self._pos = min(self._pos, len(self._buffer))

   def ReadBytes(self, size):
     if size < 0:
       raise message.DecodeError('Negative size %d' % size)
     s = self._buffer[self._pos : self._pos + size].tostring()
     self._pos += len(s)  # Only advance by the number of bytes actually read.
     return s

   def ReadLittleEndian32(self):
     try:
       i = struct.unpack(wire_format.FORMAT_UINT32_LITTLE_ENDIAN,
                         self._buffer[self._pos : self._pos + 4])
       self._pos += 4
       return i[0]  # unpack() result is a 1-element tuple.
     except struct.error, e:
       raise message.DecodeError(e)

   def ReadLittleEndian64(self):
     try:
       i = struct.unpack(wire_format.FORMAT_UINT64_LITTLE_ENDIAN,
                         self._buffer[self._pos : self._pos + 8])
       self._pos += 8
       return i[0]  # unpack() result is a 1-element tuple.
     except struct.error, e:
       raise message.DecodeError(e)

   def ReadVarint32(self):
     i = self.ReadVarint64()
     if not wire_format.INT32_MIN <= i <= wire_format.INT32_MAX:
       raise message.DecodeError('Value out of range for int32: %d' % i)
     return int(i)

   def ReadVarUInt32(self):
     i = self.ReadVarUInt64()
     if i > wire_format.UINT32_MAX:
       raise message.DecodeError('Value out of range for uint32: %d' % i)
     return i

   def ReadVarint64(self):
     i = self.ReadVarUInt64()
     if i > wire_format.INT64_MAX:
       i -= (1 << 64)
     return i

   def ReadVarUInt64(self):
     i = self._ReadVarintHelper()
     if not 0 <= i <= wire_format.UINT64_MAX:
       raise message.DecodeError('Value out of range for uint64: %d' % i)
     return i

   def _ReadVarintHelper(self):
     result = 0
     shift = 0
     while 1:
       if shift >= 64:
         raise message.DecodeError('Too many bytes when decoding varint.')
       try:
         b = self._buffer[self._pos]
       except IndexError:
         raise message.DecodeError('Truncated varint.')
       self._pos += 1
       result |= ((b & 0x7f) << shift)
       shift += 7
       if not (b & 0x80):
         return result


 try:
   buffer('')
   InputStream = InputStreamBuffer
 except NotImplementedError:
   # Google App Engine: dev_appserver.py
   InputStream = InputStreamArray
 except RuntimeError:
   # Google App Engine: production
   InputStream = InputStreamArray
	# Protocol Buffers - Google's data interchange format
	# Copyright 2008 Google Inc. All rights reserved.
	# http://code.google.com/p/protobuf/
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google Inc. nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	"""InputStream is the primitive interface for reading bits from the wire.

	All protocol buffer deserialization can be expressed in terms of
	the InputStream primitives provided here.
	"""

	__author__ = 'robinson@google.com (Will Robinson)'

	import array
	import struct
	from google.protobuf import message
	from google.protobuf.internal import wire_format


	# Note that much of this code is ported from //net/proto/ProtocolBuffer, and
	# that the interface is strongly inspired by CodedInputStream from the C++
	# proto2 implementation.


	class InputStreamBuffer(object):

	"""Contains all logic for reading bits, and dealing with stream position.

	If an InputStream method ever raises an exception, the stream is left
	in an indeterminate state and is not safe for further use.
	"""

	def __init__(self, s):
	# What we really want is something like array('B', s), where elements we
	# read from the array are already given to us as one-byte integers. BUT
	# using array() instead of buffer() would force full string copies to result
	# from each GetSubBuffer() call.
	#
	# So, if the N serialized bytes of a single protocol buffer object are
	# split evenly between 2 child messages, and so on recursively, using
	# array('B', s) instead of buffer() would incur an additional N*logN bytes
	# copied during deserialization.
	#
	# The higher constant overhead of having to ord() for every byte we read
	# from the buffer in _ReadVarintHelper() could definitely lead to worse
	# performance in many real-world scenarios, even if the asymptotic
	# complexity is better. However, our real answer is that the mythical
	# Python/C extension module output mode for the protocol compiler will
	# be blazing-fast and will eliminate most use of this class anyway.
	self._buffer = buffer(s)
	self._pos = 0

	def EndOfStream(self):
	"""Returns true iff we're at the end of the stream.
	If this returns true, then a call to any other InputStream method
	will raise an exception.
	"""
	return self._pos >= len(self._buffer)

	def Position(self):
	"""Returns the current position in the stream, or equivalently, the
	number of bytes read so far.
	"""
	return self._pos

	def GetSubBuffer(self, size=None):
	"""Returns a sequence-like object that represents a portion of our
	underlying sequence.

	Position 0 in the returned object corresponds to self.Position()
	in this stream.

	If size is specified, then the returned object ends after the
	next "size" bytes in this stream. If size is not specified,
	then the returned object ends at the end of this stream.

	We guarantee that the returned object R supports the Python buffer
	interface (and thus that the call buffer(R) will work).

	Note that the returned buffer is read-only.

	The intended use for this method is for nested-message and nested-group
	deserialization, where we want to make a recursive MergeFromString()
	call on the portion of the original sequence that contains the serialized
	nested message. (And we'd like to do so without making unnecessary string
	copies).

	REQUIRES: size is nonnegative.
	"""
	# Note that buffer() doesn't perform any actual string copy.
	if size is None:
	return buffer(self._buffer, self._pos)
	else:
	if size < 0:
	raise message.DecodeError('Negative size %d' % size)
	return buffer(self._buffer, self._pos, size)

	def SkipBytes(self, num_bytes):
	"""Skip num_bytes bytes ahead, or go to the end of the stream, whichever
	comes first.

	REQUIRES: num_bytes is nonnegative.
	"""
	if num_bytes < 0:
	raise message.DecodeError('Negative num_bytes %d' % num_bytes)
	self._pos += num_bytes
	self._pos = min(self._pos, len(self._buffer))

	def ReadBytes(self, size):
	"""Reads up to 'size' bytes from the stream, stopping early
	only if we reach the end of the stream. Returns the bytes read
	as a string.
	"""
	if size < 0:
	raise message.DecodeError('Negative size %d' % size)
	s = (self._buffer[self._pos : self._pos + size])
	self._pos += len(s) # Only advance by the number of bytes actually read.
	return s

	def ReadLittleEndian32(self):
	"""Interprets the next 4 bytes of the stream as a little-endian
	encoded, unsiged 32-bit integer, and returns that integer.
	"""
	try:
	i = struct.unpack(wire_format.FORMAT_UINT32_LITTLE_ENDIAN,
	self._buffer[self._pos : self._pos + 4])
	self._pos += 4
	return i[0] # unpack() result is a 1-element tuple.
	except struct.error, e:
	raise message.DecodeError(e)

	def ReadLittleEndian64(self):
	"""Interprets the next 8 bytes of the stream as a little-endian
	encoded, unsiged 64-bit integer, and returns that integer.
	"""
	try:
	i = struct.unpack(wire_format.FORMAT_UINT64_LITTLE_ENDIAN,
	self._buffer[self._pos : self._pos + 8])
	self._pos += 8
	return i[0] # unpack() result is a 1-element tuple.
	except struct.error, e:
	raise message.DecodeError(e)

	def ReadVarint32(self):
	"""Reads a varint from the stream, interprets this varint
	as a signed, 32-bit integer, and returns the integer.
	"""
	i = self.ReadVarint64()
	if not wire_format.INT32_MIN <= i <= wire_format.INT32_MAX:
	raise message.DecodeError('Value out of range for int32: %d' % i)
	return int(i)

	def ReadVarUInt32(self):
	"""Reads a varint from the stream, interprets this varint
	as an unsigned, 32-bit integer, and returns the integer.
	"""
	i = self.ReadVarUInt64()
	if i > wire_format.UINT32_MAX:
	raise message.DecodeError('Value out of range for uint32: %d' % i)
	return i

	def ReadVarint64(self):
	"""Reads a varint from the stream, interprets this varint
	as a signed, 64-bit integer, and returns the integer.
	"""
	i = self.ReadVarUInt64()
	if i > wire_format.INT64_MAX:
	i -= (1 << 64)
	return i

	def ReadVarUInt64(self):
	"""Reads a varint from the stream, interprets this varint
	as an unsigned, 64-bit integer, and returns the integer.
	"""
	i = self._ReadVarintHelper()
	if not 0 <= i <= wire_format.UINT64_MAX:
	raise message.DecodeError('Value out of range for uint64: %d' % i)
	return i

	def _ReadVarintHelper(self):
	"""Helper for the various varint-reading methods above.
	Reads an unsigned, varint-encoded integer from the stream and
	returns this integer.

	Does no bounds checking except to ensure that we read at most as many bytes
	as could possibly be present in a varint-encoded 64-bit number.
	"""
	result = 0
	shift = 0
	while 1:
	if shift >= 64:
	raise message.DecodeError('Too many bytes when decoding varint.')
	try:
	b = ord(self._buffer[self._pos])
	except IndexError:
	raise message.DecodeError('Truncated varint.')
	self._pos += 1
	result \|= ((b & 0x7f) << shift)
	shift += 7
	if not (b & 0x80):
	return result


	class InputStreamArray(object):

	"""Contains all logic for reading bits, and dealing with stream position.

	If an InputStream method ever raises an exception, the stream is left
	in an indeterminate state and is not safe for further use.

	This alternative to InputStreamBuffer is used in environments where buffer()
	is unavailble, such as Google App Engine.
	"""

	def __init__(self, s):
	self._buffer = array.array('B', s)
	self._pos = 0

	def EndOfStream(self):
	return self._pos >= len(self._buffer)

	def Position(self):
	return self._pos

	def GetSubBuffer(self, size=None):
	if size is None:
	return self._buffer[self._pos : ].tostring()
	else:
	if size < 0:
	raise message.DecodeError('Negative size %d' % size)
	return self._buffer[self._pos : self._pos + size].tostring()

	def SkipBytes(self, num_bytes):
	if num_bytes < 0:
	raise message.DecodeError('Negative num_bytes %d' % num_bytes)
	self._pos += num_bytes
	self._pos = min(self._pos, len(self._buffer))

	def ReadBytes(self, size):
	if size < 0:
	raise message.DecodeError('Negative size %d' % size)
	s = self._buffer[self._pos : self._pos + size].tostring()
	self._pos += len(s) # Only advance by the number of bytes actually read.
	return s

	def ReadLittleEndian32(self):
	try:
	i = struct.unpack(wire_format.FORMAT_UINT32_LITTLE_ENDIAN,
	self._buffer[self._pos : self._pos + 4])
	self._pos += 4
	return i[0] # unpack() result is a 1-element tuple.
	except struct.error, e:
	raise message.DecodeError(e)

	def ReadLittleEndian64(self):
	try:
	i = struct.unpack(wire_format.FORMAT_UINT64_LITTLE_ENDIAN,
	self._buffer[self._pos : self._pos + 8])
	self._pos += 8
	return i[0] # unpack() result is a 1-element tuple.
	except struct.error, e:
	raise message.DecodeError(e)

	def ReadVarint32(self):
	i = self.ReadVarint64()
	if not wire_format.INT32_MIN <= i <= wire_format.INT32_MAX:
	raise message.DecodeError('Value out of range for int32: %d' % i)
	return int(i)

	def ReadVarUInt32(self):
	i = self.ReadVarUInt64()
	if i > wire_format.UINT32_MAX:
	raise message.DecodeError('Value out of range for uint32: %d' % i)
	return i

	def ReadVarint64(self):
	i = self.ReadVarUInt64()
	if i > wire_format.INT64_MAX:
	i -= (1 << 64)
	return i

	def ReadVarUInt64(self):
	i = self._ReadVarintHelper()
	if not 0 <= i <= wire_format.UINT64_MAX:
	raise message.DecodeError('Value out of range for uint64: %d' % i)
	return i

	def _ReadVarintHelper(self):
	result = 0
	shift = 0
	while 1:
	if shift >= 64:
	raise message.DecodeError('Too many bytes when decoding varint.')
	try:
	b = self._buffer[self._pos]
	except IndexError:
	raise message.DecodeError('Truncated varint.')
	self._pos += 1
	result \|= ((b & 0x7f) << shift)
	shift += 7
	if not (b & 0x80):
	return result


	try:
	buffer('')
	InputStream = InputStreamBuffer
	except NotImplementedError:
	# Google App Engine: dev_appserver.py
	InputStream = InputStreamArray
	except RuntimeError:
	# Google App Engine: production
	InputStream = InputStreamArray