1
0
mirror of https://github.com/trezor/trezor-firmware.git synced 2024-12-18 20:38:10 +00:00
trezor-firmware/src/protobuf.py

265 lines
6.8 KiB
Python
Raw Normal View History

'''
2017-07-04 16:09:08 +00:00
Extremely minimal streaming codec for a subset of protobuf. Supports unsigned
and signed (zigzag) varints, bool, bytes, string, embedded messages and
repeated fields.
2017-08-21 11:22:35 +00:00
For de-serializing (loading) protobuf types, an object with the `AsyncReader`
interface is required:
2017-09-16 13:00:31 +00:00
>>> class AsyncReader:
>>>     async def areadinto(self, buffer):
>>>         """
>>>         Reads `len(buffer)` bytes into `buffer`, or raises `EOFError`.
>>>         """
2017-08-21 11:22:35 +00:00
For serializing (dumping) protobuf types, an object with the `AsyncWriter`
interface is required:
2017-09-16 13:00:31 +00:00
>>> class AsyncWriter:
>>>     async def awrite(self, buffer):
>>>         """
>>>         Writes all bytes from `buffer`, or raises `EOFError`.
>>>         """
2016-09-21 12:14:49 +00:00
'''
2016-09-29 10:29:43 +00:00
from micropython import const
2017-07-04 16:09:08 +00:00
# Single-byte scratch buffer shared by load_uvarint() and dump_uvarint();
# presumably kept at module level to avoid allocating one per call.
_UVARINT_BUFFER = bytearray(1)
2016-09-21 12:14:49 +00:00
2017-07-04 16:09:08 +00:00
async def load_uvarint(reader):
    """
    Read one unsigned varint from `reader` and return it as an int.

    Bytes are fetched one at a time with `reader.areadinto()` into the shared
    one-byte scratch buffer. The low 7 bits of every byte are accumulated,
    least-significant group first, until a byte with the high bit clear is
    seen. Any exception raised by the reader propagates to the caller.
    """
    scratch = _UVARINT_BUFFER
    value = 0
    offset = 0
    while True:
        await reader.areadinto(scratch)
        chunk = scratch[0]
        # the 7-bit groups never overlap, so OR-ing them in equals adding them
        value |= (chunk & 0x7F) << offset
        if not chunk & 0x80:
            # continuation bit is clear: this was the last byte
            return value
        offset += 7
2016-09-21 12:14:49 +00:00
2017-07-04 16:09:08 +00:00
async def dump_uvarint(writer, n):
    """
    Write the non-negative integer `n` to `writer` as an unsigned varint.

    The value is emitted 7 bits at a time, least-significant group first, one
    `writer.awrite()` call per byte using the shared one-byte scratch buffer.
    Every byte except the last has its high bit set.

    Raises `ValueError` when `n` is negative.
    """
    if n < 0:
        raise ValueError("Cannot dump signed value, convert it to unsigned first.")

    scratch = _UVARINT_BUFFER
    while True:
        rest = n >> 7
        low = n & 0x7F
        if rest:
            # more groups follow, so flag this byte as a continuation
            low |= 0x80
        scratch[0] = low
        await writer.awrite(scratch)
        if not rest:
            break
        n = rest
# protobuf interleaved signed encoding:
# https://developers.google.com/protocol-buffers/docs/encoding#structure
# the idea is to save the sign in LSbit instead of twos-complement.
# so counting up, you go: 0, -1, 1, -2, 2, ... (as the first bit changes, sign flips)
#
# To achieve this with a twos-complement number:
# 1. shift left by 1, leaving LSbit free
# 2. if the number is negative, do bitwise negation.
# This keeps positive number the same, and converts negative from twos-complement
# to the appropriate value, while setting the sign bit.
#
# The original algorithm makes use of the fact that an arithmetic (signed) shift
# keeps the sign bit, so for an n-bit number, (x >> (n - 1)) gets us "all sign bits".
# Then you can take "number XOR all-sign-bits", which is XOR with all zeros (identity)
# for positive and XOR with all ones (bitwise negation) for negative. Cute and efficient.
#
# But this is harder in Python because we don't natively know the bit size of the number.
# So we have to branch on whether the number is negative.
2018-07-03 14:20:58 +00:00
def sint_to_uint(sint):
    """
    Map a signed integer onto the interleaved unsigned encoding.

    The value is shifted left by one bit; for negative inputs the shifted
    value is then bitwise-negated, so 0, -1, 1, -2, 2 become 0, 1, 2, 3, 4.
    """
    doubled = sint << 1
    return ~doubled if sint < 0 else doubled
def uint_to_sint(uint):
    """
    Decode an interleaved unsigned value back into a signed integer.

    The lowest bit carries the sign: the remaining bits are shifted right by
    one and bitwise-negated when that bit is set, so 0, 1, 2, 3, 4 become
    0, -1, 1, -2, 2.
    """
    half = uint >> 1
    return ~half if uint & 1 else half
2016-04-07 21:45:10 +00:00
class UVarintType:
    """Schema marker for a field stored as an unsigned varint."""

    WIRE_TYPE = 0
class SVarintType:
    """Schema marker for a signed field stored as an interleaved varint."""

    WIRE_TYPE = 0
2017-07-04 16:09:08 +00:00
class BoolType:
    """Schema marker for a boolean field stored as a varint."""

    WIRE_TYPE = 0
2016-08-05 10:35:45 +00:00
2016-04-07 21:45:10 +00:00
2017-07-04 16:09:08 +00:00
class BytesType:
    """Schema marker for a length-prefixed raw bytes field."""

    WIRE_TYPE = 2
2016-04-07 21:45:10 +00:00
2017-07-04 16:09:08 +00:00
class UnicodeType:
    """Schema marker for a length-prefixed text field (encoded/decoded as str)."""

    WIRE_TYPE = 2
2016-09-21 12:14:49 +00:00
2017-07-04 16:09:08 +00:00
class MessageType:
    """
    Base class for message types handled by this codec.

    Subclasses are expected to override `get_fields()`; the base
    implementation describes a message with no fields.
    """

    WIRE_TYPE = 2

    @classmethod
    def get_fields(cls):
        """Return the field table of this message type (empty for the base class)."""
        return {}

    def __init__(self, **kwargs):
        """Store every keyword argument as an instance attribute of the same name."""
        for name, value in kwargs.items():
            setattr(self, name, value)

    def __eq__(self, rhs):
        """Messages are equal when they share the exact class and the same attributes."""
        if self.__class__ is not rhs.__class__:
            return False
        return self.__dict__ == rhs.__dict__

    def __repr__(self):
        """Return the class name wrapped in angle brackets."""
        return "<%s>" % self.__class__.__name__
2017-07-04 16:09:08 +00:00
class LimitedReader:
    """
    Reader wrapper that refuses to read past a fixed byte budget.

    `limit` is the number of bytes that may still be read from `reader`.
    """

    def __init__(self, reader, limit):
        self.reader = reader
        self.limit = limit

    async def areadinto(self, buf):
        """
        Fill `buf` from the wrapped reader and charge the read against the limit.

        Raises `EOFError`, without touching the wrapped reader, when `buf` is
        larger than the remaining limit. Otherwise returns whatever the wrapped
        reader's `areadinto()` returned, after subtracting it from the limit.
        """
        if len(buf) > self.limit:
            raise EOFError
        count = await self.reader.areadinto(buf)
        self.limit -= count
        return count
class CountingWriter:
    """Writer that discards its input and only tallies how many bytes were written."""

    def __init__(self):
        self.size = 0

    async def awrite(self, buf):
        """Add `len(buf)` to the running `size` and return that length."""
        length = len(buf)
        self.size += length
        return length
# Bit in a field's flags value marking the field as repeated; tested by
# load_message() and dump_message().
FLAG_REPEATED = const(1)
async def load_message(reader, msg_type):
    """
    Parse a message of type `msg_type` from `reader` and return the instance.

    Fields are read until loading the next field key raises `EOFError`.
    Tags missing from `msg_type.get_fields()` are skipped when their wire type
    is 0 or 2; any other wire type on an unknown tag raises `ValueError`.
    Known fields whose wire type disagrees with the schema, or whose schema
    type is not handled here, raise `TypeError`. Values of fields flagged with
    `FLAG_REPEATED` are collected into a list. Every schema field that never
    appeared in the stream is set to `None` on the result.
    """
    schema = msg_type.get_fields()
    message = msg_type()

    while True:
        try:
            key = await load_uvarint(reader)
        except EOFError:
            # EOF while reading a field key ends the message
            break

        tag, wire = key >> 3, key & 7
        spec = schema.get(tag)

        if spec is None:
            # tag is not in the schema: consume its payload and drop it
            if wire == 0:
                await load_uvarint(reader)
            elif wire == 2:
                length = await load_uvarint(reader)
                await reader.areadinto(bytearray(length))
            else:
                raise ValueError
            continue

        name, kind, flags = spec
        if kind.WIRE_TYPE != wire:
            raise TypeError  # parsed wire type differs from the schema

        # for wire type 0 this is the value itself, for wire type 2 the length
        raw = await load_uvarint(reader)

        if kind is UVarintType:
            value = raw
        elif kind is SVarintType:
            value = uint_to_sint(raw)
        elif kind is BoolType:
            value = bool(raw)
        elif kind is BytesType or kind is UnicodeType:
            value = bytearray(raw)
            await reader.areadinto(value)
            if kind is UnicodeType:
                value = bytes(value).decode()
        elif issubclass(kind, MessageType):
            # confine the nested parser to the embedded message's byte span
            value = await load_message(LimitedReader(reader, raw), kind)
        else:
            raise TypeError  # field type is unknown

        if not flags & FLAG_REPEATED:
            setattr(message, name, value)
            continue

        # repeated field: extend the list already on the message, or start one
        items = getattr(message, name, [])
        items.append(value)
        setattr(message, name, items)

    # fill missing fields
    for tag in schema:
        name = schema[tag][0]
        if not hasattr(message, name):
            setattr(message, name, None)

    return message
async def dump_message(writer, msg):
    """
    Serialize `msg` to `writer` according to its class's `get_fields()` table.

    Fields whose attribute is missing or `None` are skipped. A field flagged
    with `FLAG_REPEATED` is iterated and each element is written with its own
    field key; any other field is written once. Embedded messages are dumped
    twice: first into a `CountingWriter` to learn their size, then into
    `writer` after the size prefix. Raises `TypeError` for a schema type that
    is not handled here; errors from `dump_uvarint()` propagate.
    """
    single = [0]  # reusable one-slot list so scalar fields share the loop below
    schema = msg.__class__.get_fields()

    for tag in schema:
        name, kind, flags = schema[tag]

        values = getattr(msg, name, None)
        if values is None:
            continue

        key = (tag << 3) | kind.WIRE_TYPE

        if not flags & FLAG_REPEATED:
            single[0] = values
            values = single

        for item in values:
            await dump_uvarint(writer, key)

            if kind is UVarintType:
                await dump_uvarint(writer, item)
            elif kind is SVarintType:
                await dump_uvarint(writer, sint_to_uint(item))
            elif kind is BoolType:
                await dump_uvarint(writer, int(item))
            elif kind is BytesType or kind is UnicodeType:
                # text is encoded first so the prefix is the byte length
                payload = item.encode() if kind is UnicodeType else item
                await dump_uvarint(writer, len(payload))
                await writer.awrite(payload)
            elif issubclass(kind, MessageType):
                # dry run to measure the embedded message before writing it
                sizer = CountingWriter()
                await dump_message(sizer, item)
                await dump_uvarint(writer, sizer.size)
                await dump_message(writer, item)
            else:
                raise TypeError