2017-11-26 19:14:28 +03:00
|
|
|
"""
|
|
|
|
This module contains the BinaryReader utility class.
|
|
|
|
"""
|
2016-11-30 00:29:42 +03:00
|
|
|
import os
|
2016-09-11 11:35:02 +03:00
|
|
|
from datetime import datetime
|
2016-11-30 00:29:42 +03:00
|
|
|
from io import BufferedReader, BytesIO
|
2016-08-30 14:11:19 +03:00
|
|
|
from struct import unpack
|
2016-11-30 00:29:42 +03:00
|
|
|
|
2017-12-28 02:22:28 +03:00
|
|
|
from ..errors import TypeNotFoundError
|
2017-05-21 14:02:54 +03:00
|
|
|
from ..tl.all_tlobjects import tlobjects
|
2016-08-26 13:58:53 +03:00
|
|
|
|
|
|
|
|
|
|
|
class BinaryReader:
    """
    Small utility class to read binary data.

    The reader wraps either an in-memory bytes payload (a "Memory Stream"
    backed by ``BytesIO`` is created for it) or an already existing stream,
    and exposes helpers to read little-endian primitives as well as
    Telegram-encoded values (byte strings, booleans, dates, objects and
    vectors).

    It can be used as a context manager; leaving the ``with`` block calls
    ``close()``.
    """

    # Constructor IDs that are parsed by hand instead of through `tlobjects`.
    _BOOL_TRUE = 0x997275b5
    _BOOL_FALSE = 0xbc799737
    _VECTOR = 0x1cb5c415

    def __init__(self, data=None, stream=None):
        """
        Creates a reader over ``data`` or over ``stream``.

        :param data: bytes-like payload to read from. An empty payload is
                     valid and yields a reader with nothing left to read.
        :param stream: an existing binary stream, used when ``data`` is None.
        :raises ValueError: if neither ``data`` nor ``stream`` is given.
        """
        # Compare against None explicitly: an empty payload (b'') is falsy
        # but it is still a perfectly valid (empty) buffer to read from.
        if data is not None:
            self.stream = BytesIO(data)
        elif stream is not None:
            self.stream = stream
        else:
            raise ValueError('Either bytes or a stream must be provided')

        self.reader = BufferedReader(self.stream)
        self._last = None  # Should come in handy to spot -404 errors

    # region Reading

    # "All numbers are written as little endian."
    # https://core.telegram.org/mtproto
    def read_byte(self):
        """Reads a single byte value (returned as an ``int``)."""
        return self.read(1)[0]

    def read_int(self, signed=True):
        """Reads an integer (4 bytes) value."""
        return int.from_bytes(self.read(4), byteorder='little', signed=signed)

    def read_long(self, signed=True):
        """Reads a long integer (8 bytes) value."""
        return int.from_bytes(self.read(8), byteorder='little', signed=signed)

    def read_float(self):
        """Reads a real floating point (4 bytes) value."""
        return unpack('<f', self.read(4))[0]

    def read_double(self):
        """Reads a real floating point (8 bytes) value."""
        return unpack('<d', self.read(8))[0]

    def read_large_int(self, bits, signed=True):
        """Reads a n-bits long integer value (``bits // 8`` bytes)."""
        return int.from_bytes(
            self.read(bits // 8), byteorder='little', signed=signed)

    def read(self, length):
        """
        Reads exactly the given amount of bytes.

        :param length: how many bytes must be read.
        :return: the bytes read.
        :raises BufferError: if the amount of bytes obtained from the
                             underlying reader differs from ``length``.
        """
        result = self.reader.read(length)
        if len(result) != length:
            # Include the previous successful read to ease debugging.
            raise BufferError(
                'No more data left to read (need {}, got {}: {}); last read {}'
                .format(length, len(result), repr(result), repr(self._last))
            )

        self._last = result
        return result

    def get_bytes(self):
        """
        Gets the byte array representing the current buffer as a whole.

        This relies on the underlying stream providing ``getvalue()``
        (as ``BytesIO`` does).
        """
        return self.stream.getvalue()

    # endregion

    # region Telegram custom reading

    def tgread_bytes(self):
        """
        Reads a Telegram-encoded byte array, without the need of
        specifying its length.

        If the first byte is 254, the length is stored in the next three
        bytes (little endian); otherwise the first byte itself is the
        length. Trailing padding is consumed so that header plus data
        always span a multiple of 4 bytes.
        """
        first_byte = self.read_byte()
        if first_byte == 254:
            length = self.read_byte() | (self.read_byte() << 8) | (
                self.read_byte() << 16)
            # The header took 4 bytes, so only the data affects alignment.
            padding = length % 4
        else:
            length = first_byte
            # The header took 1 byte, account for it in the alignment.
            padding = (length + 1) % 4

        data = self.read(length)
        if padding > 0:
            # Skip the bytes remaining up to the next multiple of 4.
            padding = 4 - padding
            self.read(padding)

        return data

    def tgread_string(self):
        """
        Reads a Telegram-encoded string.

        The bytes are decoded as UTF-8; undecodable sequences are
        replaced instead of raising.
        """
        return str(self.tgread_bytes(), encoding='utf-8', errors='replace')

    def tgread_bool(self):
        """
        Reads a Telegram boolean value.

        :raises RuntimeError: if the constructor code read is neither
                              boolTrue nor boolFalse.
        """
        value = self.read_int(signed=False)
        if value == self._BOOL_TRUE:  # boolTrue
            return True
        elif value == self._BOOL_FALSE:  # boolFalse
            return False
        else:
            raise RuntimeError('Invalid boolean code {}'.format(hex(value)))

    def tgread_date(self):
        """Reads and converts Unix time (used by Telegram)
           into a Python datetime object.

           A value of 0 yields ``None``. The returned datetime is naive
           (it carries no tzinfo) and expresses UTC.
        """
        value = self.read_int()
        return None if value == 0 else datetime.utcfromtimestamp(value)

    def tgread_object(self):
        """
        Reads a Telegram object.

        The constructor ID (4 bytes, unsigned) is looked up in
        ``tlobjects`` and the matching class parses itself from this reader.

        :raises TypeNotFoundError: if the constructor ID is unknown; the
                                   position is moved back 4 bytes first so
                                   the ID can be read again.
        """
        constructor_id = self.read_int(signed=False)
        clazz = tlobjects.get(constructor_id, None)
        if clazz is None:
            # The class was None, but there's still a
            # chance of it being a manually parsed value like bool!
            value = constructor_id
            if value == self._BOOL_TRUE:  # boolTrue
                return True
            elif value == self._BOOL_FALSE:  # boolFalse
                return False

            # If there was still no luck, give up
            self.seek(-4)  # Go back
            raise TypeNotFoundError(constructor_id)

        return clazz.from_reader(self)

    def tgread_vector(self):
        """
        Reads a vector (a list) of Telegram objects.

        :raises RuntimeError: if the constructor code read is not the
                              vector one.
        """
        if self._VECTOR != self.read_int(signed=False):
            raise RuntimeError('Invalid constructor code, vector was expected')

        count = self.read_int()
        return [self.tgread_object() for _ in range(count)]

    # endregion

    def close(self):
        """Closes the reader, freeing the BytesIO stream."""
        self.reader.close()

    # region Position related

    def tell_position(self):
        """Tells the current position on the stream."""
        return self.reader.tell()

    def set_position(self, position):
        """Sets the current position on the stream."""
        self.reader.seek(position)

    def seek(self, offset):
        """
        Seeks the stream position given an offset from the current position.
        The offset may be negative.
        """
        self.reader.seek(offset, os.SEEK_CUR)

    # endregion

    # region with block

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        self.close()

    # endregion
|