mirror of
https://github.com/LonamiWebs/Telethon.git
synced 2025-01-24 08:14:14 +03:00
c4e26c95f5
This removes the need for a .clear_cache() method as now files are identified by their MD5 (which needs to be calculated always) and their file size (to make collisions even more unlikely) instead using the file path (which can now change).
936 lines
37 KiB
Python
936 lines
37 KiB
Python
import logging
|
|
import os
|
|
import threading
|
|
import warnings
|
|
from datetime import timedelta, datetime
|
|
from hashlib import md5
|
|
from io import BytesIO
|
|
from signal import signal, SIGINT, SIGTERM, SIGABRT
|
|
from threading import Lock
|
|
from time import sleep
|
|
|
|
from . import helpers as utils, version
|
|
from .crypto import rsa, CdnDecrypter
|
|
from .errors import (
|
|
RPCError, BrokenAuthKeyError, ServerError,
|
|
FloodWaitError, FileMigrateError, TypeNotFoundError,
|
|
UnauthorizedError, PhoneMigrateError, NetworkMigrateError, UserMigrateError
|
|
)
|
|
from .network import authenticator, MtProtoSender, Connection, ConnectionMode
|
|
from .tl import TLObject, Session
|
|
from .tl.all_tlobjects import LAYER
|
|
from .tl.functions import (
|
|
InitConnectionRequest, InvokeWithLayerRequest, PingRequest
|
|
)
|
|
from .tl.functions.auth import (
|
|
ImportAuthorizationRequest, ExportAuthorizationRequest
|
|
)
|
|
from .tl.functions.help import (
|
|
GetCdnConfigRequest, GetConfigRequest
|
|
)
|
|
from .tl.functions.updates import GetStateRequest
|
|
from .tl.functions.upload import (
|
|
GetFileRequest, SaveBigFilePartRequest, SaveFilePartRequest
|
|
)
|
|
from .tl.types import InputFile, InputFileBig
|
|
from .tl.types.auth import ExportedAuthorization
|
|
from .tl.types.upload import FileCdnRedirect
|
|
from .update_state import UpdateState
|
|
from .utils import get_appropriated_part_size
|
|
|
|
|
|
DEFAULT_DC_ID = 4
|
|
DEFAULT_IPV4_IP = '149.154.167.51'
|
|
DEFAULT_IPV6_IP = '[2001:67c:4e8:f002::a]'
|
|
DEFAULT_PORT = 443
|
|
|
|
__log__ = logging.getLogger(__name__)
|
|
|
|
|
|
class TelegramBareClient:
|
|
"""Bare Telegram Client with just the minimum -
|
|
|
|
The reason to distinguish between a MtProtoSender and a
|
|
TelegramClient itself is because the sender is just that,
|
|
a sender, which should know nothing about Telegram but
|
|
rather how to handle this specific connection.
|
|
|
|
The TelegramClient itself should know how to initialize
|
|
a proper connection to the servers, as well as other basic
|
|
methods such as disconnection and reconnection.
|
|
|
|
This distinction between a bare client and a full client
|
|
makes it possible to create clones of the bare version
|
|
(by using the same session, IP address and port) to be
|
|
able to execute queries on either, without the additional
|
|
cost that would involve having the methods for signing in,
|
|
logging out, and such.
|
|
"""
|
|
|
|
# Current TelegramClient version
|
|
__version__ = version.__version__
|
|
|
|
# TODO Make this thread-safe, all connections share the same DC
|
|
_config = None # Server configuration (with .dc_options)
|
|
|
|
# region Initialization
|
|
|
|
def __init__(self, session, api_id, api_hash,
|
|
connection_mode=ConnectionMode.TCP_FULL,
|
|
use_ipv6=False,
|
|
proxy=None,
|
|
update_workers=None,
|
|
spawn_read_thread=False,
|
|
timeout=timedelta(seconds=5),
|
|
**kwargs):
|
|
"""Refer to TelegramClient.__init__ for docs on this method"""
|
|
if not api_id or not api_hash:
|
|
raise ValueError(
|
|
"Your API ID or Hash cannot be empty or None. "
|
|
"Refer to Telethon's wiki for more information.")
|
|
|
|
self._use_ipv6 = use_ipv6
|
|
|
|
# Determine what session object we have
|
|
if isinstance(session, str) or session is None:
|
|
session = Session(session)
|
|
elif not isinstance(session, Session):
|
|
raise TypeError(
|
|
'The given session must be a str or a Session instance.'
|
|
)
|
|
|
|
# ':' in session.server_address is True if it's an IPv6 address
|
|
if (not session.server_address or
|
|
(':' in session.server_address) != use_ipv6):
|
|
session.set_dc(
|
|
DEFAULT_DC_ID,
|
|
DEFAULT_IPV6_IP if self._use_ipv6 else DEFAULT_IPV4_IP,
|
|
DEFAULT_PORT
|
|
)
|
|
|
|
self.session = session
|
|
self.api_id = int(api_id)
|
|
self.api_hash = api_hash
|
|
if self.api_id < 20: # official apps must use obfuscated
|
|
connection_mode = ConnectionMode.TCP_OBFUSCATED
|
|
|
|
# This is the main sender, which will be used from the thread
|
|
# that calls .connect(). Every other thread will spawn a new
|
|
# temporary connection. The connection on this one is always
|
|
# kept open so Telegram can send us updates.
|
|
self._sender = MtProtoSender(self.session, Connection(
|
|
mode=connection_mode, proxy=proxy, timeout=timeout
|
|
))
|
|
|
|
# Two threads may be calling reconnect() when the connection is lost,
|
|
# we only want one to actually perform the reconnection.
|
|
self._reconnect_lock = Lock()
|
|
|
|
# Cache "exported" sessions as 'dc_id: Session' not to recreate
|
|
# them all the time since generating a new key is a relatively
|
|
# expensive operation.
|
|
self._exported_sessions = {}
|
|
|
|
# This member will process updates if enabled.
|
|
# One may change self.updates.enabled at any later point.
|
|
self.updates = UpdateState(workers=update_workers)
|
|
|
|
# Used on connection - the user may modify these and reconnect
|
|
kwargs['app_version'] = kwargs.get('app_version', self.__version__)
|
|
for name, value in kwargs.items():
|
|
if not hasattr(self.session, name):
|
|
raise ValueError('Unknown named parameter', name)
|
|
setattr(self.session, name, value)
|
|
|
|
# Despite the state of the real connection, keep track of whether
|
|
# the user has explicitly called .connect() or .disconnect() here.
|
|
# This information is required by the read thread, who will be the
|
|
# one attempting to reconnect on the background *while* the user
|
|
# doesn't explicitly call .disconnect(), thus telling it to stop
|
|
# retrying. The main thread, knowing there is a background thread
|
|
# attempting reconnection as soon as it happens, will just sleep.
|
|
self._user_connected = False
|
|
|
|
# Save whether the user is authorized here (a.k.a. logged in)
|
|
self._authorized = None # None = We don't know yet
|
|
|
|
# The first request must be in invokeWithLayer(initConnection(X)).
|
|
# See https://core.telegram.org/api/invoking#saving-client-info.
|
|
self._first_request = True
|
|
|
|
# Constantly read for results and updates from within the main client,
|
|
# if the user has left enabled such option.
|
|
self._spawn_read_thread = spawn_read_thread
|
|
self._recv_thread = None
|
|
|
|
# Identifier of the main thread (the one that called .connect()).
|
|
# This will be used to create new connections from any other thread,
|
|
# so that requests can be sent in parallel.
|
|
self._main_thread_ident = None
|
|
|
|
# Default PingRequest delay
|
|
self._last_ping = datetime.now()
|
|
self._ping_delay = timedelta(minutes=1)
|
|
|
|
# Some errors are known but there's nothing we can do from the
|
|
# background thread. If any of these happens, call .disconnect(),
|
|
# and raise them next time .invoke() is tried to be called.
|
|
self._background_error = None
|
|
|
|
# endregion
|
|
|
|
# region Connecting
|
|
|
|
def connect(self, _sync_updates=True):
|
|
"""Connects to the Telegram servers, executing authentication if
|
|
required. Note that authenticating to the Telegram servers is
|
|
not the same as authenticating the desired user itself, which
|
|
may require a call (or several) to 'sign_in' for the first time.
|
|
|
|
Note that the optional parameters are meant for internal use.
|
|
|
|
If '_sync_updates', sync_updates() will be called and a
|
|
second thread will be started if necessary. Note that this
|
|
will FAIL if the client is not connected to the user's
|
|
native data center, raising a "UserMigrateError", and
|
|
calling .disconnect() in the process.
|
|
"""
|
|
__log__.info('Connecting to %s:%d...',
|
|
self.session.server_address, self.session.port)
|
|
|
|
self._main_thread_ident = threading.get_ident()
|
|
self._background_error = None # Clear previous errors
|
|
|
|
try:
|
|
self._sender.connect()
|
|
__log__.info('Connection success!')
|
|
|
|
# Connection was successful! Try syncing the update state
|
|
# UNLESS '_sync_updates' is False (we probably are in
|
|
# another data center and this would raise UserMigrateError)
|
|
# to also assert whether the user is logged in or not.
|
|
self._user_connected = True
|
|
if self._authorized is None and _sync_updates:
|
|
try:
|
|
self.sync_updates()
|
|
self._set_connected_and_authorized()
|
|
except UnauthorizedError:
|
|
self._authorized = False
|
|
elif self._authorized:
|
|
self._set_connected_and_authorized()
|
|
|
|
return True
|
|
|
|
except TypeNotFoundError as e:
|
|
# This is fine, probably layer migration
|
|
__log__.warning('Connection failed, got unexpected type with ID '
|
|
'%s. Migrating?', hex(e.invalid_constructor_id))
|
|
self.disconnect()
|
|
return self.connect(_sync_updates=_sync_updates)
|
|
|
|
except (RPCError, ConnectionError) as e:
|
|
# Probably errors from the previous session, ignore them
|
|
__log__.error('Connection failed due to %s', e)
|
|
self.disconnect()
|
|
return False
|
|
|
|
def is_connected(self):
|
|
return self._sender.is_connected()
|
|
|
|
def _wrap_init_connection(self, query):
|
|
"""Wraps query around InvokeWithLayerRequest(InitConnectionRequest())"""
|
|
return InvokeWithLayerRequest(LAYER, InitConnectionRequest(
|
|
api_id=self.api_id,
|
|
device_model=self.session.device_model,
|
|
system_version=self.session.system_version,
|
|
app_version=self.session.app_version,
|
|
lang_code=self.session.lang_code,
|
|
system_lang_code=self.session.system_lang_code,
|
|
lang_pack='', # "langPacks are for official apps only"
|
|
query=query
|
|
))
|
|
|
|
def disconnect(self):
|
|
"""Disconnects from the Telegram server
|
|
and stops all the spawned threads"""
|
|
__log__.info('Disconnecting...')
|
|
self._user_connected = False # This will stop recv_thread's loop
|
|
|
|
__log__.debug('Stopping all workers...')
|
|
self.updates.stop_workers()
|
|
|
|
# This will trigger a "ConnectionResetError" on the recv_thread,
|
|
# which won't attempt reconnecting as ._user_connected is False.
|
|
__log__.debug('Disconnecting the socket...')
|
|
self._sender.disconnect()
|
|
|
|
# TODO Shall we clear the _exported_sessions, or may be reused?
|
|
self._first_request = True # On reconnect it will be first again
|
|
|
|
def __del__(self):
|
|
self.disconnect()
|
|
|
|
def _reconnect(self, new_dc=None):
|
|
"""If 'new_dc' is not set, only a call to .connect() will be made
|
|
since it's assumed that the connection has been lost and the
|
|
library is reconnecting.
|
|
|
|
If 'new_dc' is set, the client is first disconnected from the
|
|
current data center, clears the auth key for the old DC, and
|
|
connects to the new data center.
|
|
"""
|
|
if new_dc is None:
|
|
if self.is_connected():
|
|
__log__.info('Reconnection aborted: already connected')
|
|
return True
|
|
|
|
try:
|
|
__log__.info('Attempting reconnection...')
|
|
return self.connect()
|
|
except ConnectionResetError as e:
|
|
__log__.warning('Reconnection failed due to %s', e)
|
|
return False
|
|
else:
|
|
# Since we're reconnecting possibly due to a UserMigrateError,
|
|
# we need to first know the Data Centers we can connect to. Do
|
|
# that before disconnecting.
|
|
dc = self._get_dc(new_dc)
|
|
__log__.info('Reconnecting to new data center %s', dc)
|
|
|
|
self.session.set_dc(dc.id, dc.ip_address, dc.port)
|
|
# auth_key's are associated with a server, which has now changed
|
|
# so it's not valid anymore. Set to None to force recreating it.
|
|
self.session.auth_key = None
|
|
self.session.save()
|
|
self.disconnect()
|
|
return self.connect()
|
|
|
|
def set_proxy(self, proxy):
|
|
"""Change the proxy used by the connections.
|
|
"""
|
|
if self.is_connected():
|
|
raise RuntimeError("You can't change the proxy while connected.")
|
|
self._sender.connection.conn.proxy = proxy
|
|
|
|
# endregion
|
|
|
|
# region Working with different connections/Data Centers
|
|
|
|
def _on_read_thread(self):
|
|
return self._recv_thread is not None and \
|
|
threading.get_ident() == self._recv_thread.ident
|
|
|
|
def _get_dc(self, dc_id, cdn=False):
|
|
"""Gets the Data Center (DC) associated to 'dc_id'"""
|
|
if not TelegramBareClient._config:
|
|
TelegramBareClient._config = self(GetConfigRequest())
|
|
|
|
try:
|
|
if cdn:
|
|
# Ensure we have the latest keys for the CDNs
|
|
for pk in self(GetCdnConfigRequest()).public_keys:
|
|
rsa.add_key(pk.public_key)
|
|
|
|
return next(
|
|
dc for dc in TelegramBareClient._config.dc_options
|
|
if dc.id == dc_id and bool(dc.ipv6) == self._use_ipv6 and bool(dc.cdn) == cdn
|
|
)
|
|
except StopIteration:
|
|
if not cdn:
|
|
raise
|
|
|
|
# New configuration, perhaps a new CDN was added?
|
|
TelegramBareClient._config = self(GetConfigRequest())
|
|
return self._get_dc(dc_id, cdn=cdn)
|
|
|
|
def _get_exported_client(self, dc_id):
|
|
"""Creates and connects a new TelegramBareClient for the desired DC.
|
|
|
|
If it's the first time calling the method with a given dc_id,
|
|
a new session will be first created, and its auth key generated.
|
|
Exporting/Importing the authorization will also be done so that
|
|
the auth is bound with the key.
|
|
"""
|
|
# Thanks badoualy/kotlogram on /telegram/api/DefaultTelegramClient.kt
|
|
# for clearly showing how to export the authorization! ^^
|
|
session = self._exported_sessions.get(dc_id)
|
|
if session:
|
|
export_auth = None # Already bound with the auth key
|
|
else:
|
|
# TODO Add a lock, don't allow two threads to create an auth key
|
|
# (when calling .connect() if there wasn't a previous session).
|
|
# for the same data center.
|
|
dc = self._get_dc(dc_id)
|
|
|
|
# Export the current authorization to the new DC.
|
|
__log__.info('Exporting authorization for data center %s', dc)
|
|
export_auth = self(ExportAuthorizationRequest(dc_id))
|
|
|
|
# Create a temporary session for this IP address, which needs
|
|
# to be different because each auth_key is unique per DC.
|
|
#
|
|
# Construct this session with the connection parameters
|
|
# (system version, device model...) from the current one.
|
|
session = Session(self.session)
|
|
session.set_dc(dc.id, dc.ip_address, dc.port)
|
|
self._exported_sessions[dc_id] = session
|
|
|
|
__log__.info('Creating exported new client')
|
|
client = TelegramBareClient(
|
|
session, self.api_id, self.api_hash,
|
|
proxy=self._sender.connection.conn.proxy,
|
|
timeout=self._sender.connection.get_timeout()
|
|
)
|
|
client.connect(_sync_updates=False)
|
|
if isinstance(export_auth, ExportedAuthorization):
|
|
client(ImportAuthorizationRequest(
|
|
id=export_auth.id, bytes=export_auth.bytes
|
|
))
|
|
elif export_auth is not None:
|
|
__log__.warning('Unknown export auth type %s', export_auth)
|
|
|
|
client._authorized = True # We exported the auth, so we got auth
|
|
return client
|
|
|
|
def _get_cdn_client(self, cdn_redirect):
|
|
"""Similar to ._get_exported_client, but for CDNs"""
|
|
session = self._exported_sessions.get(cdn_redirect.dc_id)
|
|
if not session:
|
|
dc = self._get_dc(cdn_redirect.dc_id, cdn=True)
|
|
session = Session(self.session)
|
|
session.set_dc(dc.id, dc.ip_address, dc.port)
|
|
self._exported_sessions[cdn_redirect.dc_id] = session
|
|
|
|
__log__.info('Creating new CDN client')
|
|
client = TelegramBareClient(
|
|
session, self.api_id, self.api_hash,
|
|
proxy=self._sender.connection.conn.proxy,
|
|
timeout=self._sender.connection.get_timeout()
|
|
)
|
|
|
|
# This will make use of the new RSA keys for this specific CDN.
|
|
#
|
|
# We won't be calling GetConfigRequest because it's only called
|
|
# when needed by ._get_dc, and also it's static so it's likely
|
|
# set already. Avoid invoking non-CDN methods by not syncing updates.
|
|
client.connect(_sync_updates=False)
|
|
client._authorized = self._authorized
|
|
return client
|
|
|
|
# endregion
|
|
|
|
# region Invoking Telegram requests
|
|
|
|
def __call__(self, *requests, retries=5):
|
|
"""Invokes (sends) a MTProtoRequest and returns (receives) its result.
|
|
|
|
The invoke will be retried up to 'retries' times before raising
|
|
RuntimeError().
|
|
"""
|
|
if not all(isinstance(x, TLObject) and
|
|
x.content_related for x in requests):
|
|
raise TypeError('You can only invoke requests, not types!')
|
|
|
|
# For logging purposes
|
|
if len(requests) == 1:
|
|
which = type(requests[0]).__name__
|
|
else:
|
|
which = '{} requests ({})'.format(
|
|
len(requests), [type(x).__name__ for x in requests])
|
|
|
|
# Determine the sender to be used (main or a new connection)
|
|
on_main_thread = threading.get_ident() == self._main_thread_ident
|
|
if on_main_thread or self._on_read_thread():
|
|
__log__.debug('Invoking %s from main thread', which)
|
|
sender = self._sender
|
|
update_state = self.updates
|
|
else:
|
|
__log__.debug('Invoking %s from background thread. '
|
|
'Creating temporary connection', which)
|
|
|
|
sender = self._sender.clone()
|
|
sender.connect()
|
|
# We're on another connection, Telegram will resend all the
|
|
# updates that we haven't acknowledged (potentially entering
|
|
# an infinite loop if we're calling this in response to an
|
|
# update event, as it would be received again and again). So
|
|
# to avoid this we will simply not process updates on these
|
|
# new temporary connections, as they will be sent and later
|
|
# acknowledged over the main connection.
|
|
update_state = None
|
|
|
|
# We should call receive from this thread if there's no background
|
|
# thread reading or if the server disconnected us and we're trying
|
|
# to reconnect. This is because the read thread may either be
|
|
# locked also trying to reconnect or we may be said thread already.
|
|
call_receive = not on_main_thread or self._recv_thread is None \
|
|
or self._reconnect_lock.locked()
|
|
try:
|
|
for attempt in range(retries):
|
|
if self._background_error and on_main_thread:
|
|
raise self._background_error
|
|
|
|
result = self._invoke(
|
|
sender, call_receive, update_state, *requests
|
|
)
|
|
if result is not None:
|
|
return result
|
|
|
|
__log__.warning('Invoking %s failed %d times, '
|
|
'reconnecting and retrying',
|
|
[str(x) for x in requests], attempt + 1)
|
|
sleep(1)
|
|
# The ReadThread has priority when attempting reconnection,
|
|
# since this thread is constantly running while __call__ is
|
|
# only done sometimes. Here try connecting only once/retry.
|
|
if sender == self._sender:
|
|
if not self._reconnect_lock.locked():
|
|
with self._reconnect_lock:
|
|
self._reconnect()
|
|
else:
|
|
sender.connect()
|
|
|
|
raise RuntimeError('Number of retries reached 0.')
|
|
finally:
|
|
if sender != self._sender:
|
|
sender.disconnect() # Close temporary connections
|
|
|
|
# Let people use client.invoke(SomeRequest()) instead client(...)
|
|
invoke = __call__
|
|
|
|
def _invoke(self, sender, call_receive, update_state, *requests):
|
|
try:
|
|
# Ensure that we start with no previous errors (i.e. resending)
|
|
for x in requests:
|
|
x.confirm_received.clear()
|
|
x.rpc_error = None
|
|
|
|
if not self.session.auth_key:
|
|
__log__.info('Need to generate new auth key before invoking')
|
|
self._first_request = True
|
|
self.session.auth_key, self.session.time_offset = \
|
|
authenticator.do_authentication(self._sender.connection)
|
|
|
|
if self._first_request:
|
|
__log__.info('Initializing a new connection while invoking')
|
|
if len(requests) == 1:
|
|
requests = [self._wrap_init_connection(requests[0])]
|
|
else:
|
|
# We need a SINGLE request (like GetConfig) to init conn.
|
|
# Once that's done, the N original requests will be
|
|
# invoked.
|
|
TelegramBareClient._config = self(
|
|
self._wrap_init_connection(GetConfigRequest())
|
|
)
|
|
|
|
sender.send(*requests)
|
|
|
|
if not call_receive:
|
|
# TODO This will be slightly troublesome if we allow
|
|
# switching between constant read or not on the fly.
|
|
# Must also watch out for calling .read() from two places,
|
|
# in which case a Lock would be required for .receive().
|
|
for x in requests:
|
|
x.confirm_received.wait(
|
|
sender.connection.get_timeout()
|
|
)
|
|
else:
|
|
while not all(x.confirm_received.is_set() for x in requests):
|
|
sender.receive(update_state=update_state)
|
|
|
|
except BrokenAuthKeyError:
|
|
__log__.error('Authorization key seems broken and was invalid!')
|
|
self.session.auth_key = None
|
|
|
|
except TimeoutError:
|
|
__log__.warning('Invoking timed out') # We will just retry
|
|
|
|
except ConnectionResetError:
|
|
__log__.warning('Connection was reset while invoking')
|
|
if self._user_connected:
|
|
# Server disconnected us, __call__ will try reconnecting.
|
|
return None
|
|
else:
|
|
# User never called .connect(), so raise this error.
|
|
raise
|
|
|
|
# Clear the flag if we got this far
|
|
self._first_request = False
|
|
|
|
try:
|
|
raise next(x.rpc_error for x in requests if x.rpc_error)
|
|
except StopIteration:
|
|
if any(x.result is None for x in requests):
|
|
# "A container may only be accepted or
|
|
# rejected by the other party as a whole."
|
|
return None
|
|
|
|
if len(requests) == 1:
|
|
return requests[0].result
|
|
else:
|
|
return [x.result for x in requests]
|
|
|
|
except (PhoneMigrateError, NetworkMigrateError,
|
|
UserMigrateError) as e:
|
|
|
|
# TODO What happens with the background thread here?
|
|
# For normal use cases, this won't happen, because this will only
|
|
# be on the very first connection (not authorized, not running),
|
|
# but may be an issue for people who actually travel?
|
|
self._reconnect(new_dc=e.new_dc)
|
|
return self._invoke(sender, call_receive, update_state, *requests)
|
|
|
|
except ServerError as e:
|
|
# Telegram is having some issues, just retry
|
|
__log__.error('Telegram servers are having internal errors %s', e)
|
|
|
|
except FloodWaitError as e:
|
|
__log__.warning('Request invoked too often, wait %ds', e.seconds)
|
|
if e.seconds > self.session.flood_sleep_threshold | 0:
|
|
raise
|
|
|
|
sleep(e.seconds)
|
|
|
|
# Some really basic functionality
|
|
|
|
def is_user_authorized(self):
|
|
"""Has the user been authorized yet
|
|
(code request sent and confirmed)?"""
|
|
return self._authorized
|
|
|
|
# endregion
|
|
|
|
# region Uploading media
|
|
|
|
def upload_file(self,
|
|
file,
|
|
part_size_kb=None,
|
|
file_name=None,
|
|
progress_callback=None):
|
|
"""Uploads the specified file and returns a handle (an instance
|
|
of InputFile or InputFileBig, as required) which can be later used.
|
|
|
|
Uploading a file will simply return a "handle" to the file stored
|
|
remotely in the Telegram servers, which can be later used on. This
|
|
will NOT upload the file to your own chat.
|
|
|
|
'file' may be either a file path, a byte array, or a stream.
|
|
Note that if the file is a stream it will need to be read
|
|
entirely into memory to tell its size first.
|
|
|
|
If 'progress_callback' is not None, it should be a function that
|
|
takes two parameters, (bytes_uploaded, total_bytes).
|
|
|
|
Default values for the optional parameters if left as None are:
|
|
part_size_kb = get_appropriated_part_size(file_size)
|
|
file_name = os.path.basename(file_path)
|
|
"""
|
|
if isinstance(file, (InputFile, InputFileBig)):
|
|
return file # Already uploaded
|
|
|
|
if isinstance(file, str):
|
|
file_size = os.path.getsize(file)
|
|
elif isinstance(file, bytes):
|
|
file_size = len(file)
|
|
else:
|
|
file = file.read()
|
|
file_size = len(file)
|
|
|
|
# File will now either be a string or bytes
|
|
if not part_size_kb:
|
|
part_size_kb = get_appropriated_part_size(file_size)
|
|
|
|
if part_size_kb > 512:
|
|
raise ValueError('The part size must be less or equal to 512KB')
|
|
|
|
part_size = int(part_size_kb * 1024)
|
|
if part_size % 1024 != 0:
|
|
raise ValueError('The part size must be evenly divisible by 1024')
|
|
|
|
# Set a default file name if None was specified
|
|
file_id = utils.generate_random_long()
|
|
if not file_name:
|
|
if isinstance(file, str):
|
|
file_name = os.path.basename(file)
|
|
else:
|
|
file_name = str(file_id)
|
|
|
|
# Determine whether the file is too big (over 10MB) or not
|
|
# Telegram does make a distinction between smaller or larger files
|
|
is_large = file_size > 10 * 1024 * 1024
|
|
if not is_large:
|
|
# Calculate the MD5 hash before anything else.
|
|
# As this needs to be done always for small files,
|
|
# might as well do it before anything else and
|
|
# check the cache.
|
|
if isinstance(file, str):
|
|
with open(file, 'rb') as stream:
|
|
file = stream.read()
|
|
hash_md5 = md5(file)
|
|
tuple_ = self.session.get_file(hash_md5.digest(), file_size)
|
|
if tuple_:
|
|
__log__.info('File was already cached, not uploading again')
|
|
return InputFile(name=file_name,
|
|
md5_checksum=tuple_[0], id=tuple_[2], parts=tuple_[3])
|
|
else:
|
|
hash_md5 = None
|
|
|
|
part_count = (file_size + part_size - 1) // part_size
|
|
__log__.info('Uploading file of %d bytes in %d chunks of %d',
|
|
file_size, part_count, part_size)
|
|
|
|
with open(file, 'rb') if isinstance(file, str) else BytesIO(file) \
|
|
as stream:
|
|
for part_index in range(part_count):
|
|
# Read the file by in chunks of size part_size
|
|
part = stream.read(part_size)
|
|
|
|
# The SavePartRequest is different depending on whether
|
|
# the file is too large or not (over or less than 10MB)
|
|
if is_large:
|
|
request = SaveBigFilePartRequest(file_id, part_index,
|
|
part_count, part)
|
|
else:
|
|
request = SaveFilePartRequest(file_id, part_index, part)
|
|
|
|
result = self(request)
|
|
if result:
|
|
__log__.debug('Uploaded %d/%d', part_index + 1, part_count)
|
|
if progress_callback:
|
|
progress_callback(stream.tell(), file_size)
|
|
else:
|
|
raise RuntimeError(
|
|
'Failed to upload file part {}.'.format(part_index))
|
|
|
|
if is_large:
|
|
return InputFileBig(file_id, part_count, file_name)
|
|
else:
|
|
self.session.cache_file(
|
|
hash_md5.digest(), file_size, file_id, part_count)
|
|
|
|
return InputFile(file_id, part_count, file_name,
|
|
md5_checksum=hash_md5.hexdigest())
|
|
|
|
# endregion
|
|
|
|
# region Downloading media
|
|
|
|
def download_file(self,
|
|
input_location,
|
|
file,
|
|
part_size_kb=None,
|
|
file_size=None,
|
|
progress_callback=None):
|
|
"""Downloads the given InputFileLocation to file (a stream or str).
|
|
|
|
If 'progress_callback' is not None, it should be a function that
|
|
takes two parameters, (bytes_downloaded, total_bytes). Note that
|
|
'total_bytes' simply equals 'file_size', and may be None.
|
|
"""
|
|
if not part_size_kb:
|
|
if not file_size:
|
|
part_size_kb = 64 # Reasonable default
|
|
else:
|
|
part_size_kb = get_appropriated_part_size(file_size)
|
|
|
|
part_size = int(part_size_kb * 1024)
|
|
# https://core.telegram.org/api/files says:
|
|
# > part_size % 1024 = 0 (divisible by 1KB)
|
|
#
|
|
# But https://core.telegram.org/cdn (more recent) says:
|
|
# > limit must be divisible by 4096 bytes
|
|
# So we just stick to the 4096 limit.
|
|
if part_size % 4096 != 0:
|
|
raise ValueError('The part size must be evenly divisible by 4096.')
|
|
|
|
if isinstance(file, str):
|
|
# Ensure that we'll be able to download the media
|
|
utils.ensure_parent_dir_exists(file)
|
|
f = open(file, 'wb')
|
|
else:
|
|
f = file
|
|
|
|
# The used client will change if FileMigrateError occurs
|
|
client = self
|
|
cdn_decrypter = None
|
|
|
|
__log__.info('Downloading file in chunks of %d bytes', part_size)
|
|
try:
|
|
offset = 0
|
|
while True:
|
|
try:
|
|
if cdn_decrypter:
|
|
result = cdn_decrypter.get_file()
|
|
else:
|
|
result = client(GetFileRequest(
|
|
input_location, offset, part_size
|
|
))
|
|
|
|
if isinstance(result, FileCdnRedirect):
|
|
__log__.info('File lives in a CDN')
|
|
cdn_decrypter, result = \
|
|
CdnDecrypter.prepare_decrypter(
|
|
client, self._get_cdn_client(result), result
|
|
)
|
|
|
|
except FileMigrateError as e:
|
|
__log__.info('File lives in another DC')
|
|
client = self._get_exported_client(e.new_dc)
|
|
continue
|
|
|
|
offset += part_size
|
|
|
|
# If we have received no data (0 bytes), the file is over
|
|
# So there is nothing left to download and write
|
|
if not result.bytes:
|
|
# Return some extra information, unless it's a CDN file
|
|
return getattr(result, 'type', '')
|
|
|
|
f.write(result.bytes)
|
|
__log__.debug('Saved %d more bytes', len(result.bytes))
|
|
if progress_callback:
|
|
progress_callback(f.tell(), file_size)
|
|
finally:
|
|
if client != self:
|
|
client.disconnect()
|
|
|
|
if cdn_decrypter:
|
|
try:
|
|
cdn_decrypter.client.disconnect()
|
|
except:
|
|
pass
|
|
if isinstance(file, str):
|
|
f.close()
|
|
|
|
# endregion
|
|
|
|
# region Updates handling
|
|
|
|
def sync_updates(self):
|
|
"""Synchronizes self.updates to their initial state. Will be
|
|
called automatically on connection if self.updates.enabled = True,
|
|
otherwise it should be called manually after enabling updates.
|
|
"""
|
|
self.updates.process(self(GetStateRequest()))
|
|
|
|
def add_update_handler(self, handler):
|
|
"""Adds an update handler (a function which takes a TLObject,
|
|
an update, as its parameter) and listens for updates"""
|
|
if self.updates.workers is None:
|
|
warnings.warn(
|
|
"You have not setup any workers, so you won't receive updates."
|
|
" Pass update_workers=4 when creating the TelegramClient,"
|
|
" or set client.self.updates.workers = 4"
|
|
)
|
|
|
|
self.updates.handlers.append(handler)
|
|
|
|
def remove_update_handler(self, handler):
|
|
self.updates.handlers.remove(handler)
|
|
|
|
def list_update_handlers(self):
|
|
return self.updates.handlers[:]
|
|
|
|
# endregion
|
|
|
|
# region Constant read
|
|
|
|
def _set_connected_and_authorized(self):
|
|
self._authorized = True
|
|
self.updates.setup_workers()
|
|
if self._spawn_read_thread and self._recv_thread is None:
|
|
self._recv_thread = threading.Thread(
|
|
name='ReadThread', daemon=True,
|
|
target=self._recv_thread_impl
|
|
)
|
|
self._recv_thread.start()
|
|
|
|
def _signal_handler(self, signum, frame):
|
|
if self._user_connected:
|
|
self.disconnect()
|
|
else:
|
|
os._exit(1)
|
|
|
|
def idle(self, stop_signals=(SIGINT, SIGTERM, SIGABRT)):
|
|
"""
|
|
Idles the program by looping forever and listening for updates
|
|
until one of the signals are received, which breaks the loop.
|
|
|
|
:param stop_signals:
|
|
Iterable containing signals from the signal module that will
|
|
be subscribed to TelegramClient.disconnect() (effectively
|
|
stopping the idle loop), which will be called on receiving one
|
|
of those signals.
|
|
:return:
|
|
"""
|
|
if self._spawn_read_thread and not self._on_read_thread():
|
|
raise RuntimeError('Can only idle if spawn_read_thread=False')
|
|
|
|
for sig in stop_signals:
|
|
signal(sig, self._signal_handler)
|
|
|
|
if self._on_read_thread():
|
|
__log__.info('Starting to wait for items from the network')
|
|
else:
|
|
__log__.info('Idling to receive items from the network')
|
|
|
|
while self._user_connected:
|
|
try:
|
|
if datetime.now() > self._last_ping + self._ping_delay:
|
|
self._sender.send(PingRequest(
|
|
int.from_bytes(os.urandom(8), 'big', signed=True)
|
|
))
|
|
self._last_ping = datetime.now()
|
|
|
|
__log__.debug('Receiving items from the network...')
|
|
self._sender.receive(update_state=self.updates)
|
|
except TimeoutError:
|
|
# No problem
|
|
__log__.info('Receiving items from the network timed out')
|
|
except ConnectionResetError:
|
|
if self._user_connected:
|
|
__log__.error('Connection was reset while receiving '
|
|
'items. Reconnecting')
|
|
with self._reconnect_lock:
|
|
while self._user_connected and not self._reconnect():
|
|
sleep(0.1) # Retry forever, this is instant messaging
|
|
|
|
__log__.info('Connection closed by the user, not reading anymore')
|
|
|
|
# By using this approach, another thread will be
|
|
# created and started upon connection to constantly read
|
|
# from the other end. Otherwise, manual calls to .receive()
|
|
# must be performed. The MtProtoSender cannot be connected,
|
|
# or an error will be thrown.
|
|
#
|
|
# This way, sending and receiving will be completely independent.
|
|
def _recv_thread_impl(self):
|
|
# This thread is "idle" (only listening for updates), but also
|
|
# excepts everything unlike the manual idle because it should
|
|
# not crash.
|
|
while self._user_connected:
|
|
try:
|
|
self.idle(stop_signals=tuple())
|
|
except Exception as error:
|
|
__log__.exception('Unknown exception in the read thread! '
|
|
'Disconnecting and leaving it to main thread')
|
|
# Unknown exception, pass it to the main thread
|
|
|
|
try:
|
|
import socks
|
|
if isinstance(error, (
|
|
socks.GeneralProxyError, socks.ProxyConnectionError
|
|
)):
|
|
# This is a known error, and it's not related to
|
|
# Telegram but rather to the proxy. Disconnect and
|
|
# hand it over to the main thread.
|
|
self._background_error = error
|
|
self.disconnect()
|
|
break
|
|
except ImportError:
|
|
"Not using PySocks, so it can't be a proxy error"
|
|
|
|
self._recv_thread = None
|
|
|
|
# endregion
|