import hashlib import itertools import logging import os import sys import time from collections import OrderedDict, UserList from datetime import datetime, timedelta from io import BytesIO from mimetypes import guess_type from .crypto import CdnDecrypter from .tl.custom import InputSizedFile from .tl.functions.upload import ( SaveBigFilePartRequest, SaveFilePartRequest, GetFileRequest ) from .tl.types.upload import FileCdnRedirect try: import socks except ImportError: socks = None from . import TelegramBareClient from . import helpers, utils from .errors import ( RPCError, UnauthorizedError, PhoneCodeEmptyError, PhoneCodeExpiredError, PhoneCodeHashEmptyError, PhoneCodeInvalidError, LocationInvalidError, SessionPasswordNeededError, FileMigrateError ) from .network import ConnectionMode from .tl import TLObject from .tl.custom import Draft, Dialog from .tl.functions.account import ( GetPasswordRequest ) from .tl.functions.auth import ( CheckPasswordRequest, LogOutRequest, SendCodeRequest, SignInRequest, SignUpRequest, ResendCodeRequest, ImportBotAuthorizationRequest ) from .tl.functions.contacts import ( GetContactsRequest, ResolveUsernameRequest ) from .tl.functions.messages import ( GetDialogsRequest, GetHistoryRequest, SendMediaRequest, SendMessageRequest, GetChatsRequest, GetAllDraftsRequest, CheckChatInviteRequest, ReadMentionsRequest, SendMultiMediaRequest, UploadMediaRequest ) from .tl.functions import channels from .tl.functions import messages from .tl.functions.users import ( GetUsersRequest ) from .tl.functions.channels import ( GetChannelsRequest, GetFullChannelRequest ) from .tl.types import ( DocumentAttributeAudio, DocumentAttributeFilename, InputDocumentFileLocation, InputFileLocation, InputMediaUploadedDocument, InputMediaUploadedPhoto, InputPeerEmpty, Message, MessageMediaContact, MessageMediaDocument, MessageMediaPhoto, InputUserSelf, UserProfilePhoto, ChatPhoto, UpdateMessageID, UpdateNewChannelMessage, UpdateNewMessage, UpdateShortSentMessage, PeerUser, InputPeerUser, InputPeerChat, InputPeerChannel, MessageEmpty, ChatInvite, ChatInviteAlready, PeerChannel, Photo, InputPeerSelf, InputSingleMedia, InputMediaPhoto, InputPhoto, InputFile, InputFileBig, InputDocument, InputMediaDocument ) from .tl.types.messages import DialogsSlice from .extensions import markdown __log__ = logging.getLogger(__name__) class TelegramClient(TelegramBareClient): """ Initializes the Telegram client with the specified API ID and Hash. Args: session (:obj:`str` | :obj:`Session` | :obj:`None`): The file name of the session file to be used if a string is given (it may be a full path), or the Session instance to be used otherwise. If it's ``None``, the session will not be saved, and you should call :meth:`.log_out()` when you're done. api_id (:obj:`int` | :obj:`str`): The API ID you obtained from https://my.telegram.org. api_hash (:obj:`str`): The API ID you obtained from https://my.telegram.org. connection_mode (:obj:`ConnectionMode`, optional): The connection mode to be used when creating a new connection to the servers. Defaults to the ``TCP_FULL`` mode. This will only affect how messages are sent over the network and how much processing is required before sending them. use_ipv6 (:obj:`bool`, optional): Whether to connect to the servers through IPv6 or not. By default this is ``False`` as IPv6 support is not too widespread yet. proxy (:obj:`tuple` | :obj:`dict`, optional): A tuple consisting of ``(socks.SOCKS5, 'host', port)``. See https://github.com/Anorov/PySocks#usage-1 for more. update_workers (:obj:`int`, optional): If specified, represents how many extra threads should be spawned to handle incoming updates, and updates will be kept in memory until they are processed. Note that you must set this to at least ``0`` if you want to be able to process updates through :meth:`updates.poll()`. timeout (:obj:`int` | :obj:`float` | :obj:`timedelta`, optional): The timeout to be used when receiving responses from the network. Defaults to 5 seconds. spawn_read_thread (:obj:`bool`, optional): Whether to use an extra background thread or not. Defaults to ``True`` so receiving items from the network happens instantly, as soon as they arrive. Can still be disabled if you want to run the library without any additional thread. Kwargs: Extra parameters will be forwarded to the ``Session`` file. Most relevant parameters are: .. code-block:: python device_model = platform.node() system_version = platform.system() app_version = TelegramClient.__version__ lang_code = 'en' system_lang_code = lang_code report_errors = True """ # region Initialization def __init__(self, session, api_id, api_hash, connection_mode=ConnectionMode.TCP_FULL, use_ipv6=False, proxy=None, update_workers=None, timeout=timedelta(seconds=5), spawn_read_thread=True, **kwargs): super().__init__( session, api_id, api_hash, connection_mode=connection_mode, use_ipv6=use_ipv6, proxy=proxy, update_workers=update_workers, spawn_read_thread=spawn_read_thread, timeout=timeout, **kwargs ) # Some fields to easy signing in. Let {phone: hash} be # a dictionary because the user may change their mind. self._phone_code_hash = {} self._phone = None # endregion # region Telegram requests functions # region Authorization requests def send_code_request(self, phone, force_sms=False): """ Sends a code request to the specified phone number. Args: phone (:obj:`str` | :obj:`int`): The phone to which the code will be sent. force_sms (:obj:`bool`, optional): Whether to force sending as SMS. Returns: Information about the result of the request. """ phone = utils.parse_phone(phone) or self._phone phone_hash = self._phone_code_hash.get(phone) if not phone_hash: result = self(SendCodeRequest(phone, self.api_id, self.api_hash)) self._phone_code_hash[phone] = phone_hash = result.phone_code_hash else: force_sms = True self._phone = phone if force_sms: result = self(ResendCodeRequest(phone, phone_hash)) self._phone_code_hash[phone] = result.phone_code_hash return result def start(self, phone=lambda: input('Please enter your phone: '), password=None, bot_token=None, force_sms=False, code_callback=None): """ Convenience method to interactively connect and sign in if required, also taking into consideration that 2FA may be enabled in the account. Example usage: >>> client = TelegramClient(session, api_id, api_hash).start(phone) Please enter the code you received: 12345 Please enter your password: ******* (You are now logged in) Args: phone (:obj:`str` | :obj:`int` | :obj:`callable`): The phone (or callable without arguments to get it) to which the code will be sent. password (:obj:`callable`, optional): The password for 2 Factor Authentication (2FA). This is only required if it is enabled in your account. bot_token (:obj:`str`): Bot Token obtained by @BotFather to log in as a bot. Cannot be specified with `phone` (only one of either allowed). force_sms (:obj:`bool`, optional): Whether to force sending the code request as SMS. This only makes sense when signing in with a `phone`. code_callback (:obj:`callable`, optional): A callable that will be used to retrieve the Telegram login code. Defaults to `input()`. Returns: :obj:`TelegramClient`: This client, so initialization can be chained with `.start()`. """ if code_callback is None: def code_callback(): return input('Please enter the code you received: ') elif not callable(code_callback): raise ValueError( 'The code_callback parameter needs to be a callable ' 'function that returns the code you received by Telegram.' ) if not phone and not bot_token: raise ValueError('No phone number or bot token provided.') if phone and bot_token: raise ValueError('Both a phone and a bot token provided, ' 'must only provide one of either') if not self.is_connected(): self.connect() if self.is_user_authorized(): return self if bot_token: self.sign_in(bot_token=bot_token) return self # Turn the callable into a valid phone number while callable(phone): phone = utils.parse_phone(phone()) or phone me = None attempts = 0 max_attempts = 3 two_step_detected = False self.send_code_request(phone, force_sms=force_sms) while attempts < max_attempts: try: # Raises SessionPasswordNeededError if 2FA enabled me = self.sign_in(phone, code_callback()) break except SessionPasswordNeededError: two_step_detected = True break except (PhoneCodeEmptyError, PhoneCodeExpiredError, PhoneCodeHashEmptyError, PhoneCodeInvalidError): print('Invalid code. Please try again.', file=sys.stderr) attempts += 1 else: raise RuntimeError( '{} consecutive sign-in attempts failed. Aborting' .format(max_attempts) ) if two_step_detected: if not password: raise ValueError( "Two-step verification is enabled for this account. " "Please provide the 'password' argument to 'start()'." ) me = self.sign_in(phone=phone, password=password) # We won't reach here if any step failed (exit by exception) print('Signed in successfully as', utils.get_display_name(me)) return self def sign_in(self, phone=None, code=None, password=None, bot_token=None, phone_code_hash=None): """ Starts or completes the sign in process with the given phone number or code that Telegram sent. Args: phone (:obj:`str` | :obj:`int`): The phone to send the code to if no code was provided, or to override the phone that was previously used with these requests. code (:obj:`str` | :obj:`int`): The code that Telegram sent. password (:obj:`str`): 2FA password, should be used if a previous call raised SessionPasswordNeededError. bot_token (:obj:`str`): Used to sign in as a bot. Not all requests will be available. This should be the hash the @BotFather gave you. phone_code_hash (:obj:`str`): The hash returned by .send_code_request. This can be set to None to use the last hash known. Returns: The signed in user, or the information about :meth:`.send_code_request()`. """ if phone and not code and not password: return self.send_code_request(phone) elif code: phone = utils.parse_phone(phone) or self._phone phone_code_hash = \ phone_code_hash or self._phone_code_hash.get(phone, None) if not phone: raise ValueError( 'Please make sure to call send_code_request first.' ) if not phone_code_hash: raise ValueError('You also need to provide a phone_code_hash.') # May raise PhoneCodeEmptyError, PhoneCodeExpiredError, # PhoneCodeHashEmptyError or PhoneCodeInvalidError. result = self(SignInRequest(phone, phone_code_hash, str(code))) elif password: salt = self(GetPasswordRequest()).current_salt result = self(CheckPasswordRequest( helpers.get_password_hash(password, salt) )) elif bot_token: result = self(ImportBotAuthorizationRequest( flags=0, bot_auth_token=bot_token, api_id=self.api_id, api_hash=self.api_hash )) else: raise ValueError( 'You must provide a phone and a code the first time, ' 'and a password only if an RPCError was raised before.' ) self._set_connected_and_authorized() return result.user def sign_up(self, code, first_name, last_name=''): """ Signs up to Telegram if you don't have an account yet. You must call .send_code_request(phone) first. Args: code (:obj:`str` | :obj:`int`): The code sent by Telegram first_name (:obj:`str`): The first name to be used by the new account. last_name (:obj:`str`, optional) Optional last name. Returns: The new created user. """ result = self(SignUpRequest( phone_number=self._phone, phone_code_hash=self._phone_code_hash.get(self._phone, ''), phone_code=code, first_name=first_name, last_name=last_name )) self._set_connected_and_authorized() return result.user def log_out(self): """ Logs out Telegram and deletes the current *.session file. Returns: True if the operation was successful. """ try: self(LogOutRequest()) except RPCError: return False self.disconnect() self.session.delete() self.session = None return True def get_me(self): """ Gets "me" (the self user) which is currently authenticated, or None if the request fails (hence, not authenticated). Returns: :obj:`User`: Your own user. """ try: return self(GetUsersRequest([InputUserSelf()]))[0] except UnauthorizedError: return None # endregion # region Dialogs ("chats") requests def get_dialogs(self, limit=10, offset_date=None, offset_id=0, offset_peer=InputPeerEmpty()): """ Gets N "dialogs" (open "chats" or conversations with other people). Args: limit (:obj:`int` | :obj:`None`): How many dialogs to be retrieved as maximum. Can be set to ``None`` to retrieve all dialogs. Note that this may take whole minutes if you have hundreds of dialogs, as Telegram will tell the library to slow down through a ``FloodWaitError``. offset_date (:obj:`datetime`, optional): The offset date to be used. offset_id (:obj:`int`, optional): The message ID to be used as an offset. offset_peer (:obj:`InputPeer`, optional): The peer to be used as an offset. Returns: A list dialogs, with an additional .total attribute on the list. """ limit = float('inf') if limit is None else int(limit) if limit == 0: # Special case, get a single dialog and determine count dialogs = self(GetDialogsRequest( offset_date=offset_date, offset_id=offset_id, offset_peer=offset_peer, limit=1 )) result = UserList() result.total = getattr(dialogs, 'count', len(dialogs.dialogs)) return result total_count = 0 dialogs = OrderedDict() # Use peer id as identifier to avoid dupes while len(dialogs) < limit: real_limit = min(limit - len(dialogs), 100) r = self(GetDialogsRequest( offset_date=offset_date, offset_id=offset_id, offset_peer=offset_peer, limit=real_limit )) total_count = getattr(r, 'count', len(r.dialogs)) messages = {m.id: m for m in r.messages} entities = {utils.get_peer_id(x): x for x in itertools.chain(r.users, r.chats)} for d in r.dialogs: dialogs[utils.get_peer_id(d.peer)] = \ Dialog(self, d, entities, messages) if len(r.dialogs) < real_limit or not isinstance(r, DialogsSlice): # Less than we requested means we reached the end, or # we didn't get a DialogsSlice which means we got all. break offset_date = r.messages[-1].date offset_peer = entities[utils.get_peer_id(r.dialogs[-1].peer)] offset_id = r.messages[-1].id & 4294967296 # Telegram/danog magic dialogs = UserList( itertools.islice(dialogs.values(), min(limit, len(dialogs))) ) dialogs.total = total_count return dialogs def get_drafts(self): # TODO: Ability to provide a `filter` """ Gets all open draft messages. Returns: A list of custom ``Draft`` objects that are easy to work with: You can call :meth:`draft.set_message('text')` to change the message, or delete it through :meth:`draft.delete()`. """ response = self(GetAllDraftsRequest()) self.session.process_entities(response) self.session.generate_sequence(response.seq) drafts = [Draft._from_update(self, u) for u in response.updates] return drafts @staticmethod def _get_response_message(request, result): """ Extracts the response message known a request and Update result. The request may also be the ID of the message to match. """ # Telegram seems to send updateMessageID first, then updateNewMessage, # however let's not rely on that just in case. if isinstance(request, int): msg_id = request else: msg_id = None for update in result.updates: if isinstance(update, UpdateMessageID): if update.random_id == request.random_id: msg_id = update.id break for update in result.updates: if isinstance(update, (UpdateNewChannelMessage, UpdateNewMessage)): if update.message.id == msg_id: return update.message def send_message(self, entity, message, reply_to=None, parse_mode=None, link_preview=True): """ Sends the given message to the specified entity (user/chat/channel). Args: entity (:obj:`entity`): To who will it be sent. message (:obj:`str`): The message to be sent. reply_to (:obj:`int` | :obj:`Message`, optional): Whether to reply to a message or not. If an integer is provided, it should be the ID of the message that it should reply to. parse_mode (:obj:`str`, optional): Can be 'md' or 'markdown' for markdown-like parsing, in a similar fashion how official clients work. link_preview (:obj:`bool`, optional): Should the link preview be shown? Returns: the sent message """ entity = self.get_input_entity(entity) if parse_mode: parse_mode = parse_mode.lower() if parse_mode in {'md', 'markdown'}: message, msg_entities = markdown.parse(message) else: raise ValueError('Unknown parsing mode: {}'.format(parse_mode)) else: msg_entities = [] request = SendMessageRequest( peer=entity, message=message, entities=msg_entities, no_webpage=not link_preview, reply_to_msg_id=self._get_reply_to(reply_to) ) result = self(request) if isinstance(result, UpdateShortSentMessage): return Message( id=result.id, to_id=entity, message=message, date=result.date, out=result.out, media=result.media, entities=result.entities ) return self._get_response_message(request, result) def delete_messages(self, entity, message_ids, revoke=True): """ Deletes a message from a chat, optionally "for everyone". Args: entity (:obj:`entity`): From who the message will be deleted. This can actually be ``None`` for normal chats, but **must** be present for channels and megagroups. message_ids (:obj:`list` | :obj:`int` | :obj:`Message`): The IDs (or ID) or messages to be deleted. revoke (:obj:`bool`, optional): Whether the message should be deleted for everyone or not. By default it has the opposite behaviour of official clients, and it will delete the message for everyone. This has no effect on channels or megagroups. Returns: The affected messages. """ if not isinstance(message_ids, list): message_ids = [message_ids] message_ids = [m.id if isinstance(m, Message) else int(m) for m in message_ids] if entity is None: return self(messages.DeleteMessagesRequest(message_ids, revoke=revoke)) entity = self.get_input_entity(entity) if isinstance(entity, InputPeerChannel): return self(channels.DeleteMessagesRequest(entity, message_ids)) else: return self(messages.DeleteMessagesRequest(message_ids, revoke=revoke)) def get_message_history(self, entity, limit=20, offset_date=None, offset_id=0, max_id=0, min_id=0, add_offset=0): """ Gets the message history for the specified entity Args: entity (:obj:`entity`): The entity from whom to retrieve the message history. limit (:obj:`int` | :obj:`None`, optional): Number of messages to be retrieved. Due to limitations with the API retrieving more than 3000 messages will take longer than half a minute (or even more based on previous calls). The limit may also be ``None``, which would eventually return the whole history. offset_date (:obj:`datetime`): Offset date (messages *previous* to this date will be retrieved). Exclusive. offset_id (:obj:`int`): Offset message ID (only messages *previous* to the given ID will be retrieved). Exclusive. max_id (:obj:`int`): All the messages with a higher (newer) ID or equal to this will be excluded min_id (:obj:`int`): All the messages with a lower (older) ID or equal to this will be excluded. add_offset (:obj:`int`): Additional message offset (all of the specified offsets + this offset = older messages). Returns: A list of messages with extra attributes: * ``.total`` = (on the list) total amount of messages sent. * ``.sender`` = entity of the sender. * ``.fwd_from.sender`` = if fwd_from, who sent it originally. * ``.fwd_from.channel`` = if fwd_from, original channel. * ``.to`` = entity to which the message was sent. """ entity = self.get_input_entity(entity) limit = float('inf') if limit is None else int(limit) if limit == 0: # No messages, but we still need to know the total message count result = self(GetHistoryRequest( peer=entity, limit=1, offset_date=None, offset_id=0, max_id=0, min_id=0, add_offset=0 )) return getattr(result, 'count', len(result.messages)), [], [] total_messages = 0 messages = UserList() entities = {} while len(messages) < limit: # Telegram has a hard limit of 100 real_limit = min(limit - len(messages), 100) result = self(GetHistoryRequest( peer=entity, limit=real_limit, offset_date=offset_date, offset_id=offset_id, max_id=max_id, min_id=min_id, add_offset=add_offset, hash=0 )) messages.extend( m for m in result.messages if not isinstance(m, MessageEmpty) ) total_messages = getattr(result, 'count', len(result.messages)) # TODO We can potentially use self.session.database, but since # it might be disabled, use a local dictionary. for u in result.users: entities[utils.get_peer_id(u)] = u for c in result.chats: entities[utils.get_peer_id(c)] = c if len(result.messages) < real_limit: break offset_id = result.messages[-1].id offset_date = result.messages[-1].date # Telegram limit seems to be 3000 messages within 30 seconds in # batches of 100 messages each request (since the FloodWait was # of 30 seconds). If the limit is greater than that, we will # sleep 1s between each request. if limit > 3000: time.sleep(1) # Add a few extra attributes to the Message to make it friendlier. messages.total = total_messages for m in messages: m.sender = (None if not m.from_id else entities[utils.get_peer_id(m.from_id)]) if getattr(m, 'fwd_from', None): m.fwd_from.sender = ( None if not m.fwd_from.from_id else entities[utils.get_peer_id(m.fwd_from.from_id)] ) m.fwd_from.channel = ( None if not m.fwd_from.channel_id else entities[utils.get_peer_id( PeerChannel(m.fwd_from.channel_id) )] ) m.to = entities[utils.get_peer_id(m.to_id)] return messages def send_read_acknowledge(self, entity, message=None, max_id=None, clear_mentions=False): """ Sends a "read acknowledge" (i.e., notifying the given peer that we've read their messages, also known as the "double check"). Args: entity (:obj:`entity`): The chat where these messages are located. message (:obj:`list` | :obj:`Message`): Either a list of messages or a single message. max_id (:obj:`int`): Overrides messages, until which message should the acknowledge should be sent. clear_mentions (:obj:`bool`): Whether the mention badge should be cleared (so that there are no more mentions) or not for the given entity. If no message is provided, this will be the only action taken. """ if max_id is None: if message: if hasattr(message, '__iter__'): max_id = max(msg.id for msg in message) else: max_id = message.id elif not clear_mentions: raise ValueError( 'Either a message list or a max_id must be provided.') entity = self.get_input_entity(entity) if clear_mentions: self(ReadMentionsRequest(entity)) if max_id is None: return True if max_id is not None: if isinstance(entity, InputPeerChannel): return self(channels.ReadHistoryRequest(entity, max_id=max_id)) else: return self(messages.ReadHistoryRequest(entity, max_id=max_id)) return False @staticmethod def _get_reply_to(reply_to): """Sanitizes the 'reply_to' parameter a user may send""" if reply_to is None: return None if isinstance(reply_to, int): return reply_to try: if reply_to.SUBCLASS_OF_ID == 0x790009e3: # hex(crc32(b'Message')) = 0x790009e3 return reply_to.id except AttributeError: pass raise TypeError('Invalid reply_to type: {}'.format(type(reply_to))) # endregion # region Uploading files def send_file(self, entity, file, caption='', force_document=False, progress_callback=None, reply_to=None, attributes=None, thumb=None, allow_cache=True, **kwargs): """ Sends a file to the specified entity. Args: entity (:obj:`entity`): Who will receive the file. file (:obj:`str` | :obj:`bytes` | :obj:`file`): The path of the file, byte array, or stream that will be sent. Note that if a byte array or a stream is given, a filename or its type won't be inferred, and it will be sent as an "unnamed application/octet-stream". Subsequent calls with the very same file will result in immediate uploads, unless ``.clear_file_cache()`` is called. caption (:obj:`str`, optional): Optional caption for the sent media message. force_document (:obj:`bool`, optional): If left to ``False`` and the file is a path that ends with ``.png``, ``.jpg`` and such, the file will be sent as a photo. Otherwise always as a document. progress_callback (:obj:`callable`, optional): A callback function accepting two parameters: ``(sent bytes, total)``. reply_to (:obj:`int` | :obj:`Message`): Same as reply_to from .send_message(). attributes (:obj:`list`, optional): Optional attributes that override the inferred ones, like ``DocumentAttributeFilename`` and so on. thumb (:obj:`str` | :obj:`bytes` | :obj:`file`, optional): Optional thumbnail (for videos). allow_cache (:obj:`bool`, optional): Whether to allow using the cached version stored in the database or not. Defaults to ``True`` to avoid re-uploads. Must be ``False`` if you wish to use different attributes or thumb than those that were used when the file was cached. Kwargs: If "is_voice_note" in kwargs, despite its value, and the file is sent as a document, it will be sent as a voice note. Returns: The message (or messages) containing the sent file. """ # First check if the user passed an iterable, in which case # we may want to send as an album if all are photo files. if hasattr(file, '__iter__') and not isinstance(file, (str, bytes)): # Convert to tuple so we can iterate several times file = tuple(x for x in file) if all(utils.is_image(x) for x in file): return self._send_album( entity, file, caption=caption, progress_callback=progress_callback, reply_to=reply_to ) # Not all are images, so send all the files one by one return [ self.send_file( entity, x, allow_cache=False, caption=caption, force_document=force_document, progress_callback=progress_callback, reply_to=reply_to, attributes=attributes, thumb=thumb, **kwargs ) for x in file ] as_image = utils.is_image(file) and not force_document use_cache = InputPhoto if as_image else InputDocument file_handle = self.upload_file( file, progress_callback=progress_callback, use_cache=use_cache if allow_cache else None ) if isinstance(file_handle, use_cache): # File was cached, so an instance of use_cache was returned if as_image: media = InputMediaPhoto(file_handle, caption) else: media = InputMediaDocument(file_handle, caption) elif as_image: media = InputMediaUploadedPhoto(file_handle, caption) else: mime_type = None if isinstance(file, str): # Determine mime-type and attributes # Take the first element by using [0] since it returns a tuple mime_type = guess_type(file)[0] attr_dict = { DocumentAttributeFilename: DocumentAttributeFilename(os.path.basename(file)) # TODO If the input file is an audio, find out: # Performer and song title and add DocumentAttributeAudio } else: attr_dict = { DocumentAttributeFilename: DocumentAttributeFilename('unnamed') } if 'is_voice_note' in kwargs: attr_dict[DocumentAttributeAudio] = \ DocumentAttributeAudio(0, voice=True) # Now override the attributes if any. As we have a dict of # {cls: instance}, we can override any class with the list # of attributes provided by the user easily. if attributes: for a in attributes: attr_dict[type(a)] = a # Ensure we have a mime type, any; but it cannot be None # 'The "octet-stream" subtype is used to indicate that a body # contains arbitrary binary data.' if not mime_type: mime_type = 'application/octet-stream' input_kw = {} if thumb: input_kw['thumb'] = self.upload_file(thumb) media = InputMediaUploadedDocument( file=file_handle, mime_type=mime_type, attributes=list(attr_dict.values()), caption=caption, **input_kw ) # Once the media type is properly specified and the file uploaded, # send the media message to the desired entity. request = SendMediaRequest( peer=self.get_input_entity(entity), media=media, reply_to_msg_id=self._get_reply_to(reply_to) ) msg = self._get_response_message(request, self(request)) if msg and isinstance(file_handle, InputSizedFile): # There was a response message and we didn't use cached # version, so cache whatever we just sent to the database. md5, size = file_handle.md5, file_handle.size if as_image: to_cache = utils.get_input_photo(msg.media.photo) else: to_cache = utils.get_input_document(msg.media.document) self.session.cache_file(md5, size, to_cache) return msg def send_voice_note(self, entity, file, caption='', progress_callback=None, reply_to=None): """Wrapper method around .send_file() with is_voice_note=()""" return self.send_file(entity, file, caption, progress_callback=progress_callback, reply_to=reply_to, is_voice_note=()) # empty tuple is enough def _send_album(self, entity, files, caption='', progress_callback=None, reply_to=None): """Specialized version of .send_file for albums""" # We don't care if the user wants to avoid cache, we will use it # anyway. Why? The cached version will be exactly the same thing # we need to produce right now to send albums (uploadMedia), and # cache only makes a difference for documents where the user may # want the attributes used on them to change. Caption's ignored. entity = self.get_input_entity(entity) reply_to = self._get_reply_to(reply_to) # Need to upload the media first, but only if they're not cached yet media = [] for file in files: # fh will either be InputPhoto or a modified InputFile fh = self.upload_file(file, use_cache=InputPhoto) if not isinstance(fh, InputPhoto): input_photo = utils.get_input_photo(self(UploadMediaRequest( entity, media=InputMediaUploadedPhoto(fh, caption) )).photo) self.session.cache_file(fh.md5, fh.size, input_photo) fh = input_photo media.append(InputSingleMedia(InputMediaPhoto(fh, caption))) # Now we can construct the multi-media request result = self(SendMultiMediaRequest( entity, reply_to_msg_id=reply_to, multi_media=media )) return [ self._get_response_message(update.id, result) for update in result.updates if isinstance(update, UpdateMessageID) ] def upload_file(self, file, part_size_kb=None, file_name=None, use_cache=None, progress_callback=None): """ Uploads the specified file and returns a handle (an instance of InputFile or InputFileBig, as required) which can be later used before it expires (they are usable during less than a day). Uploading a file will simply return a "handle" to the file stored remotely in the Telegram servers, which can be later used on. This will **not** upload the file to your own chat or any chat at all. Args: file (:obj:`str` | :obj:`bytes` | :obj:`file`): The path of the file, byte array, or stream that will be sent. Note that if a byte array or a stream is given, a filename or its type won't be inferred, and it will be sent as an "unnamed application/octet-stream". Subsequent calls with the very same file will result in immediate uploads, unless ``.clear_file_cache()`` is called. part_size_kb (:obj:`int`, optional): Chunk size when uploading files. The larger, the less requests will be made (up to 512KB maximum). file_name (:obj:`str`, optional): The file name which will be used on the resulting InputFile. If not specified, the name will be taken from the ``file`` and if this is not a ``str``, it will be ``"unnamed"``. use_cache (:obj:`type`, optional): The type of cache to use (currently either ``InputDocument`` or ``InputPhoto``). If present and the file is small enough to need the MD5, it will be checked against the database, and if a match is found, the upload won't be made. Instead, an instance of type ``use_cache`` will be returned. progress_callback (:obj:`callable`, optional): A callback function accepting two parameters: ``(sent bytes, total)``. Returns: ``InputFileBig`` if the file size is larger than 10MB, ``InputSizedFile`` (subclass of ``InputFile``) otherwise. """ if isinstance(file, (InputFile, InputFileBig)): return file # Already uploaded if isinstance(file, str): file_size = os.path.getsize(file) elif isinstance(file, bytes): file_size = len(file) else: file = file.read() file_size = len(file) # File will now either be a string or bytes if not part_size_kb: part_size_kb = utils.get_appropriated_part_size(file_size) if part_size_kb > 512: raise ValueError('The part size must be less or equal to 512KB') part_size = int(part_size_kb * 1024) if part_size % 1024 != 0: raise ValueError( 'The part size must be evenly divisible by 1024') # Set a default file name if None was specified file_id = helpers.generate_random_long() if not file_name: if isinstance(file, str): file_name = os.path.basename(file) else: file_name = str(file_id) # Determine whether the file is too big (over 10MB) or not # Telegram does make a distinction between smaller or larger files is_large = file_size > 10 * 1024 * 1024 hash_md5 = hashlib.md5() if not is_large: # Calculate the MD5 hash before anything else. # As this needs to be done always for small files, # might as well do it before anything else and # check the cache. if isinstance(file, str): with open(file, 'rb') as stream: file = stream.read() hash_md5.update(file) if use_cache: cached = self.session.get_file( hash_md5.digest(), file_size, cls=use_cache ) if cached: return cached part_count = (file_size + part_size - 1) // part_size __log__.info('Uploading file of %d bytes in %d chunks of %d', file_size, part_count, part_size) with open(file, 'rb') if isinstance(file, str) else BytesIO(file) \ as stream: for part_index in range(part_count): # Read the file by in chunks of size part_size part = stream.read(part_size) # The SavePartRequest is different depending on whether # the file is too large or not (over or less than 10MB) if is_large: request = SaveBigFilePartRequest(file_id, part_index, part_count, part) else: request = SaveFilePartRequest(file_id, part_index, part) result = self(request) if result: __log__.debug('Uploaded %d/%d', part_index + 1, part_count) if progress_callback: progress_callback(stream.tell(), file_size) else: raise RuntimeError( 'Failed to upload file part {}.'.format(part_index)) if is_large: return InputFileBig(file_id, part_count, file_name) else: return InputSizedFile( file_id, part_count, file_name, md5=hash_md5, size=file_size ) # endregion # region Downloading media requests def download_profile_photo(self, entity, file=None, download_big=True): """ Downloads the profile photo of the given entity (user/chat/channel). Args: entity (:obj:`entity`): From who the photo will be downloaded. file (:obj:`str` | :obj:`file`, optional): The output file path, directory, or stream-like object. If the path exists and is a file, it will be overwritten. download_big (:obj:`bool`, optional): Whether to use the big version of the available photos. Returns: ``None`` if no photo was provided, or if it was Empty. On success the file path is returned since it may differ from the one given. """ photo = entity possible_names = [] try: is_entity = entity.SUBCLASS_OF_ID in ( 0x2da17977, 0xc5af5d94, 0x1f4661b9, 0xd49a2697 ) except AttributeError: return None # Not even a TLObject as attribute access failed if is_entity: # Maybe it is an user or a chat? Or their full versions? # # The hexadecimal numbers above are simply: # hex(crc32(x.encode('ascii'))) for x in # ('User', 'Chat', 'UserFull', 'ChatFull') entity = self.get_entity(entity) if not hasattr(entity, 'photo'): # Special case: may be a ChatFull with photo:Photo # This is different from a normal UserProfilePhoto and Chat if hasattr(entity, 'chat_photo'): return self._download_photo( entity.chat_photo, file, date=None, progress_callback=None ) else: # Give up return None for attr in ('username', 'first_name', 'title'): possible_names.append(getattr(entity, attr, None)) photo = entity.photo if not isinstance(photo, UserProfilePhoto) and \ not isinstance(photo, ChatPhoto): return None photo_location = photo.photo_big if download_big else photo.photo_small file = self._get_proper_filename( file, 'profile_photo', '.jpg', possible_names=possible_names ) # Download the media with the largest size input file location try: self.download_file( InputFileLocation( volume_id=photo_location.volume_id, local_id=photo_location.local_id, secret=photo_location.secret ), file ) except LocationInvalidError: # See issue #500, Android app fails as of v4.6.0 (1155). # The fix seems to be using the full channel chat photo. ie = self.get_input_entity(entity) if isinstance(ie, InputPeerChannel): full = self(GetFullChannelRequest(ie)) return self._download_photo( full.full_chat.chat_photo, file, date=None, progress_callback=None ) else: # Until there's a report for chats, no need to. return None return file def download_media(self, message, file=None, progress_callback=None): """ Downloads the given media, or the media from a specified Message. message (:obj:`Message` | :obj:`Media`): The media or message containing the media that will be downloaded. file (:obj:`str` | :obj:`file`, optional): The output file path, directory, or stream-like object. If the path exists and is a file, it will be overwritten. progress_callback (:obj:`callable`, optional): A callback function accepting two parameters: ``(recv bytes, total)``. Returns: ``None`` if no media was provided, or if it was Empty. On success the file path is returned since it may differ from the one given. """ # TODO This won't work for messageService if isinstance(message, Message): date = message.date media = message.media else: date = datetime.now() media = message if isinstance(media, (MessageMediaPhoto, Photo)): return self._download_photo( media, file, date, progress_callback ) elif isinstance(media, MessageMediaDocument): return self._download_document( media, file, date, progress_callback ) elif isinstance(media, MessageMediaContact): return self._download_contact( media, file ) def _download_photo(self, photo, file, date, progress_callback): """Specialized version of .download_media() for photos""" # Determine the photo and its largest size if isinstance(photo, MessageMediaPhoto): photo = photo.photo if not isinstance(photo, Photo): return largest_size = photo.sizes[-1] file_size = largest_size.size largest_size = largest_size.location file = self._get_proper_filename(file, 'photo', '.jpg', date=date) # Download the media with the largest size input file location self.download_file( InputFileLocation( volume_id=largest_size.volume_id, local_id=largest_size.local_id, secret=largest_size.secret ), file, file_size=file_size, progress_callback=progress_callback ) return file def _download_document(self, mm_doc, file, date, progress_callback): """Specialized version of .download_media() for documents""" document = mm_doc.document file_size = document.size possible_names = [] for attr in document.attributes: if isinstance(attr, DocumentAttributeFilename): possible_names.insert(0, attr.file_name) elif isinstance(attr, DocumentAttributeAudio): possible_names.append('{} - {}'.format( attr.performer, attr.title )) file = self._get_proper_filename( file, 'document', utils.get_extension(mm_doc), date=date, possible_names=possible_names ) self.download_file( InputDocumentFileLocation( id=document.id, access_hash=document.access_hash, version=document.version ), file, file_size=file_size, progress_callback=progress_callback ) return file @staticmethod def _download_contact(mm_contact, file): """Specialized version of .download_media() for contacts. Will make use of the vCard 4.0 format """ first_name = mm_contact.first_name last_name = mm_contact.last_name phone_number = mm_contact.phone_number if isinstance(file, str): file = TelegramClient._get_proper_filename( file, 'contact', '.vcard', possible_names=[first_name, phone_number, last_name] ) f = open(file, 'w', encoding='utf-8') else: f = file try: # Remove these pesky characters first_name = first_name.replace(';', '') last_name = (last_name or '').replace(';', '') f.write('BEGIN:VCARD\n') f.write('VERSION:4.0\n') f.write('N:{};{};;;\n'.format(first_name, last_name)) f.write('FN:{} {}\n'.format(first_name, last_name)) f.write('TEL;TYPE=cell;VALUE=uri:tel:+{}\n'.format(phone_number)) f.write('END:VCARD\n') finally: # Only close the stream if we opened it if isinstance(file, str): f.close() return file @staticmethod def _get_proper_filename(file, kind, extension, date=None, possible_names=None): """Gets a proper filename for 'file', if this is a path. 'kind' should be the kind of the output file (photo, document...) 'extension' should be the extension to be added to the file if the filename doesn't have any yet 'date' should be when this file was originally sent, if known 'possible_names' should be an ordered list of possible names If no modification is made to the path, any existing file will be overwritten. If any modification is made to the path, this method will ensure that no existing file will be overwritten. """ if file is not None and not isinstance(file, str): # Probably a stream-like object, we cannot set a filename here return file if file is None: file = '' elif os.path.isfile(file): # Make no modifications to valid existing paths return file if os.path.isdir(file) or not file: try: name = None if possible_names is None else next( x for x in possible_names if x ) except StopIteration: name = None if not name: if not date: date = datetime.now() name = '{}_{}-{:02}-{:02}_{:02}-{:02}-{:02}'.format( kind, date.year, date.month, date.day, date.hour, date.minute, date.second, ) file = os.path.join(file, name) directory, name = os.path.split(file) name, ext = os.path.splitext(name) if not ext: ext = extension result = os.path.join(directory, name + ext) if not os.path.isfile(result): return result i = 1 while True: result = os.path.join(directory, '{} ({}){}'.format(name, i, ext)) if not os.path.isfile(result): return result i += 1 def download_file(self, input_location, file, part_size_kb=None, file_size=None, progress_callback=None): """ Downloads the given input location to a file. Args: input_location (:obj:`InputFileLocation`): The file location from which the file will be downloaded. file (:obj:`str` | :obj:`file`, optional): The output file path, directory, or stream-like object. If the path exists and is a file, it will be overwritten. part_size_kb (:obj:`int`, optional): Chunk size when downloading files. The larger, the less requests will be made (up to 512KB maximum). file_size (:obj:`int`, optional): The file size that is about to be downloaded, if known. Only used if ``progress_callback`` is specified. progress_callback (:obj:`callable`, optional): A callback function accepting two parameters: ``(downloaded bytes, total)``. Note that the ``total`` is the provided ``file_size``. """ if not part_size_kb: if not file_size: part_size_kb = 64 # Reasonable default else: part_size_kb = utils.get_appropriated_part_size(file_size) part_size = int(part_size_kb * 1024) # https://core.telegram.org/api/files says: # > part_size % 1024 = 0 (divisible by 1KB) # # But https://core.telegram.org/cdn (more recent) says: # > limit must be divisible by 4096 bytes # So we just stick to the 4096 limit. if part_size % 4096 != 0: raise ValueError( 'The part size must be evenly divisible by 4096.') if isinstance(file, str): # Ensure that we'll be able to download the media helpers.ensure_parent_dir_exists(file) f = open(file, 'wb') else: f = file # The used client will change if FileMigrateError occurs client = self cdn_decrypter = None __log__.info('Downloading file in chunks of %d bytes', part_size) try: offset = 0 while True: try: if cdn_decrypter: result = cdn_decrypter.get_file() else: result = client(GetFileRequest( input_location, offset, part_size )) if isinstance(result, FileCdnRedirect): __log__.info('File lives in a CDN') cdn_decrypter, result = \ CdnDecrypter.prepare_decrypter( client, self._get_cdn_client(result), result ) except FileMigrateError as e: __log__.info('File lives in another DC') client = self._get_exported_client(e.new_dc) continue offset += part_size # If we have received no data (0 bytes), the file is over # So there is nothing left to download and write if not result.bytes: # Return some extra information, unless it's a CDN file return getattr(result, 'type', '') f.write(result.bytes) __log__.debug('Saved %d more bytes', len(result.bytes)) if progress_callback: progress_callback(f.tell(), file_size) finally: if client != self: client.disconnect() if cdn_decrypter: try: cdn_decrypter.client.disconnect() except: pass if isinstance(file, str): f.close() # endregion # endregion # region Small utilities to make users' life easier def get_entity(self, entity): """ Turns the given entity into a valid Telegram user or chat. entity (:obj:`str` | :obj:`int` | :obj:`Peer` | :obj:`InputPeer`): The entity (or iterable of entities) to be transformed. If it's a string which can be converted to an integer or starts with '+' it will be resolved as if it were a phone number. If it doesn't start with '+' or starts with a '@' it will be be resolved from the username. If no exact match is returned, an error will be raised. If the entity is an integer or a Peer, its information will be returned through a call to self.get_input_peer(entity). If the entity is neither, and it's not a TLObject, an error will be raised. Returns: ``User``, ``Chat`` or ``Channel`` corresponding to the input entity. """ if hasattr(entity, '__iter__') and not isinstance(entity, str): single = False else: single = True entity = (entity,) # Group input entities by string (resolve username), # input users (get users), input chat (get chats) and # input channels (get channels) to get the most entities # in the less amount of calls possible. inputs = [ x if isinstance(x, str) else self.get_input_entity(x) for x in entity ] users = [x for x in inputs if isinstance(x, InputPeerUser)] chats = [x.chat_id for x in inputs if isinstance(x, InputPeerChat)] channels = [x for x in inputs if isinstance(x, InputPeerChannel)] if users: # GetUsersRequest has a limit of 200 per call tmp = [] while users: curr, users = users[:200], users[200:] tmp.extend(self(GetUsersRequest(curr))) users = tmp if chats: # TODO Handle chats slice? chats = self(GetChatsRequest(chats)).chats if channels: channels = self(GetChannelsRequest(channels)).chats # Merge users, chats and channels into a single dictionary id_entity = { utils.get_peer_id(x): x for x in itertools.chain(users, chats, channels) } # We could check saved usernames and put them into the users, # chats and channels list from before. While this would reduce # the amount of ResolveUsername calls, it would fail to catch # username changes. result = [ self._get_entity_from_string(x) if isinstance(x, str) else id_entity[utils.get_peer_id(x)] for x in inputs ] return result[0] if single else result def _get_entity_from_string(self, string): """ Gets a full entity from the given string, which may be a phone or an username, and processes all the found entities on the session. The string may also be a user link, or a channel/chat invite link. This method has the side effect of adding the found users to the session database, so it can be queried later without API calls, if this option is enabled on the session. Returns the found entity, or raises TypeError if not found. """ phone = utils.parse_phone(string) if phone: for user in self(GetContactsRequest(0)).users: if user.phone == phone: return user else: string, is_join_chat = utils.parse_username(string) if is_join_chat: invite = self(CheckChatInviteRequest(string)) if isinstance(invite, ChatInvite): # If it's an invite to a chat, the user must join before # for the link to be resolved and work, otherwise raise. if invite.channel: return invite.channel elif isinstance(invite, ChatInviteAlready): return invite.chat else: if string in ('me', 'self'): return self.get_me() result = self(ResolveUsernameRequest(string)) for entity in itertools.chain(result.users, result.chats): if entity.username.lower() == string: return entity raise TypeError( 'Cannot turn "{}" into any entity (user or chat)'.format(string) ) def get_input_entity(self, peer): """ Turns the given peer into its input entity version. Most requests use this kind of InputUser, InputChat and so on, so this is the most suitable call to make for those cases. entity (:obj:`str` | :obj:`int` | :obj:`Peer` | :obj:`InputPeer`): The integer ID of an user or otherwise either of a ``PeerUser``, ``PeerChat`` or ``PeerChannel``, for which to get its ``Input*`` version. If this ``Peer`` hasn't been seen before by the library, the top dialogs will be loaded and their entities saved to the session file (unless this feature was disabled explicitly). If in the end the access hash required for the peer was not found, a ValueError will be raised. Returns: ``InputPeerUser``, ``InputPeerChat`` or ``InputPeerChannel``. """ try: # First try to get the entity from cache, otherwise figure it out return self.session.get_input_entity(peer) except ValueError: pass if isinstance(peer, str): if peer in ('me', 'self'): return InputPeerSelf() return utils.get_input_peer(self._get_entity_from_string(peer)) is_peer = False if isinstance(peer, int): peer = PeerUser(peer) is_peer = True else: try: is_peer = peer.SUBCLASS_OF_ID == 0x2d45687 # crc32(b'Peer') if not is_peer: return utils.get_input_peer(peer) except (AttributeError, TypeError): pass # Attribute if not TLObject, Type if not "casteable" if not is_peer: raise TypeError( 'Cannot turn "{}" into an input entity.'.format(peer) ) # Not found, look in the latest dialogs. # This is useful if for instance someone just sent a message but # the updates didn't specify who, as this person or chat should # be in the latest dialogs. dialogs = self(GetDialogsRequest( offset_date=None, offset_id=0, offset_peer=InputPeerEmpty(), limit=0, exclude_pinned=True )) target = utils.get_peer_id(peer) for entity in itertools.chain(dialogs.users, dialogs.chats): if utils.get_peer_id(entity) == target: return utils.get_input_peer(entity) raise TypeError( 'Could not find the input entity corresponding to "{}".' 'Make sure you have encountered this peer before.'.format(peer) ) # endregion