You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

219 lines
7.8 KiB

4 years ago
4 years ago
4 years ago
  1. # Copyright (c) 2020 Tulir Asokan
  2. #
  3. # This Source Code Form is subject to the terms of the Mozilla Public
  4. # License, v. 2.0. If a copy of the MPL was not distributed with this
  5. # file, You can obtain one at http://mozilla.org/MPL/2.0/.
from typing import Dict, Tuple, TypedDict
from io import BytesIO
import argparse
import os.path
import asyncio
import json
import re

from aiohttp import ClientSession
from yarl import URL
from PIL import Image

from telethon import TelegramClient
from telethon.tl.functions.messages import GetAllStickersRequest, GetStickerSetRequest
from telethon.tl.types.messages import AllStickers
from telethon.tl.types import InputStickerSetShortName, Document
from telethon.tl.types.messages import StickerSet as StickerSetFull
  21. parser = argparse.ArgumentParser()
  22. parser.add_argument("--list", help="List your saved sticker packs", action="store_true")
  23. parser.add_argument("--session", help="Telethon session file name", default="sticker-import")
  24. parser.add_argument("--config", help="Path to JSON file with Matrix homeserver and access_token",
  25. type=str, default="config.json")
  26. parser.add_argument("--output-dir", help="Directory to write packs to", default="web/packs/",
  27. type=str)
  28. parser.add_argument("pack", help="Sticker pack URLs to import", action="append", nargs="*")
  29. args = parser.parse_args()
  30. async def whoami(url: URL, access_token: str) -> str:
  31. headers = {"Authorization": f"Bearer {access_token}"}
  32. async with ClientSession() as sess, sess.get(url, headers=headers) as resp:
  33. resp.raise_for_status()
  34. user_id = (await resp.json())["user_id"]
  35. print(f"Access token validated (user ID: {user_id})")
  36. return user_id
  37. try:
  38. with open(args.config) as config_file:
  39. config = json.load(config_file)
  40. homeserver_url = config["homeserver"]
  41. access_token = config["access_token"]
  42. except FileNotFoundError:
  43. print("Matrix config file not found. Please enter your homeserver and access token.")
  44. homeserver_url = input("Homeserver URL: ")
  45. access_token = input("Access token: ")
  46. whoami_url = URL(homeserver_url) / "_matrix" / "client" / "r0" / "account" / "whoami"
  47. user_id = asyncio.run(whoami(whoami_url, access_token))
  48. with open(args.config, "w") as config_file:
  49. json.dump({
  50. "homeserver": homeserver_url,
  51. "user_id": user_id,
  52. "access_token": access_token
  53. }, config_file)
  54. print(f"Wrote config to {args.config}")
  55. upload_url = URL(homeserver_url) / "_matrix" / "media" / "r0" / "upload"
  56. async def upload(data: bytes, mimetype: str, filename: str) -> str:
  57. url = upload_url.with_query({"filename": filename})
  58. headers = {"Content-Type": mimetype, "Authorization": f"Bearer {access_token}"}
  59. async with ClientSession() as sess, sess.post(url, data=data, headers=headers) as resp:
  60. return (await resp.json())["content_uri"]
  61. class MatrixMediaInfo(TypedDict):
  62. w: int
  63. h: int
  64. size: int
  65. mimetype: str
  66. class MatrixStickerInfo(TypedDict, total=False):
  67. body: str
  68. url: str
  69. info: MatrixMediaInfo
  70. def convert_image(data: bytes) -> (bytes, int, int):
  71. image: Image.Image = Image.open(BytesIO(data)).convert("RGBA")
  72. image.thumbnail((256, 256), Image.ANTIALIAS)
  73. new_file = BytesIO()
  74. image.save(new_file, "png")
  75. w, h = image.size
  76. return new_file.getvalue(), w, h
  77. async def reupload_document(client: TelegramClient, document: Document) -> MatrixStickerInfo:
  78. print(f"Reuploading {document.id}", end="", flush=True)
  79. data = await client.download_media(document, file=bytes)
  80. print(".", end="", flush=True)
  81. data, width, height = convert_image(data)
  82. print(".", end="", flush=True)
  83. mxc = await upload(data, "image/png", f"{document.id}.png")
  84. print(".", flush=True)
  85. return {
  86. "body": "",
  87. "url": mxc,
  88. "info": {
  89. "w": width,
  90. "h": height,
  91. "size": len(data),
  92. "mimetype": "image/png",
  93. },
  94. }
  95. def add_to_index(name: str) -> None:
  96. index_path = os.path.join(args.output_dir, "index.json")
  97. try:
  98. with open(index_path) as index_file:
  99. index_data = json.load(index_file)
  100. except (FileNotFoundError, json.JSONDecodeError):
  101. index_data = {"packs": [], "homeserver_url": homeserver_url}
  102. if name not in index_data["packs"]:
  103. index_data["packs"].append(name)
  104. with open(index_path, "w") as index_file:
  105. json.dump(index_data, index_file, indent=" ")
  106. print(f"Added {name} to {index_path}")
  107. async def reupload_pack(client: TelegramClient, pack: StickerSetFull) -> None:
  108. if pack.set.animated:
  109. print("Animated stickerpacks are currently not supported")
  110. return
  111. pack_path = os.path.join(args.output_dir, f"{pack.set.short_name}.json")
  112. try:
  113. os.mkdir(os.path.dirname(pack_path))
  114. except FileExistsError:
  115. pass
  116. print(f"Reuploading {pack.set.title} with {pack.set.count} stickers "
  117. f"and writing output to {pack_path}")
  118. already_uploaded = {}
  119. try:
  120. with open(pack_path) as pack_file:
  121. existing_pack = json.load(pack_file)
  122. already_uploaded = {sticker["net.maunium.telegram.sticker"]["id"]: sticker
  123. for sticker in existing_pack["stickers"]}
  124. print(f"Found {len(already_uploaded)} already reuploaded stickers")
  125. except FileNotFoundError:
  126. pass
  127. reuploaded_documents: Dict[int, MatrixStickerInfo] = {}
  128. for document in pack.documents:
  129. try:
  130. reuploaded_documents[document.id] = already_uploaded[document.id]
  131. print(f"Skipped reuploading {document.id}")
  132. except KeyError:
  133. reuploaded_documents[document.id] = await reupload_document(client, document)
  134. for sticker in pack.packs:
  135. for document_id in sticker.documents:
  136. doc = reuploaded_documents[document_id]
  137. doc["body"] = sticker.emoticon
  138. doc["net.maunium.telegram.sticker"] = {
  139. "pack": {
  140. "id": pack.set.id,
  141. "short_name": pack.set.short_name,
  142. },
  143. "id": document_id,
  144. "emoticon": sticker.emoticon,
  145. }
  146. with open(pack_path, "w") as pack_file:
  147. json.dump({
  148. "title": pack.set.title,
  149. "short_name": pack.set.short_name,
  150. "id": pack.set.id,
  151. "hash": pack.set.hash,
  152. "stickers": list(reuploaded_documents.values()),
  153. }, pack_file, ensure_ascii=False)
  154. print(f"Saved {pack.set.title} as {pack.set.short_name}.json")
  155. add_to_index(os.path.basename(pack_path))
  156. pack_url_regex = re.compile(r"^(?:(?:https?://)?(?:t|telegram)\.(?:me|dog)/addstickers/)?"
  157. r"([A-Za-z0-9-_]+)"
  158. r"(?:\.json)?$")
  159. async def main():
  160. client = TelegramClient(args.session, 298751, "cb676d6bae20553c9996996a8f52b4d7")
  161. await client.start()
  162. if args.list:
  163. stickers: AllStickers = await client(GetAllStickersRequest(hash=0))
  164. index = 1
  165. width = len(str(stickers.sets))
  166. print("Your saved sticker packs:")
  167. for saved_pack in stickers.sets:
  168. print(f"{index:>{width}}. {saved_pack.title} "
  169. f"(t.me/addstickers/{saved_pack.short_name})")
  170. elif args.pack[0]:
  171. input_packs = []
  172. for pack_url in args.pack[0]:
  173. match = pack_url_regex.match(pack_url)
  174. if not match:
  175. print(f"'{pack_url}' doesn't look like a sticker pack URL")
  176. return
  177. input_packs.append(InputStickerSetShortName(short_name=match.group(1)))
  178. for input_pack in input_packs:
  179. pack: StickerSetFull = await client(GetStickerSetRequest(input_pack))
  180. await reupload_pack(client, pack)
  181. else:
  182. parser.print_help()
  183. asyncio.run(main())