├── requirements.txt
├── README.md
├── docker-compose.yml
├── Dockerfile
├── src
    ├── utils.py
    ├── text.py
    └── bot.py
├── LICENSE
└── .gitignore


/requirements.txt:
--------------------------------------------------------------------------------
1 | setuptools
2 | wheel
3 | pyTelegramBotAPI
4 | requests
5 | hurry.filesize


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # webm2mp4 Telegram bot
2 | 
3 | [This bot](https://t.me/webm2mp4bot) converts .webm and .webp links/files to .mp4 videos and .png images (also sent as a compressed photo) respectively via ffmpeg.
4 | 
5 | ## License
6 | 
7 | MIT
8 | 


--------------------------------------------------------------------------------
/docker-compose.yml:
--------------------------------------------------------------------------------
1 | services:
2 |   webm2mp4bot:
3 |     build: .
4 |     container_name: webm2mp4bot
5 |     environment:
6 |       - TELEGRAM_BOT_TOKEN=
7 |       - FFMPEG_THREADS=2
8 |     restart: always
9 | 


--------------------------------------------------------------------------------
/Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM debian:11
 2 | RUN apt update && apt install -y --no-install-recommends python3 python3-pip ffmpeg
 3 | RUN adduser bot
 4 | 
 5 | COPY src /opt
 6 | COPY requirements.txt /opt
 7 | RUN pip3 install --upgrade -r /opt/requirements.txt
 8 | 
 9 | USER bot
10 | WORKDIR /opt
11 | ENTRYPOINT ["python3", "./bot.py"]
12 | 


--------------------------------------------------------------------------------
/src/utils.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import random
 3 | import string
 4 | 
 5 | from hurry.filesize import alternative, size
 6 | 
 7 | 
 8 | def bytes2human(raw):
 9 |     return size(raw, system=alternative)
10 | 
11 | 
def filesize(filename):
    """Return the size of `filename` in bytes.

    Raises the underlying OSError (e.g. FileNotFoundError) if the file
    cannot be stat'ed.
    """
    file_stat = os.stat(filename)
    size_in_bytes = file_stat.st_size
    return size_in_bytes
14 | 
15 | 
def rm(filename):
    """Best-effort file removal: failures are printed, never raised."""
    try:
        os.remove(filename)
    except Exception as error:
        message = f"Unable to rm {filename}: {error}"
        print(message)
    return None
22 | 
23 | 
def random_string(length=12):
    """Return `length` characters drawn at random from A-Z and 0-9."""
    characters = []
    for _ in range(length):
        characters.append(random.choice(string.ascii_uppercase + string.digits))
    return "".join(characters)
29 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2017 Mike_Went
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/src/text.py:
--------------------------------------------------------------------------------
# User-facing message templates. The bot sends all of them with
# parse_mode="HTML", so the <b>...</b> markup below is Telegram HTML.

# Greeting sent in reply to /start and /help.
start = """Hello! I am WebM to MP4 (H.264) and WebP to PNG converter bot 📺

I can convert:
🎥 <b>webm</b> and other ffmpeg supported video format → mp4
🖼 <b>webp</b> and stickers → png & jpg"""
# NOTE: this name shadows the built-in help() inside this module; it is read
# as `text.help` by the bot, so it cannot be renamed here.
help = "Send me a <b>link</b> (http://...) or a <b>document</b> (including stickers)"
# Status-message texts shown while a conversion is being processed.
starting = "🚀 Starting..."
downloading = "📥 Downloading..."
# "{}" is filled in with the "<output size> / <input size>" progress string.
converting = "☕️ Converting... {}"
generating_thumbnail = "🖼 Generating thumbnail.."
uploading = "☁️ Uploading to Telegram..."
12 | 
class error:
    """Namespace of user-facing error messages.

    The bot sends these strings with parse_mode="HTML", so every tag must be
    well-formed (an unclosed tag makes the whole message invalid HTML).
    """

    # Appended to errors that may be caused by the bot rather than the input.
    contact_hint = "Contact @Mike_Went if you think it's a bot-side error."

    downloading = "⚠️ Unable to download this file. " + contact_hint
    converting = "⚠️ Sorry, <code>ffmpeg</code> seems unable to convert this file. " + contact_hint
    generating_thumbnail = "⚠️ Sorry, <code>ffmpeg</code> seems unable to generate a thumbnail image for this file. " + contact_hint
    # The closing tag must be </b>; the original "<b>does not<b>" never closed it.
    huge_file = "🍉 File is bigger than 50 MB. Telegram <b>does not</b> allow bots to upload huge files, sorry."
    animated_sticker = "🎬 Animated stickers are unsupported yet, submit a <a href='https://github.com/MikeWent/webm2mp4'>pull-request</a> if you implement it!"
21 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | env/
 12 | build/
 13 | develop-eggs/
 14 | dist/
 15 | downloads/
 16 | eggs/
 17 | .eggs/
 18 | lib/
 19 | lib64/
 20 | parts/
 21 | sdist/
 22 | var/
 23 | wheels/
 24 | *.egg-info/
 25 | .installed.cfg
 26 | *.egg
 27 | 
 28 | # PyInstaller
 29 | #  Usually these files are written by a python script from a template
 30 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 31 | *.manifest
 32 | *.spec
 33 | 
 34 | # Installer logs
 35 | pip-log.txt
 36 | pip-delete-this-directory.txt
 37 | 
 38 | # Unit test / coverage reports
 39 | htmlcov/
 40 | .tox/
 41 | .coverage
 42 | .coverage.*
 43 | .cache
 44 | nosetests.xml
 45 | coverage.xml
 46 | *.cover
 47 | .hypothesis/
 48 | 
 49 | # Translations
 50 | *.mo
 51 | *.pot
 52 | 
 53 | # Django stuff:
 54 | *.log
 55 | local_settings.py
 56 | 
 57 | # Flask stuff:
 58 | instance/
 59 | .webassets-cache
 60 | 
 61 | # Scrapy stuff:
 62 | .scrapy
 63 | 
 64 | # Sphinx documentation
 65 | docs/_build/
 66 | 
 67 | # PyBuilder
 68 | target/
 69 | 
 70 | # Jupyter Notebook
 71 | .ipynb_checkpoints
 72 | 
 73 | # pyenv
 74 | .python-version
 75 | 
 76 | # celery beat schedule file
 77 | celerybeat-schedule
 78 | 
 79 | # SageMath parsed files
 80 | *.sage.py
 81 | 
 82 | # dotenv
 83 | .env
 84 | 
 85 | # virtualenv
 86 | .venv
 87 | venv/
 88 | ENV/
 89 | 
 90 | # Spyder project settings
 91 | .spyderproject
 92 | .spyproject
 93 | 
 94 | # Rope project settings
 95 | .ropeproject
 96 | 
 97 | # mkdocs documentation
 98 | /site
 99 | 
100 | # mypy
101 | .mypy_cache/
102 | 
103 | # Bot config
104 | config.json
105 | 
106 | # Generated service file
107 | *.service
108 | 


--------------------------------------------------------------------------------
/src/bot.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python3
  2 | 
  3 | # https://github.com/MikeWent/webm2mp4
  4 | # https://t.me/webm2mp4bot
  5 | 
  6 | import re
  7 | import subprocess
  8 | import threading
  9 | import time
 10 | from os import getenv
 11 | 
 12 | import requests
 13 | import telebot
 14 | 
 15 | import text
 16 | import utils
 17 | 
 18 | MAXIMUM_FILESIZE_ALLOWED = 50 * 1024 * 1024  # ~50 MB
 19 | TEMP_PATH = "/tmp/"
 20 | TELEGRAM_BOT_TOKEN = getenv("TELEGRAM_BOT_TOKEN")
 21 | FFMPEG_THREADS = getenv("FFMPEG_THREADS")
 22 | 
 23 | 
 24 | def convert_worker(target_format, message, url, bot):
 25 |     """Generic process spawned every time user sends a link or a file"""
 26 |     input_filename = "".join([TEMP_PATH, utils.random_string()])
 27 |     output_filename = "".join([TEMP_PATH, utils.random_string(), ".", target_format])
 28 | 
 29 |     # Tell user that we are working
 30 |     status_message = bot.reply_to(message, text.starting, parse_mode="HTML")
 31 | 
 32 |     def update_status_message(new_text):
 33 |         bot.edit_message_text(
 34 |             chat_id=status_message.chat.id,
 35 |             message_id=status_message.message_id,
 36 |             text=new_text,
 37 |             parse_mode="HTML",
 38 |         )
 39 | 
 40 |     # Try to download URL
 41 |     try:
 42 |         r = requests.get(url, stream=True)
 43 |     except:
 44 |         update_status_message(text.error.downloading)
 45 |         return
 46 | 
 47 |     # Check file size
 48 |     if int(r.headers.get("Content-Length", "0")) >= MAXIMUM_FILESIZE_ALLOWED:
 49 |         update_status_message(text.error.huge_file)
 50 |         return
 51 | 
 52 |     # Download the file
 53 |     update_status_message(text.downloading)
 54 |     chunk_size = 4096
 55 |     raw_input_size = 0
 56 |     try:
 57 |         with open(input_filename, "wb") as f:
 58 |             for chunk in r.iter_content(chunk_size=chunk_size):
 59 |                 f.write(chunk)
 60 |                 raw_input_size += chunk_size
 61 |                 # Download files without Content-Length, but apply standard limit to them
 62 |                 if raw_input_size >= MAXIMUM_FILESIZE_ALLOWED:
 63 |                     update_status_message(text.error.huge_file)
 64 |                     utils.rm(input_filename)
 65 |                     return
 66 |     except:
 67 |         update_status_message(text.error.downloading)
 68 |         bot.reply_to(message, f"HTTP {r.status_code}")
 69 |         return
 70 | 
 71 |     # Start ffmpeg
 72 |     ffmpeg_process = None
 73 |     if target_format == "mp4":
 74 |         ffmpeg_process = subprocess.Popen(
 75 |             [
 76 |                 "ffmpeg",
 77 |                 "-v",
 78 |                 "error",
 79 |                 "-threads",
 80 |                 FFMPEG_THREADS,
 81 |                 "-i",
 82 |                 input_filename,
 83 |                 "-map",
 84 |                 "V:0?",  # select video stream
 85 |                 "-map",
 86 |                 "0:a?",  # ignore audio if doesn't exist
 87 |                 "-c:v",
 88 |                 "libx264",  # specify video encoder
 89 |                 "-max_muxing_queue_size",
 90 |                 "9999",  # https://trac.ffmpeg.org/ticket/6375
 91 |                 "-movflags",
 92 |                 "+faststart",  # optimize for streaming
 93 |                 "-preset",
 94 |                 "veryslow",  # https://trac.ffmpeg.org/wiki/Encode/H.264#a2.Chooseapresetandtune
 95 |                 "-timelimit",
 96 |                 "900",  # prevent DoS (exit after 15 min)
 97 |                 "-vf",
 98 |                 "pad=ceil(iw/2)*2:ceil(ih/2)*2",  # https://stackoverflow.com/questions/20847674/ffmpeg-libx264-height-not-divisible-by-2#20848224
 99 |                 output_filename,
100 |             ]
101 |         )
102 |     elif target_format == "png":
103 |         ffmpeg_process = subprocess.Popen(
104 |             [
105 |                 "ffmpeg",
106 |                 "-v",
107 |                 "error",
108 |                 "-threads",
109 |                 FFMPEG_THREADS,
110 |                 "-thread_type",
111 |                 "slice",
112 |                 "-i",
113 |                 input_filename,
114 |                 "-timelimit",
115 |                 "60",  # prevent DoS (exit after 15 min)
116 |                 output_filename,
117 |             ]
118 |         )
119 | 
120 |     # Update progress while ffmpeg is alive
121 |     old_progress = ""
122 |     while ffmpeg_process.poll() == None:
123 |         try:
124 |             raw_output_size = utils.filesize(output_filename)
125 |         except FileNotFoundError:
126 |             raw_output_size = 0
127 | 
128 |         if raw_output_size >= MAXIMUM_FILESIZE_ALLOWED:
129 |             update_status_message(text.error.huge_file)
130 |             ffmpeg_process.kill()
131 |             utils.rm(output_filename)
132 | 
133 |         input_size = utils.bytes2human(raw_input_size)
134 |         output_size = utils.bytes2human(raw_output_size)
135 | 
136 |         progress = f"{output_size} / {input_size}"
137 |         # Update progress only if it changed
138 |         if progress != old_progress:
139 |             update_status_message(text.converting.format(progress))
140 |             old_progress = progress
141 |         time.sleep(2)
142 | 
143 |     # Exit in case of error with ffmpeg
144 |     if ffmpeg_process.returncode != 0:
145 |         update_status_message(text.error.converting)
146 |         # Clean up and close pipe explicitly
147 |         utils.rm(output_filename)
148 |         return
149 | 
150 |     # Check output file size
151 |     output_size = utils.filesize(output_filename)
152 |     if output_size >= MAXIMUM_FILESIZE_ALLOWED:
153 |         update_status_message(text.error.huge_file)
154 |         # Clean up and close pipe explicitly
155 |         utils.rm(output_filename)
156 |         return
157 | 
158 |     # Default params for sending operation
159 |     data = {"chat_id": message.chat.id, "reply_to_message_id": message.message_id}
160 | 
161 |     if target_format == "mp4":
162 |         data.update({"supports_streaming": True})
163 |         # 1. Get video duration in seconds
164 |         video_duration = (
165 |             subprocess.run(
166 |                 [
167 |                     "ffprobe",
168 |                     "-v",
169 |                     "error",
170 |                     "-select_streams",
171 |                     "v:0",
172 |                     "-show_entries",
173 |                     "format=duration",
174 |                     "-of",
175 |                     "default=noprint_wrappers=1:nokey=1",
176 |                     output_filename,
177 |                 ],
178 |                 stdout=subprocess.PIPE,
179 |             )
180 |             .stdout.decode("utf-8")
181 |             .strip()
182 |         )
183 | 
184 |         video_duration = round(float(video_duration))
185 |         data.update({"duration": video_duration})
186 | 
187 |         # 2. Get video height and width
188 |         video_props = (
189 |             subprocess.run(
190 |                 [
191 |                     "ffprobe",
192 |                     "-v",
193 |                     "error",
194 |                     "-select_streams",
195 |                     "v:0",
196 |                     "-show_entries",
197 |                     "stream=width,height",
198 |                     "-of",
199 |                     "csv=s=x:p=0",
200 |                     output_filename,
201 |                 ],
202 |                 stdout=subprocess.PIPE,
203 |             )
204 |             .stdout.decode("utf-8")
205 |             .strip()
206 |         )
207 | 
208 |         video_width, video_height = video_props.split("x")
209 |         data.update({"width": video_width, "height": video_height})
210 | 
211 |         # 3. Take one frame from the middle of the video
212 |         update_status_message(text.generating_thumbnail)
213 |         thumbnail = "".join([TEMP_PATH, utils.random_string(), ".jpg"])
214 |         generate_thumbnail_process = subprocess.Popen(
215 |             [
216 |                 "ffmpeg",
217 |                 "-v",
218 |                 "error",
219 |                 "-i",
220 |                 output_filename,
221 |                 "-vcodec",
222 |                 "mjpeg",
223 |                 "-vframes",
224 |                 "1",
225 |                 "-an",
226 |                 "-f",
227 |                 "rawvideo",
228 |                 "-ss",
229 |                 str(int(video_duration / 2)),
230 |                 # keep the limit of 90px height/width (Telegram API) while preserving the aspect ratio
231 |                 "-vf",
232 |                 "scale='if(gt(iw,ih),90,trunc(oh*a/2)*2)':'if(gt(iw,ih),trunc(ow/a/2)*2,90)'",
233 |                 thumbnail,
234 |             ]
235 |         )
236 | 
237 |         # While process is alive (i.e. is working)
238 |         while generate_thumbnail_process.poll() == None:
239 |             time.sleep(1)
240 | 
241 |         # Exit in case of error with ffmpeg
242 |         if generate_thumbnail_process.returncode != 0:
243 |             update_status_message(text.error.generating_thumbnail)
244 |             return
245 | 
246 |         update_status_message(text.uploading)
247 |         requests.post(
248 |             "https://api.telegram.org/bot{}/sendVideo".format(TELEGRAM_BOT_TOKEN),
249 |             data=data,
250 |             files=[
251 |                 (
252 |                     "video",
253 |                     (
254 |                         utils.random_string() + ".mp4",
255 |                         open(output_filename, "rb"),
256 |                         "video/mp4",
257 |                     ),
258 |                 ),
259 |                 (
260 |                     "thumb",
261 |                     (
262 |                         utils.random_string() + ".jpg",
263 |                         open(thumbnail, "rb"),
264 |                         "image/jpeg",
265 |                     ),
266 |                 ),
267 |             ],
268 |         )
269 |         utils.rm(input_filename)
270 |         utils.rm(output_filename)
271 |         utils.rm(thumbnail)
272 | 
273 |     elif target_format == "png":
274 |         # Upload to Telegram
275 |         update_status_message(text.uploading)
276 |         requests.post(
277 |             "https://api.telegram.org/bot{}/sendPhoto".format(TELEGRAM_BOT_TOKEN),
278 |             data=data,
279 |             files=[
280 |                 (
281 |                     "photo",
282 |                     (
283 |                         utils.random_string() + ".png",
284 |                         open(output_filename, "rb"),
285 |                         "image/png",
286 |                     ),
287 |                 )
288 |             ],
289 |         )
290 |         requests.post(
291 |             "https://api.telegram.org/bot{}/sendDocument".format(TELEGRAM_BOT_TOKEN),
292 |             data=data,
293 |             files=[
294 |                 (
295 |                     "document",
296 |                     (
297 |                         utils.random_string() + ".png",
298 |                         open(output_filename, "rb"),
299 |                         "image/png",
300 |                     ),
301 |                 )
302 |             ],
303 |         )
304 |         utils.rm(input_filename)
305 |         utils.rm(output_filename)
306 | 
307 |     bot.delete_message(message.chat.id, status_message.message_id)
308 | 
309 | 
# Shared bot instance: the handlers below are registered on it via
# @bot.message_handler and it is the object that is polled at the end of the file.
bot = telebot.TeleBot(TELEGRAM_BOT_TOKEN)
311 | 
312 | 
@bot.message_handler(commands=["start", "help"])
def start_help(message):
    """Reply to /start and /help with the greeting and the usage hint.

    The bot only works in private chats: in any other chat type it tries to
    leave the chat and sends nothing.
    """
    if message.chat.type != "private":
        # Leaving is best-effort, but only ordinary errors are ignored;
        # KeyboardInterrupt / SystemExit must still propagate.
        try:
            bot.leave_chat(message.chat.id)
        except Exception:
            pass
        return

    bot.send_message(message.chat.id, text.start, parse_mode="HTML")
    bot.send_message(message.chat.id, text.help, parse_mode="HTML")
324 | 
325 | 
# Handle URLs
# Group 1 is the whole link, group 2 its extension.
# - "https?" accepts only http:// and https:// (the former "http.?" accepted
#   any character after "http").
# - "\S+" keeps a match inside one whitespace-delimited token, so a message
#   containing several links or trailing text yields the first link only
#   (the former ".*" ran on to the last extension in the message).
URL_REGEXP = r"(https?:\/\/\S+\.(webm|webp|mp4))"
328 | 
329 | 
@bot.message_handler(regexp=URL_REGEXP)
def handle_urls(message):
    """Convert the first supported link (.webm / .webp / .mp4) in a text message.

    The bot only works in private chats: in any other chat type it tries to
    leave the chat and does nothing else. The conversion runs in its own
    thread so this handler returns immediately.
    """
    if message.chat.type != "private":
        # Best-effort leave; only ordinary errors are ignored.
        try:
            bot.leave_chat(message.chat.id)
        except Exception:
            pass
        return

    # Get first url in message. telebot applies the `regexp` filter
    # case-insensitively, so the same flag is needed here; without it an
    # upper-case link passes the filter but yields no match.
    match = re.search(URL_REGEXP, message.text, re.IGNORECASE)
    if match is None:
        return
    url = match.group(1)
    extension = match.group(2).lower()
    target_format = "png" if extension == "webp" else "mp4"

    # start() runs the worker in a new thread; run() would execute it
    # synchronously in the calling thread. Note that the number of concurrent
    # conversions is then no longer bounded by the bot's own worker threads.
    threading.Thread(
        target=convert_worker,
        kwargs={
            "target_format": target_format,
            "message": message,
            "url": url,
            "bot": bot,
        },
    ).start()
357 | 
358 | 
359 | # Handle files
@bot.message_handler(content_types=["document", "video", "sticker"])
def handle_files(message):
    """Convert a document, video or (non-animated) sticker sent to the bot.

    The bot only works in private chats: in any other chat type it tries to
    leave the chat and does nothing else. Animated stickers are rejected with
    an explanatory reply. The conversion runs in its own thread so this
    handler returns immediately.
    """
    if message.chat.type != "private":
        # Best-effort leave; only ordinary errors are ignored.
        try:
            bot.leave_chat(message.chat.id)
        except Exception:
            pass
        return

    # Get file id (a later attachment kind takes precedence over an earlier one)
    target = None
    if message.document:
        target = message.document.file_id
    if message.video:
        target = message.video.file_id
    if message.sticker:
        # Ignore animated stickers
        if message.sticker.is_animated:
            bot.reply_to(message, text.error.animated_sticker, parse_mode="HTML")
            return
        target = message.sticker.file_id

    if target is None:
        return

    # Resolving the file path is an API call that can fail; tell the user
    # instead of letting the exception escape the handler.
    try:
        file_path = bot.get_file(target).file_path
    except Exception:
        bot.reply_to(message, text.error.downloading, parse_mode="HTML")
        return

    url = "https://api.telegram.org/file/bot{0}/{1}".format(
        TELEGRAM_BOT_TOKEN, file_path
    )
    target_format = "png" if url.lower().endswith("webp") else "mp4"

    # start() runs the worker in a new thread; run() would execute it
    # synchronously in the calling thread. Note that the number of concurrent
    # conversions is then no longer bounded by the bot's own worker threads.
    threading.Thread(
        target=convert_worker,
        kwargs={
            "target_format": target_format,
            "message": message,
            "url": url,
            "bot": bot,
        },
    ).start()
399 | 
400 | 
# Start long polling only when executed as a script (as the Dockerfile
# ENTRYPOINT does), so importing this module does not block on polling.
if __name__ == "__main__":
    bot.polling(none_stop=True)
402 | 


--------------------------------------------------------------------------------