├── .gitignore ├── requirements.txt ├── LICENSE ├── tweet2json.py ├── README.md ├── tweet2img.py ├── mastodon2html.py └── tweet2html.py /.gitignore: -------------------------------------------------------------------------------- 1 | output 2 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | Pillow==10.4.0 2 | pyperclip==1.9.0 3 | python-dateutil==2.9.0.post0 4 | Requests==2.32.3 5 | selenium==4.23.1 6 | webdriver_manager==4.0.2 7 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2024 Terence Eden 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /tweet2json.py: -------------------------------------------------------------------------------- 1 | # For command line 2 | import argparse 3 | 4 | # File and Bits 5 | import os 6 | import json 7 | 8 | # Etc 9 | import requests 10 | import random 11 | from urllib.parse import urlparse 12 | 13 | def is_valid_url(url): 14 | try: 15 | result = urlparse(url) 16 | return all([result.scheme, result.netloc, result.path]) 17 | except ValueError: 18 | return False 19 | 20 | # Command line options 21 | arguments = argparse.ArgumentParser( 22 | prog='tweet2json', 23 | description='Download the JSON representation of any public Tweet') 24 | arguments.add_argument("id", type=str, help="ID of the Tweet (integer)") 25 | arguments.add_argument("-p", "--pretty", action="store_true", help="Pretty Print the output (default false)", required=False) 26 | 27 | args = arguments.parse_args() 28 | 29 | if (is_valid_url(args.id)): 30 | url_parts = result = urlparse(args.id) 31 | tweet_id = url_parts.path.split("/")[-1] 32 | else : 33 | tweet_id = args.id 34 | 35 | if (tweet_id.isdecimal() is False) : 36 | print( "No valid Tweet ID found." ) 37 | raise SystemExit 38 | 39 | pretty_print = True if args.pretty else False 40 | 41 | # Get the data from the Twitter embed API 42 | for _ in range(5): 43 | # Lazy retry strategy 44 | try : 45 | print( "Downloading data…" ) 46 | token = random.randint(1,10000) 47 | json_url = f"https://cdn.syndication.twimg.com/tweet-result?id={tweet_id}&lang=en&token={token}" 48 | response = requests.get(json_url) 49 | data = response.json() 50 | break 51 | except : 52 | print( "Retrying…" ) 53 | continue 54 | 55 | # If Tweet was deleted, exit. 56 | if "TweetTombstone" == data["__typename"] : 57 | print( "This Post was deleted by the Post author." ) 58 | raise SystemExit 59 | 60 | if (pretty_print) : 61 | twitter_json = json.dumps(data, indent=3) 62 | else : 63 | twitter_json = json.dumps(data) 64 | 65 | # Save directory 66 | output_directory = "output" 67 | os.makedirs(output_directory, exist_ok = True) 68 | save_location = os.path.join( output_directory, f"{tweet_id}.json" ) 69 | 70 | # Save as JSON 71 | with open( save_location, 'w', encoding="utf-8" ) as json_file: 72 | json_file.write( twitter_json ) 73 | print( f"Saved to {save_location}" ) -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Tweet2Embed 2 | 3 | Convert a public Tweet into either: 4 | 5 | * Image & alt text 6 | * Semantic HTML and CSS 7 | 8 | Uses Selenium's Webdriver to launch a Firefox or Chrome instance and takes a screenshot. Uses the Twitter embed API to get a copy of the text and any alt text. An HTML representation is copied to the clipboard. 9 | 10 | ## Features 11 | 12 | * 🗣 Avatars inlined as WebP 13 | * 📸 All attached photos inlined 14 | * 🎥 Video poster inline,