2021-07-21 23:36:05 +02:00
from flask import Flask , render_template , request , redirect , Response
2021-07-04 01:52:30 +02:00
import youtube_dl
2021-07-12 22:48:21 +02:00
import textwrap
2021-07-12 10:49:07 +02:00
import twitter
import pymongo
2021-07-04 11:40:22 +02:00
import json
2021-07-04 03:41:47 +02:00
import re
2021-07-11 22:48:17 +02:00
import os
2021-08-03 03:52:13 +02:00
import urllib . parse
2021-07-04 01:52:30 +02:00
app = Flask ( __name__ )
2021-10-01 23:59:20 +02:00
pathregex = re . compile ( " \\ w { 1,15} \\ /(status|statuses) \\ / \\ d { 2,20} " )
2021-12-03 01:58:36 +01:00
generate_embed_user_agents = [ " Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots) " , " Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:38.0) Gecko/20100101 Firefox/38.0 " , " Mozilla/5.0 (compatible; Discordbot/2.0; +https://discordapp.com) " , " TelegramBot (like TwitterBot) " , " Mozilla/5.0 (compatible; January/1.0; +https://gitlab.insrt.uk/revolt/january) " , " test " ]
2021-07-04 01:52:30 +02:00
2021-07-13 19:18:50 +02:00
# Read config from config.json. If it does not exist, create new.
2021-07-11 22:48:17 +02:00
if not os . path . exists ( " config.json " ) :
with open ( " config.json " , " w " ) as outfile :
2021-07-14 10:33:46 +02:00
default_config = { " config " : { " link_cache " : " json " , " database " : " [url to mongo database goes here] " , " method " : " youtube-dl " , " color " : " #43B581 " , " appname " : " TwitFix " , " repo " : " https://github.com/robinuniverse/twitfix " , " url " : " https://fxtwitter.com " } , " api " : { " api_key " : " [api_key goes here] " , " api_secret " : " [api_secret goes here] " , " access_token " : " [access_token goes here] " , " access_secret " : " [access_secret goes here] " } }
2021-07-13 19:18:50 +02:00
json . dump ( default_config , outfile , indent = 4 , sort_keys = True )
2021-07-11 22:48:17 +02:00
2021-07-13 19:18:50 +02:00
config = default_config
else :
f = open ( " config.json " )
config = json . load ( f )
f . close ( )
2021-07-11 22:48:17 +02:00
2021-07-13 20:57:09 +02:00
# If method is set to API or Hybrid, attempt to auth with the Twitter API
2021-07-12 21:49:29 +02:00
if config [ ' config ' ] [ ' method ' ] in ( ' api ' , ' hybrid ' ) :
2021-07-12 10:49:07 +02:00
auth = twitter . oauth . OAuth ( config [ ' api ' ] [ ' access_token ' ] , config [ ' api ' ] [ ' access_secret ' ] , config [ ' api ' ] [ ' api_key ' ] , config [ ' api ' ] [ ' api_secret ' ] )
twitter_api = twitter . Twitter ( auth = auth )
link_cache_system = config [ ' config ' ] [ ' link_cache ' ]
2021-07-08 05:17:23 +02:00
if link_cache_system == " json " :
link_cache = { }
2021-07-11 22:48:17 +02:00
if not os . path . exists ( " config.json " ) :
with open ( " config.json " , " w " ) as outfile :
2021-07-13 19:18:50 +02:00
default_link_cache = { " test " : " test " }
json . dump ( default_link_cache , outfile , indent = 4 , sort_keys = True )
2021-07-11 22:48:17 +02:00
2021-07-08 05:17:23 +02:00
f = open ( ' links.json ' , )
link_cache = json . load ( f )
f . close ( )
elif link_cache_system == " db " :
2021-07-11 22:48:17 +02:00
client = pymongo . MongoClient ( config [ ' config ' ] [ ' database ' ] , connect = False )
2021-07-08 05:17:23 +02:00
db = client . TwitFix
2021-07-04 11:40:22 +02:00
2021-12-03 01:58:36 +01:00
@app.route ( ' /latest/ ' ) # Try to return the latest video
def latest ( ) :
vnf = db . linkCache . find_one ( sort = [ ( ' _id ' , pymongo . DESCENDING ) ] )
desc = re . sub ( r ' http.*t \ .co \ S+ ' , ' ' , vnf [ ' description ' ] )
urlUser = urllib . parse . quote ( vnf [ ' uploader ' ] )
urlDesc = urllib . parse . quote ( desc )
urlLink = urllib . parse . quote ( vnf [ ' url ' ] )
print ( " [ ✔ ] Latest video page loaded: " + vnf [ ' tweet ' ] )
return render_template ( ' inline.html ' , vidlink = vnf [ ' url ' ] , vidurl = vnf [ ' url ' ] , desc = desc , pic = vnf [ ' thumbnail ' ] , user = vnf [ ' uploader ' ] , video_link = vnf [ ' url ' ] , color = config [ ' config ' ] [ ' color ' ] , appname = config [ ' config ' ] [ ' appname ' ] , repo = config [ ' config ' ] [ ' repo ' ] , url = config [ ' config ' ] [ ' url ' ] , urlDesc = urlDesc , urlUser = urlUser , urlLink = urlLink , tweet = vnf [ ' tweet ' ] )
2021-07-14 10:33:46 +02:00
@app.route ( ' / ' ) # If the useragent is discord, return the embed, if not, redirect to configured repo directly
2021-07-06 05:30:16 +02:00
def default ( ) :
2021-07-14 10:33:46 +02:00
user_agent = request . headers . get ( ' user-agent ' )
2021-08-03 03:52:13 +02:00
if user_agent in generate_embed_user_agents :
2021-07-14 10:33:46 +02:00
return message ( " TwitFix is an attempt to fix twitter video embeds in discord! created by Robin Universe :) \n \n 💖 \n \n Click me to be redirected to the repo! " )
else :
return redirect ( config [ ' config ' ] [ ' repo ' ] , 301 )
2021-07-06 05:30:16 +02:00
2021-07-09 12:32:04 +02:00
@app.route ( ' /oembed.json ' )
def oembedend ( ) :
desc = request . args . get ( " desc " , None )
user = request . args . get ( " user " , None )
link = request . args . get ( " link " , None )
2021-07-13 19:18:50 +02:00
return o_embed_gen ( desc , user , link )
2021-07-09 12:32:04 +02:00
2021-07-13 20:57:09 +02:00
@app.route ( ' /<path:sub_path> ' )
2021-07-13 19:18:50 +02:00
def twitfix ( sub_path ) :
2021-07-13 02:45:30 +02:00
user_agent = request . headers . get ( ' user-agent ' )
2021-07-13 19:18:50 +02:00
match = pathregex . search ( sub_path )
2021-10-01 23:59:20 +02:00
if sub_path . endswith ( " .mp4 " ) :
return dir ( sub_path . replace ( " .mp4 " , " " ) )
2021-07-13 08:32:25 +02:00
if match is not None :
2021-07-13 19:18:50 +02:00
twitter_url = sub_path
2021-07-04 03:41:47 +02:00
2021-07-13 08:32:25 +02:00
if match . start ( ) == 0 :
2021-07-13 19:18:50 +02:00
twitter_url = " https://twitter.com/ " + sub_path
2021-07-04 03:41:47 +02:00
2021-08-03 03:52:13 +02:00
if user_agent in generate_embed_user_agents :
2021-07-16 22:25:43 +02:00
res = embed_video ( twitter_url )
return res
2021-08-03 03:52:13 +02:00
2021-07-13 02:45:30 +02:00
else :
2021-12-03 01:58:36 +01:00
print ( " [ R ] Redirect to " + twitter_url )
2021-07-13 08:32:25 +02:00
return redirect ( twitter_url , 301 )
2021-07-04 01:52:30 +02:00
else :
2021-07-21 23:36:05 +02:00
return message ( " This doesn ' t appear to be a twitter URL " )
2021-07-04 01:52:30 +02:00
2021-07-14 10:33:46 +02:00
@app.route ( ' /other/<path:sub_path> ' ) # Show all info that Youtube-DL can get about a video as a json
2021-07-13 19:18:50 +02:00
def other ( sub_path ) :
2021-12-03 03:14:01 +01:00
otherurl = request . url . split ( " /other/ " , 1 ) [ 1 ] . replace ( " :/ " , " :// " )
print ( " [ OTHER ] Other URL embed attempted: " + otherurl )
res = embed_video ( otherurl )
2021-07-05 18:02:17 +02:00
return res
2021-07-14 10:33:46 +02:00
@app.route ( ' /info/<path:sub_path> ' ) # Show all info that Youtube-DL can get about a video as a json
2021-07-13 19:18:50 +02:00
def info ( sub_path ) :
2021-12-03 03:14:01 +01:00
infourl = request . url . split ( " /info/ " , 1 ) [ 1 ] . replace ( " :/ " , " :// " )
print ( " [ INFO ] Info data requested: " + infourl )
2021-07-04 23:54:23 +02:00
with youtube_dl . YoutubeDL ( { ' outtmpl ' : ' %(id)s . %(ext)s ' } ) as ydl :
2021-12-03 03:14:01 +01:00
result = ydl . extract_info ( infourl , download = False )
2021-07-04 01:52:30 +02:00
return result
2021-07-21 23:36:05 +02:00
@app.route ( ' /dir/<path:sub_path> ' )
def dir ( sub_path ) :
user_agent = request . headers . get ( ' user-agent ' )
url = sub_path
match = pathregex . search ( url )
if match is not None :
twitter_url = url
if match . start ( ) == 0 :
twitter_url = " https://twitter.com/ " + url
2021-08-03 03:52:13 +02:00
if user_agent in generate_embed_user_agents :
2021-10-01 23:59:20 +02:00
res = embed_video ( twitter_url )
2021-07-21 23:36:05 +02:00
return res
2021-08-03 03:52:13 +02:00
2021-07-21 23:36:05 +02:00
else :
2021-12-03 01:58:36 +01:00
print ( " [ R ] Redirect to direct MP4 URL " )
2021-07-21 23:36:05 +02:00
return direct_video ( twitter_url )
else :
return redirect ( url , 301 )
def direct_video ( video_link ) : # Just get a redirect to a MP4 link from any tweet link
cached_vnf = get_vnf_from_link_cache ( video_link )
if cached_vnf == None :
try :
vnf = link_to_vnf ( video_link )
add_vnf_to_link_cache ( video_link , vnf )
return redirect ( vnf [ ' url ' ] , 301 )
2021-12-03 01:58:36 +01:00
print ( " [ D ] Redirecting to direct URL: " + vnf [ ' url ' ] )
2021-07-21 23:36:05 +02:00
except Exception as e :
print ( e )
return message ( " Failed to scan your link! " )
else :
return redirect ( cached_vnf [ ' url ' ] , 301 )
2021-12-03 01:58:36 +01:00
print ( " [ D ] Redirecting to direct URL: " + vnf [ ' url ' ] )
2021-07-21 23:36:05 +02:00
def embed_video ( video_link ) : # Return Embed from any tweet link
2021-07-13 19:19:24 +02:00
cached_vnf = get_vnf_from_link_cache ( video_link )
2021-07-08 05:17:23 +02:00
2021-07-12 10:49:07 +02:00
if cached_vnf == None :
2021-07-08 05:17:23 +02:00
try :
2021-07-13 19:19:24 +02:00
vnf = link_to_vnf ( video_link )
add_vnf_to_link_cache ( video_link , vnf )
return embed ( video_link , vnf )
2021-07-21 23:36:05 +02:00
2021-07-12 10:49:07 +02:00
except Exception as e :
print ( e )
2021-07-14 10:33:46 +02:00
return message ( " Failed to scan your link! " )
2021-07-12 10:49:07 +02:00
else :
2021-07-13 19:19:24 +02:00
return embed ( video_link , cached_vnf )
2021-07-05 18:02:17 +02:00
2021-07-13 19:18:50 +02:00
def video_info ( url , tweet = " " , desc = " " , thumb = " " , uploader = " " ) : # Return a dict of video info with default values
2021-07-05 18:02:17 +02:00
vnf = {
2021-07-08 05:17:23 +02:00
" tweet " : tweet ,
2021-07-05 18:02:17 +02:00
" url " : url ,
" description " : desc ,
" thumbnail " : thumb ,
" uploader " : uploader
}
return vnf
2021-07-13 19:19:24 +02:00
def link_to_vnf_from_api ( video_link ) :
2021-12-03 01:58:36 +01:00
print ( " [ + ] Attempting to download tweet info from Twitter API " )
2021-07-13 19:19:24 +02:00
twid = int ( re . sub ( r ' \ ?.*$ ' , ' ' , video_link . rsplit ( " / " , 1 ) [ - 1 ] ) ) # gets the tweet ID as a int from the passed url
2021-07-12 20:49:19 +02:00
tweet = twitter_api . statuses . show ( _id = twid , tweet_mode = " extended " )
2021-07-15 02:15:06 +02:00
# Check to see if tweet has a video, if not, make the url passed to the VNF the first t.co link in the tweet
if ' extended_entities ' in tweet :
if ' video_info ' in tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] :
if tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] [ ' video_info ' ] [ ' variants ' ] [ - 1 ] [ ' content_type ' ] == " video/mp4 " :
url = tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] [ ' video_info ' ] [ ' variants ' ] [ - 1 ] [ ' url ' ]
thumb = tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] [ ' media_url ' ]
else :
url = tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] [ ' video_info ' ] [ ' variants ' ] [ - 2 ] [ ' url ' ]
thumb = tweet [ ' extended_entities ' ] [ ' media ' ] [ 0 ] [ ' media_url ' ]
else :
url = re . findall ( r ' (https?://[^ \ s]+) ' , tweet [ ' full_text ' ] ) [ 0 ]
thumb = " Non video link with url "
2021-12-03 01:58:36 +01:00
print ( " [ NV ] Non video tweet, but has a link: " + url )
2021-07-12 20:49:19 +02:00
else :
2021-07-15 02:15:06 +02:00
url = re . findall ( r ' (https?://[^ \ s]+) ' , tweet [ ' full_text ' ] ) [ 0 ]
thumb = " Non video link with url "
2021-12-03 01:58:36 +01:00
print ( " [ NV ] Non video tweet, but has a link: " + url )
2021-07-12 23:41:07 +02:00
if len ( tweet [ ' full_text ' ] ) > 200 :
text = textwrap . shorten ( tweet [ ' full_text ' ] , width = 200 , placeholder = " ... " )
else :
text = tweet [ ' full_text ' ]
2021-07-15 02:15:06 +02:00
vnf = video_info ( url , video_link , text , thumb , tweet [ ' user ' ] [ ' name ' ] )
2021-07-12 20:49:19 +02:00
return vnf
2021-07-13 19:19:24 +02:00
def link_to_vnf_from_youtubedl ( video_link ) :
2021-07-12 20:49:19 +02:00
print ( " Attempting to download tweet info via YoutubeDL " )
with youtube_dl . YoutubeDL ( { ' outtmpl ' : ' %(id)s . %(ext)s ' } ) as ydl :
2021-07-13 19:19:24 +02:00
result = ydl . extract_info ( video_link , download = False )
vnf = video_info ( result [ ' url ' ] , video_link , result [ ' description ' ] . rsplit ( ' ' , 1 ) [ 0 ] , result [ ' thumbnail ' ] , result [ ' uploader ' ] )
2021-07-12 10:49:07 +02:00
return vnf
2021-07-12 20:49:19 +02:00
2021-07-13 19:19:24 +02:00
def link_to_vnf ( video_link ) : # Return a VideoInfo object or die trying
2021-07-12 20:49:19 +02:00
if config [ ' config ' ] [ ' method ' ] == ' hybrid ' :
try :
2021-07-13 19:19:24 +02:00
return link_to_vnf_from_api ( video_link )
2021-07-12 21:49:29 +02:00
except Exception as e :
2021-07-12 20:49:19 +02:00
print ( " API Failed " )
2021-07-12 21:49:29 +02:00
print ( e )
2021-07-13 19:19:24 +02:00
return link_to_vnf_from_youtubedl ( video_link )
2021-07-12 20:49:19 +02:00
elif config [ ' config ' ] [ ' method ' ] == ' api ' :
try :
2021-07-13 19:19:24 +02:00
return link_to_vnf_from_api ( video_link )
2021-07-12 20:49:19 +02:00
except Exception as e :
2021-12-03 01:58:36 +01:00
print ( " [ X ] API Failed " )
2021-07-12 20:49:19 +02:00
print ( e )
return None
elif config [ ' config ' ] [ ' method ' ] == ' youtube-dl ' :
try :
2021-07-13 19:19:24 +02:00
return link_to_vnf_from_youtubedl ( video_link )
2021-07-12 20:49:19 +02:00
except Exception as e :
2021-12-03 01:58:36 +01:00
print ( " [ X ] Youtube-DL Failed " )
2021-07-12 20:49:19 +02:00
print ( e )
return None
else :
print ( " Please set the method key in your config file to ' api ' ' youtube-dl ' or ' hybrid ' " )
return None
2021-07-13 19:18:50 +02:00
def get_vnf_from_link_cache ( video_link ) :
2021-07-12 10:49:07 +02:00
if link_cache_system == " db " :
collection = db . linkCache
2021-07-13 19:18:50 +02:00
vnf = collection . find_one ( { ' tweet ' : video_link } )
2021-12-03 01:58:36 +01:00
if vnf != None :
print ( " [ ✔ ] Link located in DB cache " )
2021-07-12 10:49:07 +02:00
return vnf
else :
2021-12-03 01:58:36 +01:00
print ( " [ X ] Link not in DB cache " )
2021-07-12 10:49:07 +02:00
return None
elif link_cache_system == " json " :
2021-07-13 19:18:50 +02:00
if video_link in link_cache :
2021-07-12 10:49:07 +02:00
print ( " Link located in json cache " )
2021-07-13 19:18:50 +02:00
vnf = link_cache [ video_link ]
2021-07-12 10:49:07 +02:00
return vnf
else :
2021-12-03 01:58:36 +01:00
print ( " [ X ] Link not in json cache " )
2021-07-12 10:49:07 +02:00
return None
2021-07-13 19:18:50 +02:00
def add_vnf_to_link_cache ( video_link , vnf ) :
2021-07-12 10:49:07 +02:00
if link_cache_system == " db " :
try :
out = db . linkCache . insert_one ( vnf )
2021-12-03 01:58:36 +01:00
print ( " [ + ] Link added to DB cache " )
2021-07-12 10:49:07 +02:00
return True
except Exception :
2021-12-03 01:58:36 +01:00
print ( " [ X ] Failed to add link to DB cache " )
2021-07-12 10:49:07 +02:00
return None
elif link_cache_system == " json " :
2021-07-13 19:18:50 +02:00
link_cache [ video_link ] = vnf
2021-12-03 01:58:36 +01:00
with open ( " links.json " , " w " ) as outfile :
2021-07-12 10:49:07 +02:00
json . dump ( link_cache , outfile , indent = 4 , sort_keys = True )
return None
2021-07-14 10:33:46 +02:00
def message ( text ) :
return render_template ( ' default.html ' , message = text , color = config [ ' config ' ] [ ' color ' ] , appname = config [ ' config ' ] [ ' appname ' ] , repo = config [ ' config ' ] [ ' repo ' ] , url = config [ ' config ' ] [ ' url ' ] )
2021-07-13 19:19:24 +02:00
def embed ( video_link , vnf ) :
2021-12-03 01:58:36 +01:00
print ( " [ E ] Embedding " + vnf [ ' url ' ] )
2021-07-15 02:15:06 +02:00
if vnf [ ' url ' ] . startswith ( ' https://t.co ' ) is not True :
2021-08-03 03:52:13 +02:00
desc = re . sub ( r ' http.*t \ .co \ S+ ' , ' ' , vnf [ ' description ' ] )
urlUser = urllib . parse . quote ( vnf [ ' uploader ' ] )
urlDesc = urllib . parse . quote ( desc )
urlLink = urllib . parse . quote ( video_link )
2021-12-03 01:58:36 +01:00
return render_template ( ' index.html ' , vidlink = vnf [ ' url ' ] , vidurl = vnf [ ' url ' ] , desc = desc , pic = vnf [ ' thumbnail ' ] , user = vnf [ ' uploader ' ] , video_link = video_link , color = config [ ' config ' ] [ ' color ' ] , appname = config [ ' config ' ] [ ' appname ' ] , repo = config [ ' config ' ] [ ' repo ' ] , url = config [ ' config ' ] [ ' url ' ] , urlDesc = urlDesc , urlUser = urlUser , urlLink = urlLink )
2021-07-15 02:15:06 +02:00
else :
return redirect ( vnf [ ' url ' ] , 301 )
2021-07-12 10:49:07 +02:00
2021-07-13 19:19:24 +02:00
def o_embed_gen ( description , user , video_link ) :
2021-07-09 12:32:04 +02:00
out = {
" type " : " video " ,
" version " : " 1.0 " ,
" provider_name " : " TwitFix " ,
" provider_url " : " https://github.com/robinuniverse/twitfix " ,
" title " : description ,
" author_name " : user ,
2021-07-13 19:19:24 +02:00
" author_url " : video_link
2021-07-09 12:32:04 +02:00
}
return out
2021-07-04 01:52:30 +02:00
if __name__ == " __main__ " :
2021-07-08 05:17:23 +02:00
app . run ( host = ' 0.0.0.0 ' )