downloading missing trailers to archive

This commit is contained in:
simon 2021-04-16 14:16:27 +07:00
parent 4817c1d752
commit cc6e0198a0
3 changed files with 197 additions and 3 deletions

View File

@ -12,6 +12,7 @@ import src.tvsort as tvsort
import src.tvsort_id as tvsort_id
import src.moviesort as moviesort
import src.db_export as db_export
import src.trailers as trailers
def get_config():
@ -42,6 +43,15 @@ def get_config():
config["emby_url"] = config_parser.get('emby', 'emby_url')
config["emby_user_id"] = config_parser.get('emby', 'emby_user_id')
config["emby_api_key"] = config_parser.get('emby', 'emby_api_key')
# youtubedl_ops
ydl_opts = dict(config_parser.items('ydl_opts'))
# dedect string literals, is there a better way to do that?
for key, value in ydl_opts.items():
if value.isdigit():
ydl_opts[key] = int(value)
elif value.lower() in ['true', 'false']:
ydl_opts[key] = bool(value)
config['ydl_opts'] = ydl_opts
return config
@ -50,11 +60,13 @@ def get_pending_all(config):
# call subfunction to collect pending
pending_movie = moviesort.get_pending(config['movie_downpath'])
pending_tv = tvsort.get_pending(config['tv_downpath'])
pending_total = pending_movie + pending_tv
pending_trailer = trailers.get_pending(config)
pending_total = pending_movie + pending_tv + pending_trailer
# build dict
pending = {}
pending['movies'] = pending_movie
pending['tv'] = pending_tv
pending['trailer'] = pending_trailer
pending['total'] = pending_total
return pending
@ -76,8 +88,10 @@ def print_menu(stdscr, current_row_idx, menu, config):
pending_count = pending['movies']
elif row == 'TV shows':
pending_count = pending['tv']
elif row == 'Trailer download':
pending_count = pending['trailer']
else:
pending_count = 0
pending_count = ' '
# center whole
y = h // 2 - len(menu) + idx
# print string to menu
@ -104,6 +118,8 @@ def sel_handler(menu_item, config):
tvsort.main(config, tvsort_id)
elif menu_item == 'DB export':
db_export.main(config)
elif menu_item == 'Trailer download':
trailers.main(config)
def curses_main(stdscr, menu, config):
@ -141,7 +157,7 @@ def curses_main(stdscr, menu, config):
def main():
""" main wraps the curses menu """
# setup
menu = ['All', 'Movies', 'TV shows', 'DB export', 'Exit']
menu = ['All', 'Movies', 'TV shows', 'DB export', 'Trailer download', 'Exit']
config = get_config()
log_file = path.join(config["log_folder"], 'rename.log')
logging.basicConfig(filename=log_file,level=logging.INFO,format='%(asctime)s:%(message)s')

178
src/trailers.py Normal file
View File

@ -0,0 +1,178 @@
""" download trailers found in emby with youtube-dl """
import os
import re
import requests
import subprocess
import youtube_dl
from time import sleep
def incomplete(config):
""" search for incomplete downloads and trash them """
sortpath = config['sortpath']
file_list = os.listdir(sortpath)
trashed = False
for file in file_list:
if file.endswith('.part') or file.endswith('.ytdl'):
trashed = True
file_path = os.path.join(sortpath, file)
os.path.isfile(file_path)
subprocess.call(['trash', file_path])
return trashed
def get_local_trailers(config):
""" gets a list of existing trailers on filesystem """
emby_url = config['emby_url']
emby_api_key = config['emby_api_key']
url = (emby_url + '/Trailers?api_key=' + emby_api_key +
'&Recursive=True&Fields=Path,MediaStreams')
r = requests.get(url).json()
local_trailer_list = []
for movie in r['Items']:
trailer_name = movie['Name']
trailing_pattern = re.compile(r'(.*_)([0-9a-zA-Z-_]{11})(-trailer)$')
youtube_id = trailing_pattern.findall(trailer_name)[0][1]
movie_name = movie['Path'].split('/')[-2]
media_streams = movie['MediaSources'][0]['MediaStreams']
video_stream = list(filter(lambda stream: stream['Type'] == 'Video', media_streams))
width = video_stream[0]['Width']
height = video_stream[0]['Height']
trailer_details = {'movie_name': movie_name, 'youtube_id': youtube_id,
'width': width, 'height': height}
local_trailer_list.append(trailer_details)
return local_trailer_list
def get_remote_trailers(config):
""" get a list of available trailers on emby """
emby_url = config['emby_url']
emby_api_key = config['emby_api_key']
# remote trailer urls
url = (emby_url + '/Items?api_key=' + emby_api_key +
'&Recursive=True&Fields=LocalTrailerCount,RemoteTrailers,Path&' +
'IncludeItemTypes=Movie')
r = requests.get(url).json()
remote_trailers_list = []
for movie in r['Items']:
movie_name = movie['Path'].split('/')[-2]
movie_path = '/'.join(movie['Path'].split('/')[-3:-1])
local_trailer_count = movie['LocalTrailerCount']
remote_trailers = movie['RemoteTrailers']
trailer_details = {'movie_name': movie_name, 'movie_path': movie_path,
'local_trailer_count': local_trailer_count,
'remote_trailers': remote_trailers}
remote_trailers_list.append(trailer_details)
return remote_trailers_list
def compare_download(local_trailer_list, remote_trailers_list, config):
""" figure out which trailers need downloading """
# failed before
log_file = os.path.join(config['log_folder'], 'trailers')
# check if log file exists
if not os.path.isfile(log_file):
# create empty file
open(log_file, 'a').close()
failed_ids = []
else:
with open(log_file, 'r') as f:
lines = f.readlines()
failed_ids = [i.split()[0] for i in lines]
# ids already downloaded
local_ids = [i['youtube_id'] for i in local_trailer_list]
# find pending
pending = []
for movie in remote_trailers_list:
movie_name = movie['movie_name']
for trailer in movie['remote_trailers']:
vid_id = trailer['Url'].split('?v=')[1]
if vid_id not in failed_ids and vid_id not in local_ids:
pending.append((vid_id, movie_name))
return pending
def dl_pending(pending, config):
""" download pending trailers """
sortpath = config['sortpath']
ydl_opts = config['ydl_opts']
# loop thrugh list
downloaded = []
for trailer in pending:
to_down_id = trailer[0]
movie_name = trailer[1]
filename = os.path.join(sortpath, movie_name + '_' + to_down_id + '-trailer.mkv')
ydl_opts['outtmpl'] = filename
# try up to 5 times
for i in range(5):
try:
print(f'[{i}] {to_down_id} {movie_name}')
youtube_dl.YoutubeDL(ydl_opts).download(['https://www.youtube.com/watch?v=' + to_down_id])
except KeyboardInterrupt:
return False
except:
if i == 4:
# giving up
log_file = os.path.join(config['log_folder'], 'trailers')
with open(log_file, 'a') as f:
f.write(f'{to_down_id} {movie_name}\n')
return False
else:
sleep((i + 1) ** 2)
continue
else:
downloaded.append(to_down_id)
break
return downloaded
def archive(config):
""" move downloaded trailers to movie archive """
sortpath = config['sortpath']
moviepath = config['moviepath']
new_trailers = os.listdir(sortpath)
# loop through new trailers
for trailer in new_trailers:
# build path
year_pattern = re.compile(r'(\()([0-9]{4})(\))')
trailing_pattern = re.compile(r'(.*)(_[0-9a-zA-Z-_]{11}-trailer\.mkv)$')
movie_name = trailing_pattern.findall(trailer)[0][0]
year = year_pattern.findall(trailer)[0][1]
movie_folder = os.path.join(moviepath, year, movie_name)
# move if all good
if os.path.isdir(movie_folder):
old_file = os.path.join(sortpath, trailer)
new_file = os.path.join(movie_folder, trailer)
os.rename(old_file, new_file)
return new_trailers
def get_pending(config):
""" get a list of pending trailers """
local_trailer_list = get_local_trailers(config)
remote_trailers_list = get_remote_trailers(config)
pending = compare_download(local_trailer_list, remote_trailers_list, config)
return pending
def main(config):
""" main function to download pending trailers """
# check for clean folder
trashed = incomplete(config)
# look for trailer
if not trashed:
pending = get_pending(config)
# download if needed
if pending:
print(f'downloading {len(pending)} trailers')
downloaded = dl_pending(pending, config)
else:
print('no missing trailers found')
# move to archive
if downloaded:
new_trailers = archive(config)
print(f'downloaded {len(new_trailers)} new trailers')