vcinema/vcinema_utils/VCinemaUtils.py

151 lines
4.9 KiB
Python
Raw Normal View History

2022-02-27 14:34:23 +00:00
from collections import Counter
2022-04-03 20:23:22 +01:00
from concurrent.futures import ThreadPoolExecutor
2022-03-12 16:08:02 +00:00
import csv
2022-02-20 21:26:38 +00:00
from imdb_utils import IMDbUtils
2022-02-27 14:34:23 +00:00
from bookstack import Bookstack
2022-02-20 21:26:38 +00:00
2022-02-20 21:53:36 +00:00
# Base URL of the wiki; passed as the first argument to the Bookstack calls in this module.
JACKNET_WIKI_URL = "https://wiki.jacknet.io"
2022-03-26 00:33:39 +00:00
# Page ID of https://wiki.jacknet.io/books/vcinema/page/csv
# Attachments whose 'uploaded_to' equals this ID are searched for the viewings CSV.
CSV_PAGE_ID = 11
2022-02-20 21:53:36 +00:00
2022-04-03 20:23:22 +01:00
def get_viewings_csv_attachment_id(token_id, token_secret):
    """Find the ID of the viewings CSV attachment on the wiki.

    Lists the attachments via ``Bookstack.get_attachments`` and returns the
    ``'id'`` of the first one that is uploaded to ``CSV_PAGE_ID`` and is named
    ``vcinema.csv``.

    Args:
        token_id: API token ID forwarded to the Bookstack helper.
        token_secret: API token secret forwarded to the Bookstack helper.

    Returns:
        The matching attachment's ``'id'``, or ``None`` when nothing matches.
    """
    all_attachments = Bookstack.get_attachments(JACKNET_WIKI_URL, token_id, token_secret)
    wanted_name = "vcinema.csv"

    for attachment in all_attachments:
        if attachment['uploaded_to'] == CSV_PAGE_ID and attachment['name'] == wanted_name:
            return attachment['id']

    return None
def get_vcinema_viewings(token_id, token_secret, viewings_csv=None, combine_repeat_viewings=True):
    """Parse the viewings CSV into a list of viewing dicts.

    Args:
        token_id: API token ID, used only when the CSV has to be downloaded.
        token_secret: API token secret, used only when the CSV has to be
            downloaded.
        viewings_csv: Optional CSV content. UTF-8 encoded bytes are decoded;
            an already-decoded ``str`` is used as-is. When ``None`` the CSV
            attachment is fetched from the wiki.
        combine_repeat_viewings: When true, rows sharing an ``'imdb_id'`` are
            merged into a single entry (kept at the position of the first
            occurrence). The ``'date_watched'``, ``'season'`` and ``'rating'``
            columns are moved into a ``'viewings'`` list holding one dict per
            watch, in CSV order.

    Returns:
        A list of dicts, one per CSV row (or one per film when combining).

    Raises:
        KeyError: When combining and a row lacks ``'imdb_id'``,
            ``'date_watched'``, ``'season'`` or ``'rating'``.
    """
    if viewings_csv is None:
        attachment_id = get_viewings_csv_attachment_id(token_id, token_secret)
        viewings_csv = Bookstack.get_attachment(JACKNET_WIKI_URL, token_id, token_secret, attachment_id)

    # Callers may hand over text that is already decoded; only decode otherwise.
    if not isinstance(viewings_csv, str):
        viewings_csv = viewings_csv.decode("utf-8")

    viewings_csv_rows = viewings_csv.strip().split("\n")
    viewings = list(csv.DictReader(viewings_csv_rows, quotechar='"'))

    if not combine_repeat_viewings:
        return viewings

    # Single pass: dicts preserve insertion order, so each film stays at the
    # position of its first watch and later watches are appended in CSV order.
    films_by_id = {}
    for viewing in viewings:
        watch = {
            'date_watched': viewing.pop('date_watched'),
            'season': viewing.pop('season'),
            'rating': viewing.pop('rating'),
        }
        imdb_id = viewing['imdb_id']
        first_watch = films_by_id.get(imdb_id)
        if first_watch is None:
            viewing['viewings'] = [watch]
            films_by_id[imdb_id] = viewing
        else:
            first_watch['viewings'].append(watch)

    return list(films_by_id.values())
2022-04-03 20:23:22 +01:00
def add_imdb_data(imdb_id, viewings, data_fields, progressbar=None):
    """Copy selected IMDb fields onto the viewings of one film.

    Fetches the movie with ``IMDbUtils.get_movie`` and, for every viewing whose
    ``'imdb_id'`` equals the movie's ``movieID``, copies each field listed in
    ``data_fields`` that the movie contains. The viewings are mutated in place.

    Args:
        imdb_id: IMDb ID of the film to look up.
        viewings: Iterable of viewing dicts to update.
        data_fields: Names of the movie fields to copy.
        progressbar: Optional object whose ``next()`` is called once after the
            update.
    """
    film = IMDbUtils.get_movie(imdb_id)

    for entry in viewings:
        if entry['imdb_id'] != film.movieID:
            continue
        for name in data_fields:
            if name not in film:
                continue
            entry[name] = film[name]

    if progressbar is None:
        return
    progressbar.next()
2022-02-27 14:34:23 +00:00
2022-04-03 20:27:09 +01:00
def add_imdb_keywords(imdb_id, viewings, progressbar=None):
    """Copy IMDb keywords onto the viewings of one film.

    Fetches the movie with ``IMDbUtils.get_movie_keywords`` and, when it
    contains ``'keywords'``, stores them on every viewing whose ``'imdb_id'``
    equals the movie's ``movieID``. The viewings are mutated in place.

    Args:
        imdb_id: IMDb ID of the film to look up.
        viewings: Iterable of viewing dicts to update.
        progressbar: Optional object whose ``next()`` is called once after the
            update.
    """
    film = IMDbUtils.get_movie_keywords(imdb_id)

    for entry in viewings:
        if entry['imdb_id'] != film.movieID:
            continue
        if 'keywords' in film:
            entry['keywords'] = film['keywords']

    if progressbar is None:
        return
    progressbar.next()
2022-04-03 20:23:22 +01:00
def add_imdb_data_to_viewings(viewings, field_names, progress_bar=None):
    """Enrich viewings with IMDb data using a pool of four worker threads.

    One ``add_imdb_data`` task per viewing is submitted when ``field_names``
    asks for anything besides ``'keywords'``, and one ``add_imdb_keywords``
    task per viewing when ``'keywords'`` is requested. The function returns
    once all submitted tasks have finished (the executor is used as a context
    manager). The viewings are mutated in place by the tasks.

    Note: the futures' results are never inspected, so exceptions raised
    inside a worker task are not propagated by this function.

    Args:
        viewings: List of viewing dicts, each with an ``'imdb_id'`` key.
        field_names: Names of the IMDb fields to add.
        progress_bar: Optional progress object. When given, its ``max`` is set
            to the number of submitted tasks, it is passed to every task, and
            ``finish()`` is called at the end. When ``None`` no progress
            reporting is attempted.
    """
    with ThreadPoolExecutor(4) as executor:
        future_imdb_tasks = set()

        if ('keywords' in field_names and len(field_names) > 1) or \
                ('keywords' not in field_names and len(field_names) > 0):
            future_imdb_tasks.update(
                executor.submit(add_imdb_data, viewing['imdb_id'], viewings, field_names, progress_bar)
                for viewing in viewings)

        if 'keywords' in field_names:
            future_imdb_tasks.update(
                executor.submit(add_imdb_keywords, viewing['imdb_id'], viewings, progress_bar)
                for viewing in viewings)

        # progress_bar defaults to None; only touch it when one was supplied.
        if progress_bar is not None:
            progress_bar.max = len(future_imdb_tasks)

    if progress_bar is not None:
        progress_bar.finish()
2022-03-26 00:33:39 +00:00
2022-02-20 21:26:38 +00:00
2022-04-03 22:27:49 +01:00
def filter_viewings(viewings, filter_field):
    """Group viewings by the value(s) of one field.

    Viewings that lack ``filter_field`` are skipped. When the field holds a
    list, the viewing is filed under every element of that list; otherwise it
    is filed under the field value itself.

    Args:
        viewings: Iterable of viewing dicts.
        filter_field: Key whose value(s) become the keys of the result.

    Returns:
        A dict mapping each field value to the list of viewings carrying it.
    """
    grouped = {}

    for entry in viewings:
        if filter_field not in entry:
            continue

        value = entry[filter_field]
        # A list-valued field contributes one group key per element.
        group_keys = list(value) if isinstance(value, list) else [value]
        for group_key in group_keys:
            grouped.setdefault(group_key, []).append(entry)

    return grouped
2022-04-08 21:37:14 +01:00
def get_film_list(films):
    """Render films as IMDb links separated by ``<br>``.

    Args:
        films: Iterable of film dicts accepted by ``generate_imdb_film_link``.

    Returns:
        The links joined with ``"<br>"``, or an empty string when there are no
        films.
    """
    links = [generate_imdb_film_link(entry) for entry in films]
    return "<br>".join(links) if links else ""
2022-12-04 14:11:27 +00:00
def generate_markdown_link(text, url):
    """Return a Markdown inline link of the form ``[text](url)``."""
    return f"[{text}]({url})"
def generate_imdb_film_link(film):
    """Return a Markdown link to a film's IMDb page.

    Args:
        film: Dict with a ``'title'`` (used as link text) and an ``'imdb_id'``
            (used to build the URL).
    """
    link_text = film['title']
    target_url = generate_imdb_url(film['imdb_id'])
    return generate_markdown_link(link_text, target_url)
2022-12-04 14:11:27 +00:00
def generate_wikipedia_page_link(page_title):
    """Return a Markdown link whose text is ``page_title`` and whose target is
    whatever ``generate_wikipedia_url`` returns for that title."""
    target_url = generate_wikipedia_url(page_title)
    return generate_markdown_link(page_title, target_url)
def generate_imdb_url(imdb_id):
    """Return the IMDb title URL for ``imdb_id`` (the ``tt`` prefix is added here)."""
    return f"https://www.imdb.com/title/tt{imdb_id}/"
def generate_wikipedia_url(page_title):
    """Return the English Wikipedia URL for a page title.

    Spaces in ``page_title`` are replaced with underscores; no other escaping
    is applied.

    Args:
        page_title: Title of the Wikipedia page.

    Returns:
        The page URL as a string.
    """
    # The URL was previously built but never returned, so callers received None.
    return "https://en.wikipedia.org/wiki/{}".format(page_title.replace(" ", "_"))