vcinema/vcinema_utils/VCinemaUtils.py

from concurrent.futures import ThreadPoolExecutor
import csv
from datetime import datetime

from vcinema_utils.VCinemaFilm import VCinemaFilm
from imdb_utils import IMDbUtils
from bookstack import Bookstack


# Base URL of the Jacknet wiki; passed as the first argument to the
# Bookstack helper calls in this module.
JACKNET_WIKI_URL = "https://wiki.jacknet.io"

# Page ID of https://wiki.jacknet.io/books/vcinema/page/csv
# Attachment records are matched against this ID through their
# 'uploaded_to' field when looking for the viewings CSV.
CSV_PAGE_ID = 11


def get_viewings_csv_attachment_id(token_id, token_secret):
    """Look up the ID of the "vcinema.csv" attachment on the CSV wiki page.

    The attachment records come from ``Bookstack.get_attachments``. The
    ``'id'`` of the first record whose ``'uploaded_to'`` equals
    ``CSV_PAGE_ID`` and whose ``'name'`` is ``"vcinema.csv"`` is returned;
    ``None`` is returned when no record matches.
    """
    wanted_name = "vcinema.csv"

    for attachment in Bookstack.get_attachments(JACKNET_WIKI_URL, token_id, token_secret):
        if attachment['uploaded_to'] == CSV_PAGE_ID and attachment['name'] == wanted_name:
            return attachment['id']

    return None


def get_vcinema_viewings(token_id, token_secret):
    """Download the viewings CSV attachment and parse it into row dicts.

    The attachment ID is resolved with ``get_viewings_csv_attachment_id``.
    The payload returned by ``Bookstack.get_attachment`` is decoded as UTF-8,
    stripped of surrounding whitespace, split on line feeds and handed to
    ``csv.DictReader``, so every returned element maps the header row's
    column names to that row's values.
    """
    csv_attachment_id = get_viewings_csv_attachment_id(token_id, token_secret)
    raw_csv = Bookstack.get_attachment(JACKNET_WIKI_URL, token_id, token_secret, csv_attachment_id)

    csv_lines = raw_csv.decode("utf-8").strip().split("\n")
    reader = csv.DictReader(csv_lines, quotechar='"')

    return list(reader)


def get_vcinema_films(token_id, token_secret):
    """Build one ``VCinemaFilm`` per distinct IMDb ID in the viewings CSV.

    Each row from ``get_vcinema_viewings`` is recorded on its film through
    ``add_viewing`` with the parsed ``date_watched`` column (``%Y-%m-%d``)
    plus the ``season`` and ``rating`` columns. A film is created from the
    first row seen for its IMDb ID, so that row supplies the title.

    Returns the films as a list.
    """
    films_by_id = {}

    for row in get_vcinema_viewings(token_id, token_secret):
        imdb_id = row["imdb_id"]
        title = row["title"]

        film = films_by_id.get(imdb_id)
        if film is None:
            # First viewing of this film: create it and remember it by ID.
            film = films_by_id[imdb_id] = VCinemaFilm(imdb_id=imdb_id, title=title)

        watched_on = datetime.strptime(row['date_watched'], "%Y-%m-%d")
        film.add_viewing(watched_on, row['season'], row['rating'])

    return list(films_by_id.values())


def add_imdb_data(imdb_id, films, data_fields, progressbar=None):
    """Fetch one IMDb movie and copy the requested fields onto matching films.

    The movie is retrieved with ``IMDbUtils.get_movie(imdb_id)``. Every film
    in ``films`` whose ``get_imdb_id()`` equals the movie's ``movieID``
    receives, through ``film.add_imdb_data``, each field named in
    ``data_fields`` that the movie contains. When a progress bar is given,
    ``progressbar.next()`` is called once after the films were processed.
    """
    movie = IMDbUtils.get_movie(imdb_id)

    # Lazily narrow down to the films that belong to the fetched movie.
    matching_films = (film for film in films if film.get_imdb_id() == movie.movieID)

    for film in matching_films:
        for name in data_fields:
            if name in movie:
                film.add_imdb_data(name, movie[name])

    if progressbar is not None:
        progressbar.next()


def add_imdb_keywords(imdb_id, films, progressbar=None):
    """Fetch a movie's IMDb keywords and store them on matching films.

    The movie is retrieved with ``IMDbUtils.get_movie_keywords(imdb_id)``.
    Every film in ``films`` whose ``get_imdb_id()`` equals the movie's
    ``movieID`` gets the movie's ``'keywords'`` entry through
    ``film.add_imdb_data``, provided the movie has one. When a progress bar
    is given, ``progressbar.next()`` is called once at the end.
    """
    movie = IMDbUtils.get_movie_keywords(imdb_id)

    for film in films:
        if film.get_imdb_id() == movie.movieID and 'keywords' in movie:
            film.add_imdb_data('keywords', movie['keywords'])

    if progressbar is not None:
        progressbar.next()


def add_imdb_data_to_films(films, field_names, progress_bar=None):
    """Fetch IMDb data for every film using a pool of four worker threads.

    Up to two tasks are submitted per film:

    * ``add_imdb_data`` when ``field_names`` holds anything besides
      ``'keywords'``;
    * ``add_imdb_keywords`` when ``'keywords'`` is in ``field_names``.

    The call returns once all submitted tasks have finished, because leaving
    the executor's ``with`` block waits for them. Task results are never
    read here, so an exception raised inside a task is not re-raised.

    Args:
        films: Films to enrich; each must provide ``get_imdb_id()``.
        field_names: Names of the IMDb fields to fetch.
        progress_bar: Optional progress bar. When given, its ``max`` is set
            to the number of submitted tasks, it is passed on to every task,
            and ``finish()`` is called at the end. ``None`` disables
            progress reporting.
    """
    with ThreadPoolExecutor(4) as executor:
        future_imdb_tasks = set()

        wants_keywords = 'keywords' in field_names
        # The general fetch is only needed when something other than
        # 'keywords' was requested; keywords have their own task below.
        if len(field_names) > (1 if wants_keywords else 0):
            future_imdb_tasks.update(
                executor.submit(add_imdb_data, film.get_imdb_id(), films, field_names, progress_bar)
                for film in films
            )

        if wants_keywords:
            future_imdb_tasks.update(
                executor.submit(add_imdb_keywords, film.get_imdb_id(), films, progress_bar)
                for film in films
            )

        # progress_bar is optional: only touch it when one was supplied.
        if progress_bar is not None:
            progress_bar.max = len(future_imdb_tasks)

    if progress_bar is not None:
        progress_bar.finish()


def filter_films(films: "list[VCinemaFilm]", field: str) -> "dict[object, list[VCinemaFilm]]":
    """Group films by the value(s) of one IMDb data field.

    Films for which ``get_imdb_data(field)`` returns ``None`` are left out.
    When the field value is a list, the film is filed under every element
    of that list; otherwise it is filed under the value itself.

    The type hints are quoted so they are not evaluated when the function
    is defined.

    Args:
        films: Films to group; each must provide ``get_imdb_data(field)``.
        field: Name of the IMDb data field to group by.

    Returns:
        A dict mapping each encountered field value to the list of films
        carrying it, in the order the films were given.
    """
    films_by_value = {}

    for film in films:
        field_value = film.get_imdb_data(field)
        if field_value is None:
            continue

        # Treat a scalar as a one-element list so both cases share one path.
        values = field_value if isinstance(field_value, list) else [field_value]
        for value in values:
            films_by_value.setdefault(value, []).append(film)

    return films_by_value


def get_film_list(films: "list[VCinemaFilm]") -> str:
    """Return the films' IMDb links joined with ``<br>``.

    The type hint is quoted so it is not evaluated when the function is
    defined.

    Args:
        films: Films to list; each must provide ``get_imdb_link()``.

    Returns:
        The links in input order separated by ``<br>``, or an empty string
        when ``films`` is empty.
    """
    # Joining zero links already yields "", so no empty-case branch is needed.
    return "<br>".join(film.get_imdb_link() for film in films)


def generate_markdown_link(text, url) -> str:
    """Format ``text`` and ``url`` as a Markdown inline link, ``[text](url)``."""
    link_template = "[{}]({})"
    return link_template.format(text, url)


def generate_wikipedia_page_link(page_title):
    """Return a Markdown link labelled ``page_title`` that points at its Wikipedia URL."""
    wikipedia_url = generate_wikipedia_url(page_title)
    return generate_markdown_link(page_title, wikipedia_url)


def generate_wikipedia_url(page_title):
    """Build the English Wikipedia URL for ``page_title``, replacing spaces with underscores."""
    url_template = "https://en.wikipedia.org/wiki/{}"
    page_slug = page_title.replace(" ", "_")
    return url_template.format(page_slug)
refactor 2022-04-03 20:23:22 +01:00			`from concurrent.futures import ThreadPoolExecutor`
fix csv reading 2022-03-12 16:08:02 +00:00			`import csv`
apply changes 2022-12-19 22:26:38 +00:00			`from datetime import datetime`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`from vcinema_utils.VCinemaFilm import VCinemaFilm`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00			`from imdb_utils import IMDbUtils`
fix files by year page 2022-02-27 14:34:23 +00:00			`from bookstack import Bookstack`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00

move url to utils 2022-02-20 21:53:36 +00:00			`JACKNET_WIKI_URL = "https://wiki.jacknet.io"`

add start of wiki update script 2022-03-26 00:33:39 +00:00			`# Page ID of https://wiki.jacknet.io/books/vcinema/page/csv`
			`CSV_PAGE_ID = 11`
move url to utils 2022-02-20 21:53:36 +00:00
refactor 2022-04-03 20:23:22 +01:00
use csv file instead of reading from csv page 2022-02-20 22:00:14 +00:00			`def get_viewings_csv_attachment_id(token_id, token_secret):`
fix files by year page 2022-02-27 14:34:23 +00:00			`attachments = Bookstack.get_attachments(JACKNET_WIKI_URL, token_id, token_secret)`
use csv file instead of reading from csv page 2022-02-20 22:00:14 +00:00
			`viewings_csv_file_name = "vcinema.csv"`

add start of wiki update script 2022-03-26 00:33:39 +00:00			`return next((x['id'] for x in attachments if x['uploaded_to'] == CSV_PAGE_ID and x['name'] == viewings_csv_file_name), None)`
use csv file instead of reading from csv page 2022-02-20 22:00:14 +00:00

apply changes 2022-12-19 22:26:38 +00:00			`def get_vcinema_viewings(token_id, token_secret):`
			`attachment_id = get_viewings_csv_attachment_id(token_id, token_secret)`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`viewings_csv = Bookstack.get_attachment(JACKNET_WIKI_URL, token_id, token_secret, attachment_id)`
use csv file instead of reading from csv page 2022-02-20 22:00:14 +00:00			`viewings_csv = viewings_csv.decode("utf-8")`
apply changes 2022-12-19 22:26:38 +00:00
use csv file instead of reading from csv page 2022-02-20 22:00:14 +00:00			`viewings_csv_rows = viewings_csv.strip().split("\n")`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
use dictreader 2022-04-03 18:24:58 +01:00			`viewings = list(csv.DictReader(viewings_csv_rows, quotechar='"'))`
add season and rating to viewing list for each film 2022-03-08 22:44:20 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`return viewings`
fix csv reading 2022-03-12 16:08:02 +00:00
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`def get_vcinema_films(token_id, token_secret):`
			`viewings = get_vcinema_viewings(token_id, token_secret)`
			`films = {}`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`for viewing in viewings:`
			`imdb_id = viewing["imdb_id"]`
			`title = viewing["title"]`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`if imdb_id not in films.keys():`
			`film = VCinemaFilm(imdb_id=imdb_id, title=title)`
			`films[imdb_id] = film`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`date_watched = datetime.strptime(viewing['date_watched'], "%Y-%m-%d")`
			`season = viewing['season']`
			`rating = viewing['rating']`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`films[imdb_id].add_viewing(date_watched, season, rating)`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`return list(films.values())`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00
			`def add_imdb_data(imdb_id, films, data_fields, progressbar=None):`
refactor 2022-04-03 20:23:22 +01:00			`movie = IMDbUtils.get_movie(imdb_id)`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`for film in films:`
			`if film.get_imdb_id() == movie.movieID:`
refactor 2022-04-03 20:23:22 +01:00			`for field_name in data_fields:`
			`if field_name in movie:`
apply changes 2022-12-19 22:26:38 +00:00			`film.add_imdb_data(field_name, movie[field_name])`
fix files by year page 2022-02-27 14:34:23 +00:00
refactor 2022-04-03 20:23:22 +01:00			`if progressbar is not None:`
			`progressbar.next()`
use callback for tasks instead of adding extra function 2022-02-27 15:23:20 +00:00
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`def add_imdb_keywords(imdb_id, films, progressbar=None):`
add keywords to data 2022-04-03 20:27:09 +01:00			`movie = IMDbUtils.get_movie_keywords(imdb_id)`

apply changes 2022-12-19 22:26:38 +00:00			`for film in films:`
			`if film.get_imdb_id() == movie.movieID:`
add keywords to data 2022-04-03 20:27:09 +01:00			`if 'keywords' in movie:`
apply changes 2022-12-19 22:26:38 +00:00			`film.add_imdb_data('keywords', movie['keywords'])`
add keywords to data 2022-04-03 20:27:09 +01:00
			`if progressbar is not None:`
			`progressbar.next()`


apply changes 2022-12-19 22:26:38 +00:00			`def add_imdb_data_to_films(films, field_names, progress_bar=None):`
refactor 2022-04-03 20:23:22 +01:00			`with ThreadPoolExecutor(4) as executor:`
			`future_imdb_tasks = set()`

fix check 2022-04-08 21:06:31 +01:00			`if ('keywords' in field_names and len(field_names) > 1) or ('keywords' not in field_names and len(field_names) > 0):`
apply changes 2022-12-19 22:26:38 +00:00			`future_imdb_tasks.update(executor.submit(add_imdb_data, film.get_imdb_id(), films, field_names, progress_bar) for film in films)`
add keywords to data 2022-04-03 20:27:09 +01:00
			`if 'keywords' in field_names:`
apply changes 2022-12-19 22:26:38 +00:00			`future_imdb_tasks.update(executor.submit(add_imdb_keywords, film.get_imdb_id(), films, progress_bar) for film in films)`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
refactor 2022-04-03 20:23:22 +01:00			`progress_bar.max = len(future_imdb_tasks)`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
refactor 2022-04-03 20:23:22 +01:00			`if progress_bar is not None:`
			`progress_bar.finish()`
add start of wiki update script 2022-03-26 00:33:39 +00:00
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`def filter_films(films: [VCinemaFilm], field: str) -> [VCinemaFilm]:`
			`films_filtered = {}`
add update_films_by_year_page script 2022-02-20 21:26:38 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`for film in films:`
			`if film.get_imdb_data(field) is not None:`
			`field_value = film.get_imdb_data(field)`
			`if isinstance(field_value, list):`
			`for value in list(field_value):`
			`if value in films_filtered.keys():`
			`films_filtered[value] += [film]`
fix files by year page 2022-02-27 14:34:23 +00:00			`else:`
apply changes 2022-12-19 22:26:38 +00:00			`films_filtered[value] = [film]`
refactor script to take progress bar as arg 2022-02-27 15:34:06 +00:00			`else:`
apply changes 2022-12-19 22:26:38 +00:00			`if field_value in films_filtered.keys():`
			`films_filtered[field_value] += [film]`
refactor script to take progress bar as arg 2022-02-27 15:34:06 +00:00			`else:`
apply changes 2022-12-19 22:26:38 +00:00			`films_filtered[field_value] = [film]`
fix files by year page 2022-02-27 14:34:23 +00:00
apply changes 2022-12-19 22:26:38 +00:00			`return films_filtered`
add helper method 2022-04-08 21:37:14 +01:00

apply changes 2022-12-19 22:26:38 +00:00			`def get_film_list(films: [VCinemaFilm]) -> str:`
add helper method 2022-04-08 21:37:14 +01:00			`film_links = []`

			`for film in films:`
apply changes 2022-12-19 22:26:38 +00:00			`film_link = film.get_imdb_link()`
add helper method 2022-04-08 21:37:14 +01:00			`film_links.append(film_link)`

			`if len(film_links) > 0:`
			`return "<br>".join(film_links)`
			`else:`
			`return ""`
add helper functions 2022-12-04 14:11:27 +00:00

apply changes 2022-12-19 22:26:38 +00:00			`def generate_markdown_link(text, url) -> str:`
add helper functions 2022-12-04 14:11:27 +00:00			`return "[{}]({})".format(text, url)`


			`def generate_wikipedia_page_link(page_title):`
add missing helper functions 2022-12-04 14:25:17 +00:00			`return generate_markdown_link(page_title, generate_wikipedia_url(page_title))`


			`def generate_wikipedia_url(page_title):`
fix link 2022-12-10 07:59:05 +00:00			`return "https://en.wikipedia.org/wiki/{}".format(page_title.replace(" ", "_"))`