# Origin: commit d0ad869d8117ba5b87333b4827aade7408128698
# Author: Sarah
# Date: Thu, 14 Apr 2022 20:03:16 +0100
# Subject: [PATCH] add get_hidden_themes script
"""Print the keywords shared by every movie given on the command line."""

from imdb_utils import IMDbUtils

import argparse
from progress.bar import IncrementalBar


def get_hidden_themes(imdb_ids):
    """Return the set of keywords common to all of the given movies.

    Each id is passed to ``IMDbUtils.get_movie_keywords``. When the returned
    data contains a ``'keywords'`` entry, those keywords are intersected with
    the running result; ids whose data has no ``'keywords'`` entry are skipped
    and do not narrow the result. A progress bar is advanced once per id.

    Args:
        imdb_ids: Sized iterable of movie identifiers (``len()`` is used to
            size the progress bar).

    Returns:
        A set of the keywords shared by every movie that reported keywords,
        or an empty set when no movie reported any.
    """
    # None means "no movie with keywords seen yet"; the first keyword set
    # seeds the result, later ones narrow it.
    common = None

    progress = IncrementalBar(
        'Retrieving movie data',
        max=len(imdb_ids),
        suffix='%(percent).1f%% - %(eta)ds remaining',
        check_tty=False,
    )
    with progress:
        for imdb_id in imdb_ids:
            movie_data = IMDbUtils.get_movie_keywords(imdb_id)

            if 'keywords' in movie_data:
                current = set(movie_data['keywords'])
                common = current if common is None else common & current

            # Advance for every id, including the ones that were skipped.
            progress.next()

    return set() if common is None else common


if __name__ == '__main__':
    cli = argparse.ArgumentParser()
    cli.add_argument('imdb_ids', nargs="+", default=[])

    options = cli.parse_args()

    print(get_hidden_themes(options.imdb_ids))