#!/usr/bin/env python # -*- coding: utf-8 -*- """ usage: plex_netflix_check.py [-h] [-l [...]] [-s ] [-t ] Use instantwatcher.com to find if Plex items are on Netflix, Amazon, or both. optional arguments: -h, --help show this help message and exit -l [ ...], --library [ ...] Space separated list of case sensitive names to process. Allowed names are: (choices: Your show or movie library names) -s [], --search [] Search any name. -t [], --type [] Refine search for name by using type. (choices: movie, show) -e [], --episodes [] Refine search for individual episodes. (choices: True, False) (default: False) -site [], --site [] Refine search for name by using type. (choices: Netflix, Amazon, Both) (default: Both) -sl [], --search_limit [] Define number of search returns from page. Zero returns all. (default: 5) If title is matched in both, Amazon is first then Netflix. """ from __future__ import print_function from __future__ import unicode_literals from builtins import str import requests import argparse from xmljson import badgerfish as bf from lxml.html import fromstring from time import sleep from plexapi.server import PlexServer, CONFIG # pip install plexapi # ## Edit ## PLEX_URL = '' PLEX_TOKEN = '' if not PLEX_URL: PLEX_URL = CONFIG.data['auth'].get('server_baseurl', '') if not PLEX_TOKEN: PLEX_TOKEN = CONFIG.data['auth'].get('server_token', '') # ## /Edit ## sess = requests.Session() # Ignore verifying the SSL certificate sess.verify = False # '/path/to/certfile' # If verify is set to a path to a directory, # the directory must have been processed using the c_rehash utility supplied # with OpenSSL. if sess.verify is False: # Disable the warning that the request is insecure, we know that... import urllib3 urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning) plex = PlexServer(PLEX_URL, PLEX_TOKEN, session=sess) def instantwatch_search(name, media_type, site, search_limit): NETFLIX_URL = 'http://www.netflix.com/title/' limit = False results_count = 0 if media_type == 'movie': content_type = '1' elif media_type == 'show': content_type = '2' elif media_type == 'episode': content_type = '4' else: content_type = '' payload = {'content_type': content_type, 'q': name.lower()} if site == 'Netflix': r = requests.get('http://instantwatcher.com/netflix/78/search'.rstrip('/'), params=payload) elif site == 'Amazon': r = requests.get('http://instantwatcher.com/amazon/search'.rstrip('/'), params=payload) else: r = requests.get('http://instantwatcher.com/u/search'.rstrip('/'), params=payload) if r.status_code != 200: print('{} not found: {}'.format(name, r.url)) return 0 results_lst = [] res_data = bf.data(fromstring(r.content)) res_data = res_data['html']['body']['div']['div'][1] # Any matches? res_results = res_data['div'][1]['div'][0] title_check = res_data['div'][1]['div'][1] try: if res_results['span']: total_results = res_results['span'] for data in total_results: results_lst += [data['$']] except Exception: pass print('{} found {}.'.format(results_lst[0], results_lst[1])) result_count = int(results_lst[1].split(' ')[0]) amazon_id = '' amazon_url = '' # Title match if result_count == 0: print('0 matches, moving on.') pass else: item_results_page = title_check['div']['div'] if result_count > 1: for results in item_results_page: for data in results['a']: try: amazon_id = data['@data-amazon-title-id'] amazon_url = data['@data-amazon-uri'] except Exception: pass for data in results['span']: if data['@class'] == 'title' and search_limit != 0: if str(data['a']['$']).lower().startswith(name.lower()): if amazon_id: if data['a']['@data-title-id'] == amazon_id: print('Match found on Amazon for {}'.format(data['a']['$'])) print('Page: {}'.format(amazon_url)) else: print('Match found on Netflix for {}'.format(data['a']['$'])) print('Page: {}{}'.format(NETFLIX_URL, data['a']['@data-title-id'])) results_count += 1 search_limit -= 1 if search_limit == 0: limit = True elif data['@class'] == 'title' and search_limit == 0 and limit is False: if data['a']['$'].lower().startswith(name.lower()): if amazon_id: if data['a']['@data-title-id'] == amazon_id: print('Match found on Amazon for {}'.format(data['a']['$'])) print('Page: {}'.format(amazon_url)) else: print('Match found on Netflix for {}'.format(data['a']['$'])) print('Page: {}{}'.format(NETFLIX_URL, data['a']['@data-title-id'])) results_count += 1 elif result_count == 1: for data in item_results_page['a']: try: amazon_id = data['@data-amazon-title-id'] amazon_url = data['@data-amazon-uri'] except Exception: pass for data in item_results_page['span']: if data['@class'] == 'title': if data['a']['$'].lower().startswith(name.lower()): print('Match! For {}'.format(data['a']['$'])) if amazon_id: if data['a']['@data-title-id'] == amazon_id: print('Page: {}'.format(amazon_url)) else: print('Page: {}{}'.format(NETFLIX_URL, data['a']['@data-title-id'])) results_count += 1 else: print('Could not find exact name match.') return results_count def plex_library_search(lib_name, site, epi_search, search_limit): for title in plex.library.section(lib_name).all(): print('Running check on {}'.format(title.title)) file_path = [] if title.type == 'show' and epi_search is True: if instantwatch_search(title.title, title.type, site, search_limit) > 0: print('Show was found. Searching for episode paths.') for episode in title.episodes(): # Need to check episodes against sites to truly find episode matches. # For now just return paths for episodes if Show name matches. # print('Running check on {} - {}'.format(title.title, episode.title)) # show_ep = '{} - {}'.format(title.title, episode.title) # if instantwatch_search(show_ep, 'episode', site) > 0: file_path += [episode.media[0].parts[0].file] elif title.type == 'movie': if instantwatch_search(title.title, title.type, site, search_limit) > 0: file_path = title.media[0].parts[0].file else: if instantwatch_search(title.title, title.type, site, search_limit) > 0: print('Show was found but path is not defined.') if file_path: if type(file_path) is str: print('File: {}'.format(file_path)) elif type(file_path) is list: print('Files: \n{}'.format(' \n'.join(file_path))) print('Waiting 5 seconds before next search.') sleep(5) def main(): sections_lst = [d.title for d in plex.library.sections() if d.type in ['show', 'movie']] parser = argparse.ArgumentParser(description="Use instantwatcher.com to find if Plex items are on Netflix.", formatter_class=argparse.RawTextHelpFormatter) parser.add_argument('-l', '--library', metavar='', choices=sections_lst, nargs='+', help='Space separated list of case sensitive names to process. Allowed names are:\n' '(choices: %(choices)s)') parser.add_argument('-s', '--search', metavar='', nargs='?', type=str, help='Search any name.') parser.add_argument('-m', '--media_type', metavar='', choices=['movie', 'show'], nargs='?', help='Refine search for name by using media type.\n' '(choices: %(choices)s)') parser.add_argument('-e', '--episodes', metavar='', nargs='?', type=bool, default=False, choices=[True, False], help='Refine search for individual episodes.\n' '(choices: %(choices)s)\n(default: %(default)s)') parser.add_argument('-site', '--site', metavar='', choices=['Netflix', 'Amazon', 'Both'], nargs='?', default='Netflix', help='Refine search for name by using type.\n' '(choices: %(choices)s)\n(default: %(default)s)') parser.add_argument('-sl', '--search_limit', metavar='', nargs='?', type=int, default=5, help='Define number of search returns from page. Zero returns all.' '\n(default: %(default)s)') opts = parser.parse_args() # print(opts) if opts.search: instantwatch_search(opts.search, opts.media_type, opts.site, opts.search_limit) else: if len(opts.library) > 1: for section in opts.library: plex_library_search(section, opts.site, opts.episodes, opts.search_limit) else: plex_library_search(opts.library[0], opts.site, opts.episodes, opts.search_limit) if __name__ == '__main__': main()