lib.itmens/catalog/sites/imdb.py

from catalog.common import *
from .tmdb import search_tmdb_by_imdb_id
from catalog.movie.models import *
from catalog.tv.models import *
import logging


# Module-level logger, named after this module.
_logger = logging.getLogger(__name__)


@SiteManager.register
class IMDB(AbstractSite):
    """Site adapter for IMDb title URLs.

    This class does not fetch IMDb pages itself: ``scrape`` looks the IMDb id
    up via ``search_tmdb_by_imdb_id`` and delegates the actual scraping to
    whichever site ``SiteManager`` resolves for the matching themoviedb.org
    URL.
    """

    SITE_NAME = SiteName.IMDB
    ID_TYPE = IdType.IMDB
    # The capture group is the "tt<digits>" title id.
    URL_PATTERNS = [r'\w+://www.imdb.com/title/(tt\d+)']
    WIKI_PROPERTY_ID = '?'

    @classmethod
    def id_to_url(cls, id_value):
        """Return the IMDb title page URL for ``id_value`` (e.g. ``tt0111161``)."""
        return "https://www.imdb.com/title/" + id_value + "/"

    def scrape(self):
        """Resolve this IMDb id through TMDB and scrape the TMDB entry instead.

        The lookup result is checked in this order: movie, TV show, TV season,
        TV episode. The first non-empty result list decides which
        themoviedb.org URL is scraped.

        Returns:
            Whatever the resolved TMDB site's ``scrape()`` returns, with
            ``metadata['preferred_model']`` set to the name of that site's
            ``DEFAULT_MODEL``.

        Raises:
            ParseError: if the lookup returns no usable result, or if the id
                matches an episode that is neither in season 0 nor the first
                episode of its season.
        """
        self.scraped = False
        res_data = search_tmdb_by_imdb_id(self.id_value)

        # .get() treats a missing key, None and an empty list alike: "no match".
        movies = res_data.get('movie_results')
        shows = res_data.get('tv_results')
        seasons = res_data.get('tv_season_results')
        episodes = res_data.get('tv_episode_results')

        if movies:
            url = f"https://www.themoviedb.org/movie/{movies[0]['id']}"
        elif shows:
            url = f"https://www.themoviedb.org/tv/{shows[0]['id']}"
        elif seasons:
            # this should not happen given IMDB only has ids for either show or episode
            # No episode number exists on this path, so link to the season
            # page (the previous code referenced an unbound episode_number).
            tv_id = seasons[0]['show_id']
            season_number = seasons[0]['season_number']
            url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}"
        elif episodes:
            tv_id = episodes[0]['show_id']
            season_number = episodes[0]['season_number']
            episode_number = episodes[0]['episode_number']
            if season_number == 0:
                # Season 0 episodes are linked individually.
                url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}/episode/{episode_number}"
            elif episode_number == 1:
                # The first episode of any other season stands in for the season.
                url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}"
            else:
                raise ParseError(self, "IMDB id matching TMDB but not first episode, this is not supported")
        else:
            raise ParseError(self, "IMDB id not found in TMDB")

        tmdb = SiteManager.get_site_by_url(url)
        pd = tmdb.scrape()
        # Record which model the delegated TMDB site would create by default.
        pd.metadata['preferred_model'] = tmdb.DEFAULT_MODEL.__name__
        return pd
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`from catalog.common import *`
add douban book works; add goodread works; auto link season to show 2022-12-08 05:53:00 +00:00			`from .tmdb import search_tmdb_by_imdb_id`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`from catalog.movie.models import *`
			`from catalog.tv.models import *`
			`import logging`


rename a few methods 2022-12-08 16:59:03 +00:00			`_logger = logging.getLogger(__name__)`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00

new data model: /book/<uid> 2022-12-15 17:29:35 -05:00			`@SiteManager.register`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`class IMDB(AbstractSite):`
new data model: view detail page 2022-12-16 01:08:10 -05:00			`SITE_NAME = SiteName.IMDB`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`ID_TYPE = IdType.IMDB`
			`URL_PATTERNS = [r'\w+://www.imdb.com/title/(tt\d+)']`
			`WIKI_PROPERTY_ID = '?'`

			`@classmethod`
			`def id_to_url(self, id_value):`
			`return "https://www.imdb.com/title/" + id_value + "/"`

			`def scrape(self):`
			`self.scraped = False`
add douban book works; add goodread works; auto link season to show 2022-12-08 05:53:00 +00:00			`res_data = search_tmdb_by_imdb_id(self.id_value)`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`if 'movie_results' in res_data and len(res_data['movie_results']) > 0:`
			`url = f"https://www.themoviedb.org/movie/{res_data['movie_results'][0]['id']}"`
			`elif 'tv_results' in res_data and len(res_data['tv_results']) > 0:`
			`url = f"https://www.themoviedb.org/tv/{res_data['tv_results'][0]['id']}"`
			`elif 'tv_season_results' in res_data and len(res_data['tv_season_results']) > 0:`
			`# this should not happen given IMDB only has ids for either show or episode`
			`tv_id = res_data['tv_season_results'][0]['show_id']`
			`season_number = res_data['tv_season_results'][0]['season_number']`
			`url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}/episode/{episode_number}"`
			`elif 'tv_episode_results' in res_data and len(res_data['tv_episode_results']) > 0:`
			`tv_id = res_data['tv_episode_results'][0]['show_id']`
			`season_number = res_data['tv_episode_results'][0]['season_number']`
			`episode_number = res_data['tv_episode_results'][0]['episode_number']`
			`if season_number == 0:`
			`url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}/episode/{episode_number}"`
			`elif episode_number == 1:`
			`url = f"https://www.themoviedb.org/tv/{tv_id}/season/{season_number}"`
			`else:`
			`raise ParseError(self, "IMDB id matching TMDB but not first episode, this is not supported")`
			`else:`
			`raise ParseError(self, "IMDB id not found in TMDB")`
new data model: /book/<uid> 2022-12-15 17:29:35 -05:00			`tmdb = SiteManager.get_site_by_url(url)`
new catalog data model, wip, not enabled 2022-12-07 19:09:05 -05:00			`pd = tmdb.scrape()`
			`pd.metadata['preferred_model'] = tmdb.DEFAULT_MODEL.__name__`
			`return pd`