unwind/tests/test_imdb.py

import bz2
import json
from pathlib import Path
from unittest.mock import AsyncMock

import bs4
import pytest

from unwind import imdb
from unwind.imdb import imdb_rating_from_score, score_from_imdb_rating

testsdir = Path(__file__).parent
fixturesdir = testsdir / "fixtures"


@pytest.mark.parametrize("rating", (x / 10 for x in range(10, 101)))
def test_rating_conversion(rating: float):
    assert rating == imdb_rating_from_score(score_from_imdb_rating(rating))


@pytest.mark.parametrize("score", range(0, 101))
def test_score_conversion(score: int):
    # Because our score covers 101 discrete values and IMDb's rating only 91
    # discrete values, the mapping is non-injective, i.e. 10 values can't be
    # mapped uniquely.
    non_injective = set(range(5, 100, 10))
    if score in non_injective:
        pytest.skip(f"Score cannot be mapped back correctly: {score}")

    assert score == score_from_imdb_rating(imdb_rating_from_score(score))


@pytest.mark.parametrize(
    "fixture",
    (
        ("most_popular_100.html.bz2"),
        ("most_popular_100-20240714.html.bz2"),
    ),
)
@pytest.mark.asyncio
async def test_load_most_popular_100(monkeypatch, fixture: str):
    with bz2.open(fixturesdir / fixture, "rb") as f:
        html = f.read()
    soup = bs4.BeautifulSoup(html, "html5lib")

    monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))

    movie_ids = await imdb.load_most_popular_100()
    assert len(set(movie_ids)) == 100
    assert all(id_.startswith("tt") for id_ in movie_ids)


@pytest.mark.parametrize(
    "fixture",
    (
        ("bottom_100.html.bz2"),
        ("bottom_100-20240714.html.bz2"),
    ),
)
@pytest.mark.asyncio
async def test_load_bottom_100(monkeypatch, fixture: str):
    with bz2.open(fixturesdir / fixture, "rb") as f:
        html = f.read()
    soup = bs4.BeautifulSoup(html, "html5lib")

    monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))

    movie_ids = await imdb.load_bottom_100()
    assert len(set(movie_ids)) == 100
    assert all(id_.startswith("tt") for id_ in movie_ids)


@pytest.mark.asyncio
async def test_load_top_250(monkeypatch):
    with bz2.open(fixturesdir / "top250.gql.json.bz2", "rb") as f:
        jsonstr = f.read()

    monkeypatch.setattr(imdb, "adownload", AsyncMock(return_value=jsonstr))

    movie_ids = await imdb.load_top_250()
    assert len(movie_ids) == 250
    assert all(id_.startswith("tt") for id_ in movie_ids)


@pytest.mark.asyncio
async def test_load_ratings_page(monkeypatch):
    with bz2.open(fixturesdir / "ratings-ur655321.html.bz2", "rb") as f:
        html = f.read()
    soup = bs4.BeautifulSoup(html, "html5lib")

    monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))

    page = await imdb._load_ratings_page("fakeurl", "ur655321")
    assert len(page.ratings) == 100
    assert page.imdb_user_id is not None
    assert page.imdb_user_id == "ur655321"
    assert page.imdb_user_name == "AlexUltra"
    assert page.next_page_url is not None
    assert page.next_page_url.startswith("/user/ur655321/ratings?")


def _mock_response(content: bytes):
    class MockResponse:
        def raise_for_status(self):
            pass

        def json(self):
            return json.loads(content)

    return MockResponse()


@pytest.mark.asyncio
async def test_load_ratings_page_20240510(monkeypatch):
    with bz2.open(fixturesdir / "ratings-ur655321-20240510.html.bz2", "rb") as f:
        html = f.read()
    soup = bs4.BeautifulSoup(html, "html5lib")
    monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))

    with bz2.open(fixturesdir / "ratings-ur655321-20240510.gql.json.bz2", "rb") as f:
        jsonstr = f.read()
    async with imdb.asession() as s:
        monkeypatch.setattr(s, "post", AsyncMock(return_value=_mock_response(jsonstr)))
        page = await imdb._load_ratings_page("fakeurl", "ur655321")
    assert len(page.ratings) == 100
    assert page.imdb_user_id is not None
    assert page.imdb_user_id == "ur655321"
    assert page.imdb_user_name == "AlexUltra"
    assert page.next_page_url is None, "not supported for new ratings page"

    def movie(item: dict):
        for rating in page.ratings:
            assert rating.movie
            if rating.movie.imdb_id == item["imdb_id"]:
                rating_dict = {key: getattr(rating.movie, key) for key in item.keys()}
                return rating_dict
        raise AssertionError(f"{item['imdb_id']} not found in page.ratings")

    a_movie = {
        "title": "Kung Fu Panda 4",
        "release_year": 2024,
        "media_type": "Movie",
        "imdb_id": "tt21692408",
        "imdb_score": 59,
        "imdb_votes": 36069,
        "runtime": 94,
        "genres": {"Action", "Adventure", "Animation"},
    }
    assert a_movie == movie(a_movie)

    a_running_tvseries = {
        "title": "Palm Royale",
        "release_year": 2024,
        "media_type": "TV Series",
        "imdb_id": "tt8888540",
        "imdb_score": 64,
        "imdb_votes": 6044,
        "genres": {"Drama"},
    }
    assert a_running_tvseries == movie(a_running_tvseries)

    a_finished_tvseries = {
        "title": "Fawlty Towers",
        "release_year": 1975,
        "media_type": "TV Series",
        "imdb_id": "tt0072500",
        "imdb_score": 87,
        "imdb_votes": 100261,
        "genres": {"Comedy"},
    }
    assert a_finished_tvseries == movie(a_finished_tvseries)

    a_tvepisode = {
        "title": "Columbo / No Time to Die",
        "original_title": "Columbo / No Time to Die",
        "release_year": 1992,
        "media_type": "TV Episode",
        "imdb_id": "tt0103987",
        "imdb_score": 59,
        "imdb_votes": 2122,
        "runtime": 98,
        "genres": {"Crime", "Drama", "Mystery"},
    }
    assert a_tvepisode == movie(a_tvepisode)

    a_videogame = {
        "title": "Alan Wake",
        "original_title": "Alan Wake",
        "release_year": 2010,
        "media_type": "Video Game",
        "imdb_id": "tt0466662",
        # The data from __NEXT_DATA__ is wrong, the actual values should be:
        # "imdb_score": 82,
        # "imdb_votes": 7300,
        # "genres": {"Action", "Adventure", "Horror"},
        "imdb_score": 67,  # Wrong value, but correctly parsed from __NEXT_DATA__
        "imdb_votes": 11655,  # Wrong value, but correctly parsed from __NEXT_DATA__
        "genres": {"Comedy", "Crime", "Drama"},  # Wrong value
    }
    assert a_videogame == movie(a_videogame)


@pytest.mark.asyncio
async def test_load_ratings_page_20240720(monkeypatch):
    with bz2.open(fixturesdir / "ratings-ur655321-20240720.html.bz2", "rb") as f:
        html = f.read()
    soup = bs4.BeautifulSoup(html, "html5lib")
    monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))

    with bz2.open(fixturesdir / "ratings-ur655321-20240720.gql.json.bz2", "rb") as f:
        jsonstr = f.read()
    async with imdb.asession() as s:
        monkeypatch.setattr(s, "post", AsyncMock(return_value=_mock_response(jsonstr)))
        page = await imdb._load_ratings_page("fakeurl", "ur655321")
    assert len(page.ratings) == 100
    assert page.imdb_user_id is not None
    assert page.imdb_user_id == "ur655321"
    assert page.imdb_user_name == "AlexUltra"
    assert page.next_page_url is None, "not supported for new ratings page"

    def movie(item: dict):
        for rating in page.ratings:
            assert rating.movie
            if rating.movie.imdb_id == item["imdb_id"]:
                rating_dict = {key: getattr(rating.movie, key) for key in item.keys()}
                return rating_dict
        raise AssertionError(f"{item['imdb_id']} not found in page.ratings")

    a_movie = {
        "title": "Kung Fu Panda 4",
        "release_year": 2024,
        "media_type": "Movie",
        "imdb_id": "tt21692408",
        "imdb_score": 59,
        "imdb_votes": 48018,
        "runtime": 94,
    }
    assert a_movie == movie(a_movie)

    a_running_tvseries = {
        "title": "Palm Royale",
        "release_year": 2024,
        "media_type": "TV Series",
        "imdb_id": "tt8888540",
        "imdb_score": 63,
        "imdb_votes": 9458,
    }
    assert a_running_tvseries == movie(a_running_tvseries)

    a_finished_tvseries = {
        "title": "Fawlty Towers",
        "release_year": 1975,
        "media_type": "TV Series",
        "imdb_id": "tt0072500",
        "imdb_score": 87,
        "imdb_votes": 100860,
    }
    assert a_finished_tvseries == movie(a_finished_tvseries)
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`import bz2`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`import json`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`from pathlib import Path`
			`from unittest.mock import AsyncMock`

			`import bs4`
add imdb full import mode 2021-06-21 18:54:03 +02:00			`import pytest`
apply auto-formatting to tests 2023-02-04 18:15:14 +01:00
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`from unwind import imdb`
add imdb full import mode 2021-06-21 18:54:03 +02:00			`from unwind.imdb import imdb_rating_from_score, score_from_imdb_rating`

feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`testsdir = Path(__file__).parent`
			`fixturesdir = testsdir / "fixtures"`

add imdb full import mode 2021-06-21 18:54:03 +02:00
			`@pytest.mark.parametrize("rating", (x / 10 for x in range(10, 101)))`
fix tests for Pytest-Asyncio running in strict mode 2023-02-04 18:12:50 +01:00			`def test_rating_conversion(rating: float):`
add imdb full import mode 2021-06-21 18:54:03 +02:00			`assert rating == imdb_rating_from_score(score_from_imdb_rating(rating))`


			`@pytest.mark.parametrize("score", range(0, 101))`
fix tests for Pytest-Asyncio running in strict mode 2023-02-04 18:12:50 +01:00			`def test_score_conversion(score: int):`
add imdb full import mode 2021-06-21 18:54:03 +02:00			`# Because our score covers 101 discrete values and IMDb's rating only 91`
			`# discrete values, the mapping is non-injective, i.e. 10 values can't be`
			`# mapped uniquely.`
			`non_injective = set(range(5, 100, 10))`
			`if score in non_injective:`
			`pytest.skip(f"Score cannot be mapped back correctly: {score}")`

			`assert score == score_from_imdb_rating(imdb_rating_from_score(score))`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00

fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`@pytest.mark.parametrize(`
			`"fixture",`
			`(`
			`("most_popular_100.html.bz2"),`
			`("most_popular_100-20240714.html.bz2"),`
			`),`
			`)`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`@pytest.mark.asyncio`
fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`async def test_load_most_popular_100(monkeypatch, fixture: str):`
			`with bz2.open(fixturesdir / fixture, "rb") as f:`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`html = f.read()`
			`soup = bs4.BeautifulSoup(html, "html5lib")`

			`monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))`

			`movie_ids = await imdb.load_most_popular_100()`
fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`assert len(set(movie_ids)) == 100`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`assert all(id_.startswith("tt") for id_ in movie_ids)`


fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`@pytest.mark.parametrize(`
			`"fixture",`
			`(`
			`("bottom_100.html.bz2"),`
			`("bottom_100-20240714.html.bz2"),`
			`),`
			`)`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`@pytest.mark.asyncio`
fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`async def test_load_bottom_100(monkeypatch, fixture: str):`
			`with bz2.open(fixturesdir / fixture, "rb") as f:`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`html = f.read()`
			`soup = bs4.BeautifulSoup(html, "html5lib")`

			`monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))`

			`movie_ids = await imdb.load_bottom_100()`
fix: support new "most popular 100" & "bottom 100" HTML The previous version had all 100 movies rendered into the HTML. The new version has only the top 25 rendered into HTML, but the whole list has been made available as LD+JSON data. Since we can easily support both, we don't (yet) remove the old parser. 2024-07-14 16:09:02 +02:00			`assert len(set(movie_ids)) == 100`
feat: add functions to retrieve IMDb chart lists These charts are - the top 250 highest rated movies - the top 100 most popular movies - the bottom 100 lowest rated movies 2024-05-10 00:12:25 +02:00			`assert all(id_.startswith("tt") for id_ in movie_ids)`


			`@pytest.mark.asyncio`
			`async def test_load_top_250(monkeypatch):`
			`with bz2.open(fixturesdir / "top250.gql.json.bz2", "rb") as f:`
			`jsonstr = f.read()`

			`monkeypatch.setattr(imdb, "adownload", AsyncMock(return_value=jsonstr))`

			`movie_ids = await imdb.load_top_250()`
			`assert len(movie_ids) == 250`
			`assert all(id_.startswith("tt") for id_ in movie_ids)`
fix: find next rating page 2024-05-10 00:13:32 +02:00

			`@pytest.mark.asyncio`
			`async def test_load_ratings_page(monkeypatch):`
			`with bz2.open(fixturesdir / "ratings-ur655321.html.bz2", "rb") as f:`
			`html = f.read()`
			`soup = bs4.BeautifulSoup(html, "html5lib")`

			`monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))`

feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`page = await imdb._load_ratings_page("fakeurl", "ur655321")`
fix: find next rating page 2024-05-10 00:13:32 +02:00			`assert len(page.ratings) == 100`
			`assert page.imdb_user_id is not None`
			`assert page.imdb_user_id == "ur655321"`
			`assert page.imdb_user_name == "AlexUltra"`
			`assert page.next_page_url is not None`
			`assert page.next_page_url.startswith("/user/ur655321/ratings?")`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00

			`def _mock_response(content: bytes):`
			`class MockResponse:`
			`def raise_for_status(self):`
			`pass`

			`def json(self):`
			`return json.loads(content)`

			`return MockResponse()`


			`@pytest.mark.asyncio`
			`async def test_load_ratings_page_20240510(monkeypatch):`
			`with bz2.open(fixturesdir / "ratings-ur655321-20240510.html.bz2", "rb") as f:`
			`html = f.read()`
			`soup = bs4.BeautifulSoup(html, "html5lib")`
			`monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))`

			`with bz2.open(fixturesdir / "ratings-ur655321-20240510.gql.json.bz2", "rb") as f:`
			`jsonstr = f.read()`
			`async with imdb.asession() as s:`
			`monkeypatch.setattr(s, "post", AsyncMock(return_value=_mock_response(jsonstr)))`
			`page = await imdb._load_ratings_page("fakeurl", "ur655321")`
			`assert len(page.ratings) == 100`
			`assert page.imdb_user_id is not None`
			`assert page.imdb_user_id == "ur655321"`
			`assert page.imdb_user_name == "AlexUltra"`
			`assert page.next_page_url is None, "not supported for new ratings page"`

			`def movie(item: dict):`
			`for rating in page.ratings:`
			`assert rating.movie`
			`if rating.movie.imdb_id == item["imdb_id"]:`
			`rating_dict = {key: getattr(rating.movie, key) for key in item.keys()}`
			`return rating_dict`
chore: upgrade to Python 3.13 & run update 2025-05-15 21:56:18 +02:00			`raise AssertionError(f"{item['imdb_id']} not found in page.ratings")`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00
			`a_movie = {`
			`"title": "Kung Fu Panda 4",`
			`"release_year": 2024,`
			`"media_type": "Movie",`
			`"imdb_id": "tt21692408",`
			`"imdb_score": 59,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"imdb_votes": 36069,`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`"runtime": 94,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"genres": {"Action", "Adventure", "Animation"},`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`}`
			`assert a_movie == movie(a_movie)`

			`a_running_tvseries = {`
			`"title": "Palm Royale",`
			`"release_year": 2024,`
			`"media_type": "TV Series",`
			`"imdb_id": "tt8888540",`
			`"imdb_score": 64,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"imdb_votes": 6044,`
			`"genres": {"Drama"},`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`}`
			`assert a_running_tvseries == movie(a_running_tvseries)`

			`a_finished_tvseries = {`
			`"title": "Fawlty Towers",`
			`"release_year": 1975,`
			`"media_type": "TV Series",`
			`"imdb_id": "tt0072500",`
			`"imdb_score": 87,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"imdb_votes": 100261,`
			`"genres": {"Comedy"},`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`}`
			`assert a_finished_tvseries == movie(a_finished_tvseries)`

			`a_tvepisode = {`
			`"title": "Columbo / No Time to Die",`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"original_title": "Columbo / No Time to Die",`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`"release_year": 1992,`
			`"media_type": "TV Episode",`
			`"imdb_id": "tt0103987",`
			`"imdb_score": 59,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"imdb_votes": 2122,`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`"runtime": 98,`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"genres": {"Crime", "Drama", "Mystery"},`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`}`
			`assert a_tvepisode == movie(a_tvepisode)`

			`a_videogame = {`
			`"title": "Alan Wake",`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`"original_title": "Alan Wake",`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`"release_year": 2010,`
			`"media_type": "Video Game",`
			`"imdb_id": "tt0466662",`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00			`# The data from __NEXT_DATA__ is wrong, the actual values should be:`
			`# "imdb_score": 82,`
			`# "imdb_votes": 7300,`
			`# "genres": {"Action", "Adventure", "Horror"},`
			`"imdb_score": 67, # Wrong value, but correctly parsed from __NEXT_DATA__`
			`"imdb_votes": 11655, # Wrong value, but correctly parsed from __NEXT_DATA__`
			`"genres": {"Comedy", "Crime", "Drama"}, # Wrong value`
feat: add support for new ratings page Genres are no longer available for ratings, so we make them optional. Adds support for validating generics in union types. 2024-05-11 17:13:48 +02:00			`}`
			`assert a_videogame == movie(a_videogame)`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00

			`@pytest.mark.asyncio`
			`async def test_load_ratings_page_20240720(monkeypatch):`
			`with bz2.open(fixturesdir / "ratings-ur655321-20240720.html.bz2", "rb") as f:`
			`html = f.read()`
			`soup = bs4.BeautifulSoup(html, "html5lib")`
			`monkeypatch.setattr(imdb, "asoup_from_url", AsyncMock(return_value=soup))`

			`with bz2.open(fixturesdir / "ratings-ur655321-20240720.gql.json.bz2", "rb") as f:`
			`jsonstr = f.read()`
			`async with imdb.asession() as s:`
			`monkeypatch.setattr(s, "post", AsyncMock(return_value=_mock_response(jsonstr)))`
			`page = await imdb._load_ratings_page("fakeurl", "ur655321")`
			`assert len(page.ratings) == 100`
			`assert page.imdb_user_id is not None`
			`assert page.imdb_user_id == "ur655321"`
			`assert page.imdb_user_name == "AlexUltra"`
			`assert page.next_page_url is None, "not supported for new ratings page"`

			`def movie(item: dict):`
			`for rating in page.ratings:`
			`assert rating.movie`
			`if rating.movie.imdb_id == item["imdb_id"]:`
			`rating_dict = {key: getattr(rating.movie, key) for key in item.keys()}`
			`return rating_dict`
chore: upgrade to Python 3.13 & run update 2025-05-15 21:56:18 +02:00			`raise AssertionError(f"{item['imdb_id']} not found in page.ratings")`
fix: support new user ratings page markup We use __NEXT_DATA__ from the page to find the user's latest rated movies. We found that at least in one case (of a Video Game) the movie details were wrong. Normally this shouldn't be a problem though because we know all the movies already and we keep the values we already have. Otherwise the data from __NEXT_DATA__ seems more accurate and complete. 2024-07-21 14:46:45 +02:00
			`a_movie = {`
			`"title": "Kung Fu Panda 4",`
			`"release_year": 2024,`
			`"media_type": "Movie",`
			`"imdb_id": "tt21692408",`
			`"imdb_score": 59,`
			`"imdb_votes": 48018,`
			`"runtime": 94,`
			`}`
			`assert a_movie == movie(a_movie)`

			`a_running_tvseries = {`
			`"title": "Palm Royale",`
			`"release_year": 2024,`
			`"media_type": "TV Series",`
			`"imdb_id": "tt8888540",`
			`"imdb_score": 63,`
			`"imdb_votes": 9458,`
			`}`
			`assert a_running_tvseries == movie(a_running_tvseries)`

			`a_finished_tvseries = {`
			`"title": "Fawlty Towers",`
			`"release_year": 1975,`
			`"media_type": "TV Series",`
			`"imdb_id": "tt0072500",`
			`"imdb_score": 87,`
			`"imdb_votes": 100860,`
			`}`
			`assert a_finished_tvseries == movie(a_finished_tvseries)`