archived-MoviePilot/tests/test_rust_accel.py

import pytest

from app.core.context import TorrentInfo
from app.modules.filter import FilterModule
from app.modules.indexer.spider import SiteSpider
from app.schemas.types import MediaType
from app.utils import rust_accel


pytestmark = pytest.mark.skipif(
    not rust_accel.is_available(),
    reason="moviepilot_rust 扩展未安装",
)


def test_rust_metainfo_fast_path_extracts_emby_override():
    """
    Rust 内嵌媒体标签识别应保持 Emby tmdbid 标签优先级。
    """
    title, metainfo = rust_accel.find_metainfo("Movie {[tmdbid=111;type=movies]} [tmdbid=222]")

    assert title == "Movie"
    assert metainfo["tmdbid"] == "222"
    assert metainfo["type"] == MediaType.MOVIE


def test_rust_video_title_fast_path_extracts_common_resource_fields():
    """
    Rust 影视标题预解析应能提取常见资源字段。
    """
    result = rust_accel.parse_video_title(
        "The 355 2022 BluRay 1080p DTS-HD MA5.1 X265.10bit 60FPS"
    )

    assert result["year"] == "2022"
    assert result["resource_pix"] == "1080p"
    assert result["resource_type"] == "BluRay"
    assert result["video_encode"] == "x265 10bit"
    assert result["video_bit"] == "10bit"
    assert result["fps"] == 60


def test_rust_filter_fast_path_matches_priority_semantics():
    """
    Rust 批量过滤应保持优先级和布尔表达式语义。
    """
    module = FilterModule()
    module.rule_set = {
        "HDR": {"include": "HDR"},
        "DV": {"include": "DOVI"},
        "BLU": {"include": "BluRay"},
    }
    torrents = [
        TorrentInfo(title="Movie HDR WEB-DL", description=""),
        TorrentInfo(title="Movie DOVI", description=""),
        TorrentInfo(title="Movie HDR BluRay", description=""),
    ]

    result = module._FilterModule__filter_torrents_by_rust(  # noqa: SLF001
        groups=[type("RuleGroup", (), {"rule_string": "HDR & !BLU > DV"})()],
        torrent_list=torrents,
        mediainfo=None,
    )

    assert result == torrents[:2]
    assert result[0].pri_order == 100
    assert result[1].pri_order == 99


def test_rust_indexer_search_url_keeps_existing_query_and_category():
    """
    Rust URL 生成应保留路径原有查询参数并应用分类参数。
    """
    spider = SiteSpider(
        indexer={
            "id": "ttg",
            "name": "TTG",
            "domain": "https://totheglory.im/",
            "search": {
                "paths": [{"path": "browse.php?c=M"}],
                "params": {"search_field": "{keyword}", "c": "M"},
                "imdbid_format": "imdb{imdbid_num}",
            },
            "category": {
                "field": "search_field",
                "delimiter": " 分类:",
                "movie": [{"id": "电影DVDRip", "cat": "Movies/SD"}],
            },
            "torrents": {"list": {}, "fields": {}},
        },
        keyword="tt0049406",
        mtype=MediaType.MOVIE,
    )

    search_url = spider._SiteSpider__get_search_url()  # noqa: SLF001

    assert search_url.count("?") == 1
    assert "c=M" in search_url
    assert "search_field=imdb0049406" in search_url


def test_rust_rss_parser_extracts_common_rss_and_atom_fields():
    """
    Rust RSS 解析应同时覆盖 RSS item 和 Atom entry 的核心字段。
    """
    xml_text = """
    <rss><channel>
      <item>
        <title>Example Torrent</title>
        <description><![CDATA[Desc]]></description>
        <link>https://example.org/details/1</link>
        <enclosure url="https://example.org/download/1.torrent" length="1024" />
        <pubDate>Tue, 19 May 2026 08:30:00 GMT</pubDate>
        <dc:creator>豆瓣用户</dc:creator>
      </item>
      <entry>
        <title>Atom Torrent</title>
        <summary>Atom Desc</summary>
        <link href="https://example.org/atom/2" />
        <updated>2026-05-19T09:30:00Z</updated>
      </entry>
    </channel></rss>
    """

    items = rust_accel.parse_rss_items(xml_text, 100)

    assert items[0]["title"] == "Example Torrent"
    assert items[0]["enclosure"] == "https://example.org/download/1.torrent"
    assert items[0]["size"] == 1024
    assert items[0]["nickname"] == "豆瓣用户"
    assert items[1]["title"] == "Atom Torrent"
    assert items[1]["enclosure"] == "https://example.org/atom/2"


def test_rust_indexer_page_parser_handles_common_fields():
    """
    Rust 普通 indexer 页面解析应批量提取列表行核心字段。
    """
    spider = SiteSpider(
        indexer={
            "id": "demo",
            "name": "Demo",
            "domain": "https://example.org/",
            "search": {"paths": [{"path": "torrents.php"}]},
            "category": {
                "movie": [{"id": "401"}],
                "tv": [{"id": "402"}],
            },
            "torrents": {
                "list": {"selector": "tr.torrent"},
                "fields": {
                    "title": {"selector": "a.title"},
                    "description": {"selector": ".desc"},
                    "details": {"selector": "a.title", "attribute": "href"},
                    "download": {"selector": "a.dl", "attribute": "href"},
                    "size": {"selector": ".size"},
                    "seeders": {"selector": ".seeders"},
                    "leechers": {"selector": ".leechers"},
                    "grabs": {"selector": ".grabs"},
                    "downloadvolumefactor": {"case": {".free": 0}},
                    "uploadvolumefactor": {"selector": ".up"},
                    "labels": {"selector": ".label"},
                    "hr": {"selector": ".hr"},
                    "category": {"selector": ".cat"},
                },
            },
        },
    )
    html = """
    <table>
      <tr class="torrent">
        <td><a class="title" href="/details/1">Movie 2024 1080p</a><span class="desc">BluRay</span></td>
        <td><a class="dl" href="/download/1">DL</a></td>
        <td class="size">1.5 GB</td><td class="seeders">1,234</td><td class="leechers">5/10</td>
        <td class="grabs">42</td><td class="free">Free</td><td class="up">2x</td>
        <td><span class="label">DIY</span><span class="label">HDR</span></td>
        <td class="hr">H&R</td><td class="cat">401</td>
      </tr>
    </table>
    """

    torrents = spider.parse(html)

    assert torrents == [{
        "title": "Movie 2024 1080p",
        "description": "BluRay",
        "page_url": "https://example.org/details/1",
        "enclosure": "https://example.org/download/1",
        "size": 1610612736,
        "seeders": 1234,
        "peers": 5,
        "grabs": 42,
        "downloadvolumefactor": 0,
        "uploadvolumefactor": 2,
        "labels": ["DIY", "HDR"],
        "hit_and_run": True,
        "category": MediaType.MOVIE.value,
    }]


def test_rust_indexer_page_parser_renders_common_title_template():
    """
    Rust 普通 indexer 页面解析应兼容站点构建项目里的 title_optional 模板。
    """
    spider = SiteSpider(
        indexer={
            "id": "demo",
            "name": "Demo",
            "domain": "https://example.org/",
            "search": {"paths": [{"path": "torrents.php"}]},
            "torrents": {
                "list": {"selector": "tr.torrent"},
                "fields": {
                    "title_default": {"selector": "a.title"},
                    "title_optional": {
                        "selector": "a.title",
                        "attribute": "title",
                        "optional": True,
                    },
                    "title": {
                        "text": (
                            "{% if fields['title_optional'] %}"
                            "{{ fields['title_optional'] }}"
                            "{% else %}"
                            "{{ fields['title_default'] }}"
                            "{% endif %}"
                        )
                    },
                    "download": {"selector": "a.dl", "attribute": "href"},
                },
            },
        },
    )
    html = """
    <table>
      <tr class="torrent">
        <td><a class="title" title="Optional Name" href="/details/1">Default Name</a></td>
        <td><a class="dl" href="/download/1">DL</a></td>
      </tr>
      <tr class="torrent">
        <td><a class="title" title="" href="/details/2">Default Fallback</a></td>
        <td><a class="dl" href="/download/2">DL</a></td>
      </tr>
    </table>
    """

    torrents = spider.parse(html)

    assert [item["title"] for item in torrents] == ["Optional Name", "Default Fallback"]


def test_rust_indexer_page_parser_renders_common_description_templates():
    """
    Rust 普通 indexer 页面解析应兼容站点构建项目里的 description 字段模板。
    """
    spider = SiteSpider(
        indexer={
            "id": "demo",
            "name": "Demo",
            "domain": "https://example.org/",
            "search": {"paths": [{"path": "torrents.php"}]},
            "torrents": {
                "list": {"selector": "tr.torrent"},
                "fields": {
                    "title": {"selector": "a.title"},
                    "subject": {"selector": ".subject"},
                    "tags": {"selector": ".tags"},
                    "description": {
                        "text": (
                            "{% if fields['tags']%}"
                            "{{ fields['subject']+' '+fields['tags'] }}"
                            "{% else %}"
                            "{{ fields['subject'] }}"
                            "{% endif %}"
                        )
                    },
                    "download": {"selector": "a.dl", "attribute": "href"},
                },
            },
        },
    )
    html = """
    <table>
      <tr class="torrent">
        <td><a class="title">Movie 2024</a><span class="subject">BluRay</span><span class="tags">HDR</span></td>
        <td><a class="dl" href="/download/1">DL</a></td>
      </tr>
      <tr class="torrent">
        <td><a class="title">Show 2025</a><span class="subject">WEB-DL</span><span class="tags"></span></td>
        <td><a class="dl" href="/download/2">DL</a></td>
      </tr>
    </table>
    """

    torrents = spider.parse(html)

    assert [item["description"] for item in torrents] == ["BluRay HDR", "WEB-DL"]


def test_rust_indexer_page_parser_supports_remove_and_negative_index():
    """
    Rust 普通 indexer 页面解析应兼容站点配置常用的 remove 和负索引。
    """
    spider = SiteSpider(
        indexer={
            "id": "demo",
            "name": "Demo",
            "domain": "https://example.org/",
            "search": {"paths": [{"path": "torrents.php"}]},
            "torrents": {
                "list": {"selector": "tr.torrent"},
                "fields": {
                    "title": {"selector": ".name", "remove": "a,b"},
                    "description": {
                        "selector": ".desc",
                        "remove": "span,a,img,font,b",
                        "contents": -1,
                    },
                    "labels": {
                        "selector": ".labels > span",
                        "remove": "span,a,img,font,b",
                        "contents": -1,
                    },
                    "download": {"selector": "a.dl", "attribute": "href"},
                },
            },
        },
    )
    html = """
    <table>
      <tr class="torrent">
        <td class="name">Movie<a>删掉</a><b>也删</b>2024</td>
        <td class="desc">第一行
          <span>标签</span><a>链接</a>
          第二行
        </td>
        <td class="labels"><span><i>DIY</i></span><span><i>HDR</i></span></td>
        <td><a class="dl" href="/download/1">DL</a></td>
      </tr>
    </table>
    """

    torrents = spider.parse(html)

    assert torrents[0]["title"] == "Movie2024"
    assert torrents[0]["description"] == "第一行 第二行"
    assert torrents[0]["labels"] == ["DIY", "HDR"]