zhenxun_bot/zhenxun/plugins/search_anime/data_source.py

import time
from urllib import parse

import feedparser
from lxml import etree

from zhenxun.services.log import logger
from zhenxun.utils.http_utils import AsyncHttpx


async def from_anime_get_info(key_word: str, max_: int) -> str | list[str]:
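    """Search share.dmhy.org's RSS feed for ``key_word``.

    Returns up to ``max_`` formatted result lines prefixed with a header
    line, or an error message string if the search fails.
    """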
    s_time = time.time()
    url = "https://share.dmhy.org/topics/rss/rss.xml?keyword=" + parse.quote(key_word)
    try:
        repass = await get_repass(url, max_)
    except Exception as e:
        # On any failure, log it and return a generic "something went wrong" message.
        logger.error(f"发生了一些错误 {type(e)}", e=e)
        return "发生了一些错误!"
    # Prepend a header: "search results for <key_word> (took N seconds)".
    repass.insert(0, f"搜索 {key_word} 结果(耗时 {int(time.time() - s_time)} 秒):\n")
    return repass


async def get_repass(url: str, max_: int) -> list[str]:
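    """Parse the RSS feed at ``url`` and scrape each linked topic page for
    its category, title, file size and magnet link.
    """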
    put_line = []
    text = (await AsyncHttpx.get(url)).text
    d = feedparser.parse(text)
    # Never return more results than the feed actually contains.
    max_ = min(max_, len(d.entries))
    url_list = [e.link for e in d.entries][:max_]
    for u in url_list:
        try:
            text = (await AsyncHttpx.get(u)).text
            html = etree.HTML(text)  # type: ignore
            # Magnet link and title are read straight from the topic page.
            magnet = html.xpath('.//a[@id="a_magnet"]/text()')[0]
            title = html.xpath(".//h3/text()")[0]
            item = html.xpath('//div[@class="info resource-info right"]/ul/li')
            # The first <li> carries the category; drop its 5-character label
            # prefix and stray whitespace characters.
            class_a = (
                item[0]
                .xpath("string(.)")[5:]
                .strip()
                .replace("\xa0", "")
                .replace("\t", "")
            )
            # The fourth <li> carries the file size, with the same label prefix.
            size = item[3].xpath("string(.)")[5:].strip()
            put_line.append(
                "【{}】| {}\n【{}】| {}".format(class_a, title, size, magnet)
            )
        except Exception as e:
            logger.error("搜番发生错误", e=e)
    return put_line
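
# Minimal usage sketch (assumes the zhenxun package is importable; inside the
# bot these coroutines are awaited from a command handler). The keyword "fate"
# and the limit of 3 results are arbitrary example values.
if __name__ == "__main__":
    import asyncio

    async def _demo() -> None:
        result = await from_anime_get_info("fate", 3)
        if isinstance(result, str):
            print(result)  # the error-message path
        else:
            print("\n".join(result))

    asyncio.run(_demo())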