mirror of
https://github.com/zhenxun-org/zhenxun_bot.git
synced 2025-12-15 14:22:55 +08:00
53 lines
1.8 KiB
Python
Executable File
53 lines
1.8 KiB
Python
Executable File
from lxml import etree
|
||
import feedparser
|
||
from urllib import parse
|
||
from services.log import logger
|
||
from utils.http_utils import AsyncHttpx
|
||
from typing import List, Union
|
||
import time
|
||
|
||
|
||
async def from_anime_get_info(key_word: str, max_: int) -> Union[str, List[str]]:
    """Search the dmhy.org RSS feed for ``key_word`` and return the results.

    Args:
        key_word: Search phrase; it is URL-quoted before being appended to
            the RSS query string.
        max_: Result limit, forwarded unchanged to ``get_repass``.

    Returns:
        On success, the list produced by ``get_repass`` with a header line
        (keyword and elapsed whole seconds) inserted at index 0. If
        ``get_repass`` raises, the error is logged and a fixed error-message
        string is returned instead.
    """
    started_at = time.time()
    search_url = (
        "https://share.dmhy.org/topics/rss/rss.xml?keyword="
        + parse.quote(key_word)
    )

    try:
        results = await get_repass(search_url, max_)
    except Exception as e:
        # Top-level boundary: report the failure to the user rather than crash.
        logger.error(f"发生了一些错误 {type(e)}:{e}")
        return "发生了一些错误!"

    elapsed_seconds = int(time.time() - started_at)
    header = f"搜索 {key_word} 结果(耗时 {elapsed_seconds} 秒):\n"
    results.insert(0, header)
    return results
|
||
|
||
|
||
async def get_repass(url: str, max_: int) -> List[str]:
    """Fetch an RSS feed and build one formatted line per linked detail page.

    The feed at ``url`` is downloaded and parsed; each selected entry's link
    is then fetched and scraped for its category, title, size and magnet text.

    Args:
        url: RSS feed URL to download.
        max_: Upper bound on the number of feed entries to follow. Values
            larger than the number of entries are clamped by the slice.

    Returns:
        A list of strings of the form
        ``"【<category>】| <title>\\n【<size>】| <magnet>"``, one per detail page
        that was scraped successfully. Pages that fail to download or parse
        are logged and skipped, so the list may be shorter than ``max_``.
    """
    put_line = []
    feed_text = (await AsyncHttpx.get(url)).text
    feed = feedparser.parse(feed_text)

    # Build the link list once; slicing already clamps to the list length,
    # so no explicit min(max_, len(...)) computation is needed.
    links = [entry.link for entry in feed.entries]

    for link in links[:max_]:
        try:
            page_text = (await AsyncHttpx.get(link)).text
            html = etree.HTML(page_text)
            magnet = html.xpath('.//a[@id="a_magnet"]/text()')[0]
            title = html.xpath(".//h3/text()")[0]
            item = html.xpath(
                '//div[@class="info resource-info right"]/ul/li'
            )
            # [5:] drops the first five characters of the <li> text —
            # presumably a fixed label prefix; verify against the live page.
            class_a = (
                item[0]
                .xpath("string(.)")[5:]
                .strip()
                .replace("\xa0", "")
                .replace("\t", "")
            )
            size = item[3].xpath("string(.)")[5:].strip()
            put_line.append(
                "【{}】| {}\n【{}】| {}".format(class_a, title, size, magnet)
            )
        except Exception as e:
            # Best-effort scraping: one bad page must not abort the others.
            logger.error(f"搜番发生错误 {type(e)}:{e}")
    return put_line
|
||
|
||
|