zhenxun_bot/plugins/send_setu/data_source.py

256 lines
11 KiB
Python
Raw Normal View History

2021-05-20 19:23:32 +08:00
from configs.path_config import IMAGE_PATH, TXT_PATH
import os
import random
2021-06-30 19:50:55 +08:00
from utils.init_result import image
2021-05-20 19:23:32 +08:00
from configs.config import LOLICON_KEY
import aiohttp
import aiofiles
from services.log import logger
2021-06-30 19:50:55 +08:00
from utils.img_utils import get_img_hash
from utils.utils import get_local_proxy, is_number
2021-05-20 19:23:32 +08:00
from asyncio.exceptions import TimeoutError
from models.count_user import UserCount
from configs.config import DOWNLOAD_SETU
try:
import ujson as json
except ModuleNotFoundError:
import json
url = "https://api.lolicon.app/setu/"
2021-06-15 11:01:30 +08:00
path = '_setu/'
2021-05-20 19:23:32 +08:00
async def get_setu_urls(keyword: str, num: int = 1, r18: int = 0):
# print(keyword)
if r18 == 1:
2021-06-15 10:57:08 +08:00
file_name = 'setu_r18_url.json'
2021-05-20 19:23:32 +08:00
else:
2021-06-15 10:57:08 +08:00
file_name = 'setu_url.json'
2021-05-20 19:23:32 +08:00
try:
2021-06-15 10:57:08 +08:00
with open(TXT_PATH + file_name, 'r', encoding='utf8') as f:
txt_data = json.load(f)
except (FileNotFoundError, ValueError):
txt_data = {}
txt_urls = [txt_data[x]['img_url'] for x in txt_data.keys()]
2021-05-20 19:23:32 +08:00
params = {
"apikey": LOLICON_KEY, # 添加apikey
'r18': r18, # 添加r18参数 0为否1为是2为混合
'keyword': keyword, # 若指定关键字,将会返回从插画标题、作者、标签中模糊搜索的结果
2021-06-15 10:57:08 +08:00
'num': 100, # 一次返回的结果数量范围为1到10不提供 APIKEY 时固定为1
2021-05-20 19:23:32 +08:00
'size1200': 1, # 是否使用 master_1200 缩略图,以节省流量或提升加载速度
2021-05-26 20:08:13 +08:00
}
2021-05-20 19:23:32 +08:00
urls = []
text_list = []
for count in range(3):
print(f'get_setu_url: count --> {count}')
async with aiohttp.ClientSession() as session:
try:
2021-06-24 15:32:06 +08:00
async with session.get(url, proxy=get_local_proxy(), timeout=2, params=params) as response:
2021-05-20 19:23:32 +08:00
if response.status == 429:
return '调用达到上限,明日赶早呀~', '', 429
if response.status == 404:
return "网站裂开了...", '', 998
if response.status == 200:
data = await response.json()
if data['code'] == 0:
2021-06-30 19:50:55 +08:00
lens = len(data['data'])
for i in range(lens):
2021-05-20 19:23:32 +08:00
img_url = data['data'][i]['url']
title = data['data'][i]['title']
author = data['data'][i]['author']
pid = data['data'][i]['pid']
urls.append(img_url)
text_list.append(f'title{title}\nauthor{author}\nPID{pid}')
2021-06-15 10:57:08 +08:00
tags = []
for j in range(len(data['data'][i]['tags'])):
tags.append(data['data'][i]['tags'][j])
if img_url not in txt_urls:
save_setu_dict = {
'title': title,
'author': author,
'pid': pid,
'img_url': img_url,
'tags': tags
}
if str(pid) not in txt_data.keys():
txt_data[pid] = save_setu_dict
2021-05-20 21:09:21 +08:00
if DOWNLOAD_SETU:
2021-06-15 10:57:08 +08:00
with open(TXT_PATH + file_name, 'w', encoding='utf8') as f:
json.dump(txt_data, f, ensure_ascii=False, indent=4)
2021-06-30 19:50:55 +08:00
num = lens if num > lens else num
2021-06-15 10:57:08 +08:00
random_idx = random.sample(range(len(data['data'])), num)
x_urls = []
x_text_lst = []
for x in random_idx:
x_urls.append(urls[x])
x_text_lst.append(text_list[x])
return x_urls, x_text_lst, 200
2021-05-20 19:23:32 +08:00
else:
return "没找到符合条件的色图...", '', 401
except TimeoutError:
pass
return '我网线被人拔了..QAQ', '', 999
async def search_online_setu(url: str):
async with aiohttp.ClientSession() as session:
for i in range(3):
print(f'search_online_setu --> {i}')
try:
2021-06-24 15:32:06 +08:00
async with session.get(url, proxy=get_local_proxy(), timeout=2) as res:
2021-05-20 19:23:32 +08:00
if res.status == 200:
index = str(random.randint(1, 100000))
async with aiofiles.open(IMAGE_PATH + 'temp/' + index + "_temp_setu.jpg", 'wb') as f:
try:
await f.write(await res.read())
except TimeoutError:
# return '\n这图没下载过来~(网太差?)', -1, False
continue
logger.info(f"下载 lolicon图片 {url} 成功, id{index}")
return image(f'{index}_temp_setu.jpg', 'temp'), index
else:
logger.warning(f"访问 lolicon图片 {url} 失败 status{res.status}")
# return '\n这图好难下载啊QAQ', -1, False
except TimeoutError:
pass
return '\n图片被小怪兽恰掉啦..!QAQ', -1
2021-06-24 15:32:06 +08:00
def get_setu(index: str, setu_data: dict, tag: str = None):
2021-07-01 10:32:46 +08:00
if not os.path.exists(IMAGE_PATH + path):
os.mkdir(IMAGE_PATH + path)
2021-05-20 19:23:32 +08:00
length = len(os.listdir(IMAGE_PATH + path))
2021-05-20 21:04:57 +08:00
if length == 0:
return None, None
2021-05-20 19:23:32 +08:00
if not index:
index = random.randint(0, length - 1)
2021-06-24 15:32:06 +08:00
if tag:
all_tag_setu = [x for x in setu_data.keys() if tag in setu_data[x]['tags']]
if all_tag_setu:
index = random.choice(all_tag_setu)
2021-05-20 19:23:32 +08:00
if is_number(index):
if int(index) > length or int(index) < 0:
return f"超过当前上下限!({length - 1})", 999
else:
2021-06-17 19:22:07 +08:00
if setu_data:
index = str(index)
return f'id{index}\n' \
f'title{setu_data[index]["title"]}\n' \
f'author{setu_data[index]["author"]}\n' \
f'PID{setu_data[index]["pid"]}' + image(f'{index}.jpg', path), index
else:
return f'id{index}' + image(f'{index}.jpg', path), index
2021-05-20 19:23:32 +08:00
return None, None
def get_luoxiang(impression):
probability = impression + 70
if probability < random.randint(1, 101):
return "我为什么要给你发这个?" + image(random.choice(os.listdir(IMAGE_PATH + "luoxiang/")), 'luoxiang') + \
"\n(快向小真寻签到提升好感度吧!)"
return None
async def check_r18_and_keyword(msg: str, user_id) -> 'str, int, int':
msg_list = msg.split(' ')
num = 1
r18 = 0
keyword = ''
if len(msg_list) == 1:
if msg_list[0].strip().lower() in ['r', 'r18']:
r18 = 1
num = 10
else:
keyword = msg_list[0]
elif len(msg_list) == 2:
keyword = msg_list[1].strip()
if msg_list[0].strip().lower() in ['r', 'r18']:
r18 = 1
num = 10
else:
keyword = msg[0]
if r18 == 1:
await UserCount.add_user(user_id)
return keyword, r18, num
async def find_img_index(img_url, user_id):
try:
2021-06-15 10:57:08 +08:00
setu_data = json.load(open(TXT_PATH + 'setu_data.json', encoding='utf8'))
2021-05-20 19:23:32 +08:00
except (FileNotFoundError, ValueError):
2021-06-15 10:57:08 +08:00
setu_data = {}
2021-05-20 19:23:32 +08:00
async with aiohttp.ClientSession() as session:
async with session.get(img_url, proxy=get_local_proxy(), timeout=5) as res:
async with aiofiles.open(IMAGE_PATH + f"temp/{user_id}_find_setu_index.jpg", 'wb') as f:
await f.write(await res.read())
img_hash = str(get_img_hash(IMAGE_PATH + f"temp/{user_id}_find_setu_index.jpg"))
try:
2021-06-15 10:57:08 +08:00
index = str([setu_data[x]['img_hash'] for x in setu_data.keys()].index(img_hash))
return f"id{index}\n" \
f"title{setu_data[index]['title']}\n" \
f"author{setu_data[index]['author']}\n" \
f"PID{setu_data[index]['pid']}"
2021-05-20 19:23:32 +08:00
except ValueError:
return "该图不在色图库中!"
2021-06-04 18:01:33 +08:00
def delete_img(_id: int):
lens = len(os.listdir(IMAGE_PATH + path)) - 1
if _id < 0 or _id > lens:
return False, f'超过上下限限制,上限:{lens}'
try:
os.remove(IMAGE_PATH + path + f'{_id}.jpg')
if _id != lens:
2021-06-15 10:57:08 +08:00
setu_hash_dict = json.load(open(TXT_PATH + 'setu_data.json', encoding='utf8'))
2021-06-04 18:01:33 +08:00
setu_hash_dict[str(_id)] = setu_hash_dict[str(lens)]
os.rename(IMAGE_PATH + path + f'{lens}.jpg', IMAGE_PATH + path + f'{_id}.jpg')
2021-06-15 10:57:08 +08:00
with open(TXT_PATH + 'setu_data.json', 'w', encoding='utf8') as f:
2021-06-04 18:01:33 +08:00
json.dump(setu_hash_dict, f, ensure_ascii=False, indent=4)
return True, ''
except Exception as e:
logger.error(f'删除色图错误 e{e}')
return False, str(type(e))
# 添加涩图
async def add_img(imgs: list):
index = 0
lens = len(os.listdir(IMAGE_PATH + path))
add_count = 0
2021-06-15 10:57:08 +08:00
setu_data_dict = json.load(open(TXT_PATH + 'setu_data.json', encoding='utf8'))
2021-06-04 18:01:33 +08:00
async with aiohttp.ClientSession() as session:
for img in imgs:
async with session.get(img, proxy=get_local_proxy(), timeout=5) as res:
async with aiofiles.open(IMAGE_PATH + f"temp/add_setu_check_{index}.jpg", 'wb') as f:
await f.write(await res.read())
index += 1
index -= 1
for i in range(index, -1, -1):
img_hash = str(get_img_hash(IMAGE_PATH + f"temp/add_setu_check_{index}.jpg"))
2021-06-15 10:57:08 +08:00
if img_hash not in [setu_data_dict[x]['img_hash'] for x in setu_data_dict.keys()]:
2021-06-04 18:01:33 +08:00
os.rename(IMAGE_PATH + f"temp/add_setu_check_{index}.jpg", IMAGE_PATH + path + f'/{lens}.jpg')
2021-06-15 10:57:08 +08:00
setu_data_dict[lens] = {
'title': 'not title',
'author': 'not author',
'pid': 'not pid',
'img_hash': img_hash,
'img_url': 'not url',
}
2021-06-04 18:01:33 +08:00
lens += 1
add_count += 1
if add_count:
2021-06-15 10:57:08 +08:00
with open(TXT_PATH + 'setu_data.json', 'w', encoding='utf8') as f:
json.dump(setu_data_dict, f, ensure_ascii=False, indent=4)
2021-06-04 18:01:33 +08:00
return lens, add_count