mirror of
https://github.com/PaiGramTeam/PaiGram.git
synced 2025-01-19 09:45:04 +00:00
178 lines
5.5 KiB
Python
178 lines
5.5 KiB
Python
|
import re
|
||
|
from typing import List, Optional
|
||
|
|
||
|
from bs4 import BeautifulSoup
|
||
|
from httpx import URL
|
||
|
|
||
|
from models.wiki.base import Model, SCRAPE_HOST
|
||
|
from models.wiki.base import WikiModel
|
||
|
from models.wiki.other import Association, Element, WeaponType
|
||
|
|
||
|
|
||
|
class Birth(Model):
    """Birthday of a character.

    Attributes:
        day: Day part of the birthday.
        month: Month part of the birthday.
    """

    day: int
    month: int
|
||
|
|
||
|
|
||
|
class CharacterAscension(Model):
    """Upgrade materials of a character.

    Attributes:
        level: Materials used for level ascension.
        skill: Materials used for skill/talent training.
    """

    # NOTE(review): the shared ``[]`` defaults rely on ``Model`` copying field
    # defaults per instance (as pydantic models do) -- confirm against the base.
    level: List[str] = []
    skill: List[str] = []
|
||
|
|
||
|
|
||
|
class CharacterState(Model):
    """Attribute values of a character.

    Attributes:
        level: Level.
        HP: Health points.
        ATK: Attack.
        DEF: Defense.
        CR: Critical rate.
        CD: Critical damage.
        bonus: Ascension attribute.
    """

    level: str
    HP: int
    ATK: float
    DEF: float
    CR: str
    CD: str
    bonus: str
|
||
|
|
||
|
|
||
|
class CharacterIcon(Model):
    """String fields describing the images of a character.

    Attributes:
        icon: The ``*_icon.png`` image.
        side: The ``*_side_icon.png`` image.
        gacha: The ``*_gacha_card.png`` image.
        splash: The ``*_gacha_splash.png`` image, if any.
    """

    icon: str
    side: str
    gacha: str
    splash: Optional[str]
|
||
|
|
||
|
|
||
|
class Character(WikiModel):
    """Character.

    Attributes:
        id: Identifier extracted from the image file name on the character
            page (e.g. ``playerboy_005``).
        title: Title.
        occupation: Affiliation.
        association: Region.
        weapon_type: Weapon type.
        element: Element.
        birth: Birthday; ``None`` for the Traveler.
        constellation: Constellation.
        cn_cv: Chinese voice actor.
        jp_cv: Japanese voice actor.
        en_cv: English voice actor.
        kr_cv: Korean voice actor.
        description: Description.
        ascension: Level and skill upgrade materials.
        stats: Attribute values, one entry per data row of the stats table.
    """

    # NOTE(review): ``name`` and ``rarity`` are passed to the constructor in
    # ``_parse_soup`` but are not declared here; presumably they are declared
    # on ``WikiModel`` -- confirm against the base class.
    id: str
    title: str
    occupation: str
    association: Association
    weapon_type: WeaponType
    element: Element
    birth: Optional[Birth]
    constellation: str
    cn_cv: str
    jp_cv: str
    en_cv: str
    kr_cv: str
    description: str
    ascension: CharacterAscension

    stats: List[CharacterState]

    @classmethod
    def scrape_urls(cls) -> List[URL]:
        """Return a one-element list: ``fam_chars/?lang=CHS`` joined onto ``SCRAPE_HOST``."""
        return [SCRAPE_HOST.join("fam_chars/?lang=CHS")]

    @classmethod
    async def _parse_soup(cls, soup: BeautifulSoup) -> 'Character':
        """Parse a character page.

        Args:
            soup: Parsed HTML of a character page. It must contain an element
                with class ``wp-block-post-content`` holding at least three
                tables: the first one carries the basic information, the
                third one the per-level stats.

        Returns:
            The ``Character`` built from the page.

        Raises:
            IndexError: If the expected container, tables, rows or cells are
                missing from the page.
            KeyError: If a weapon type or element text is not a member of the
                corresponding enum, or an expected tag attribute is absent.
        """
        soup = soup.select('.wp-block-post-content')[0]
        tables = soup.find_all('table')
        table_rows = tables[0].find_all('tr')

        def get_table_text(row_num: int) -> str:
            """Shortcut returning the text of the last cell of the given row."""
            return table_rows[row_num].find_all('td')[-1].text.replace('\xa0', '')

        def get_material_ids(row) -> List[str]:
            """Collect the material identifiers linked from a table row.

            Links whose ``href`` does not match are skipped: the source page
            is known to contain broken material links, and indexing the empty
            match list would otherwise raise ``IndexError``.
            """
            return [
                target[0] for link in row.find_all('a')
                if (target := re.findall(r'/(.*)/', link.attrs['href']))
            ]

        id_ = re.findall(r'img/(.*?_\d+)_.*', table_rows[0].find('img').attrs['src'])[0]
        name = get_table_text(0)
        if name != '旅行者':  # the character is not the Traveler
            title = get_table_text(1)
            occupation = get_table_text(2)
            association = Association.convert(get_table_text(3).lower().title())
            # Rarity is the number of images in the row.
            rarity = len(table_rows[4].find_all('img'))
            weapon_type = WeaponType[get_table_text(5)]
            element = Element[get_table_text(6)]
            birth = Birth(day=int(get_table_text(7)), month=int(get_table_text(8)))
            # Row 9 is not used.
            constellation = get_table_text(10)
            cn_cv = get_table_text(11)
            jp_cv = get_table_text(12)
            en_cv = get_table_text(13)
            kr_cv = get_table_text(14)
        else:
            # The Traveler page has a different row layout and no birthday;
            # the concrete name is derived from the image identifier.
            name = '空' if id_.endswith('5') else '荧'
            title = get_table_text(0)
            occupation = get_table_text(1)
            association = Association.convert(get_table_text(2).lower().title())
            rarity = len(table_rows[3].find_all('img'))
            weapon_type = WeaponType[get_table_text(4)]
            element = Element[get_table_text(5)]
            birth = None
            # Row 6 is not used.
            constellation = get_table_text(7)
            cn_cv = get_table_text(8)
            jp_cv = get_table_text(9)
            en_cv = get_table_text(10)
            kr_cv = get_table_text(11)
        # The last three rows hold the description, the level materials and
        # the skill materials, in that order.
        description = get_table_text(-3)
        ascension = CharacterAscension(
            level=get_material_ids(table_rows[-2]),
            skill=get_material_ids(table_rows[-1]),
        )
        stats = []
        for row in tables[2].find_all('tr')[1:]:  # skip the first (header) row
            cells = row.find_all('td')
            # Cell texts are passed as-is; conversion to the declared field
            # types is presumably done by ``Model`` validation.
            stats.append(
                CharacterState(
                    level=cells[0].text, HP=cells[1].text, ATK=cells[2].text, DEF=cells[3].text,
                    CR=cells[4].text, CD=cells[5].text, bonus=cells[6].text
                )
            )
        return Character(
            id=id_, name=name, title=title, occupation=occupation, association=association, weapon_type=weapon_type,
            element=element, birth=birth, constellation=constellation, cn_cv=cn_cv, jp_cv=jp_cv, rarity=rarity,
            en_cv=en_cv, kr_cv=kr_cv, description=description, ascension=ascension, stats=stats
        )

    @classmethod
    async def get_url_by_name(cls, name: str) -> Optional[URL]:
        """Return the page URL for the character called ``name``.

        This override exists to map the two protagonist names to their fixed
        IDs; every other name is delegated to the parent implementation.
        """
        _map = {'荧': "playergirl_007", '空': "playerboy_005"}
        if (id_ := _map.get(name)) is not None:
            return await cls.get_url_by_id(id_)
        return await super().get_url_by_name(name)

    @property
    def icon(self) -> CharacterIcon:
        """Image URLs of this character, built from ``SCRAPE_HOST`` and ``self.id``."""
        return CharacterIcon(
            icon=str(SCRAPE_HOST.join(f'/img/{self.id}_icon.png')),
            side=str(SCRAPE_HOST.join(f'/img/{self.id}_side_icon.png')),
            gacha=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_card.png')),
            splash=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_splash.png'))
        )
|