# MibooGram/modules/wiki/character.py

import re
from typing import List, Optional

from bs4 import BeautifulSoup
from httpx import URL

from modules.wiki.base import Model, SCRAPE_HOST
from modules.wiki.base import WikiModel
from modules.wiki.other import Association, Element, WeaponType


class Birth(Model):
    """Birthday.

    Attributes:
        day: day
        month: month
    """
    day: int
    month: int


class CharacterAscension(Model):
    """Materials a character needs for ascension.

    Attributes:
        level: materials for level ascension
        skill: materials for skill/talent upgrades
    """
    level: List[str] = []
    skill: List[str] = []


class CharacterState(Model):
    """Attribute values of a character.

    Attributes:
        level: level
        HP: health points
        ATK: attack
        DEF: defense
        CR: critical rate
        CD: critical damage
        bonus: ascension bonus attribute
    """
    level: str
    HP: int
    ATK: float
    DEF: float
    CR: str
    CD: str
    bonus: str


class CharacterIcon(Model):
    """Image locations for a character.

    As filled in by ``Character.icon``, every value is a URL string built from
    ``SCRAPE_HOST`` and the character id.

    Attributes:
        icon: the ``_icon.webp`` image
        side: the ``_side_icon.webp`` image
        gacha: the ``_gacha_card.webp`` image
        splash: the ``_gacha_splash.webp`` image; declared optional
    """
    icon: str
    side: str
    gacha: str
    splash: Optional[str]


class Character(WikiModel):
    """A character scraped from the wiki.

    Attributes:
        id: identifier taken from the image file name on the character page
        title: title
        occupation: affiliation
        association: region
        weapon_type: weapon type
        element: element
        birth: birthday; ``None`` for the Traveler
        constellation: constellation
        cn_cv: Chinese voice actor
        jp_cv: Japanese voice actor
        en_cv: English voice actor
        kr_cv: Korean voice actor
        description: description
        ascension: ascension and skill/talent materials
        stats: attribute values, one entry per data row of the stats table
    """

    id: str
    title: str
    occupation: str
    association: Association
    weapon_type: WeaponType
    element: Element
    birth: Optional[Birth]
    constellation: str
    cn_cv: str
    jp_cv: str
    en_cv: str
    kr_cv: str
    description: str
    ascension: CharacterAscension

    stats: List[CharacterState]

    @classmethod
    def scrape_urls(cls) -> List[URL]:
        """Return the list page URL(s) to scrape for characters."""
        return [SCRAPE_HOST.join("fam_chars/?lang=CHS")]

    @classmethod
    async def _parse_soup(cls, soup: BeautifulSoup) -> 'Character':
        """Parse a character page into a ``Character``.

        Basic information and materials are read from the first table inside
        ``.wp-block-post-content``; the stats are read from the third table.

        Args:
            soup: parsed HTML of one character page.

        Returns:
            The ``Character`` described by the page.

        Note:
            No error handling is done here: a page that does not have the
            expected layout raises (for example ``IndexError`` when a table,
            row or cell is missing).
        """
        soup = soup.select('.wp-block-post-content')[0]
        tables = soup.find_all('table')
        table_rows = tables[0].find_all('tr')

        def get_table_text(row_num: int) -> str:
            """Return the text of the last cell of the given row of the first table."""
            return table_rows[row_num].find_all('td')[-1].text.replace('\xa0', '')

        def get_material_ids(row) -> List[str]:
            """Return the ``/.../`` part of every link href in ``row``.

            Links whose href does not contain such a part are skipped (the
            source page sometimes lists broken materials) instead of aborting
            the whole parse with an ``IndexError``.
            """
            return [
                matched[0] for link in row.find_all('a')
                if (matched := re.findall(r'/(.*)/', link.attrs['href']))
            ]

        id_ = re.findall(r'img/(.*?_\d+)_.*', table_rows[0].find('img').attrs['src'])[0]
        name = get_table_text(0)
        if name != '旅行者':  # any character other than the Traveler
            title = get_table_text(1)
            occupation = get_table_text(2)
            association = Association.convert(get_table_text(3).lower().title())
            # Rarity is the number of images in the row.
            rarity = len(table_rows[4].find_all('img'))
            weapon_type = WeaponType[get_table_text(5)]
            element = Element[get_table_text(6)]
            birth = Birth(day=int(get_table_text(7)), month=int(get_table_text(8)))
            constellation = get_table_text(10)
            cn_cv = get_table_text(11)
            jp_cv = get_table_text(12)
            en_cv = get_table_text(13)
            kr_cv = get_table_text(14)
        else:
            # Traveler: the same fields are read from different row indices and
            # there is no birthday. The name is derived from the id (compare the
            # id map in get_url_by_name).
            name = '空' if id_.endswith('5') else '荧'
            title = get_table_text(0)
            occupation = get_table_text(1)
            association = Association.convert(get_table_text(2).lower().title())
            rarity = len(table_rows[3].find_all('img'))
            weapon_type = WeaponType[get_table_text(4)]
            element = Element[get_table_text(5)]
            birth = None
            constellation = get_table_text(7)
            cn_cv = get_table_text(8)
            jp_cv = get_table_text(9)
            en_cv = get_table_text(10)
            kr_cv = get_table_text(11)
        # The last three rows are addressed from the end of the table:
        # description, level materials, skill materials.
        description = get_table_text(-3)
        ascension = CharacterAscension(
            level=get_material_ids(table_rows[-2]),
            skill=get_material_ids(table_rows[-1]),
        )
        stats = []
        # Skip the first row of the stats table (presumably the header row).
        for row in tables[2].find_all('tr')[1:]:
            cells = row.find_all('td')
            stats.append(
                CharacterState(
                    level=cells[0].text, HP=cells[1].text, ATK=cells[2].text, DEF=cells[3].text,
                    CR=cells[4].text, CD=cells[5].text, bonus=cells[6].text
                )
            )
        return Character(
            id=id_, name=name, title=title, occupation=occupation, association=association, weapon_type=weapon_type,
            element=element, birth=birth, constellation=constellation, cn_cv=cn_cv, jp_cv=jp_cv, rarity=rarity,
            en_cv=en_cv, kr_cv=kr_cv, description=description, ascension=ascension, stats=stats
        )

    @classmethod
    async def get_url_by_name(cls, name: str) -> Optional[URL]:
        """Return the page URL for the character called ``name``.

        Overridden so that the two protagonist names are resolved through
        their fixed ids; every other name is delegated to the parent class.
        """
        _map = {'荧': "playergirl_007", '空': "playerboy_005"}
        if (id_ := _map.get(name)) is not None:
            return await cls.get_url_by_id(id_)
        return await super(Character, cls).get_url_by_name(name)

    @property
    def icon(self) -> CharacterIcon:
        """Image URLs for this character, built from ``SCRAPE_HOST`` and ``self.id``."""
        return CharacterIcon(
            icon=str(SCRAPE_HOST.join(f'/img/{self.id}_icon.webp')),
            side=str(SCRAPE_HOST.join(f'/img/{self.id}_side_icon.webp')),
            gacha=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_card.webp')),
            splash=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_splash.webp'))
        )
♻️ 重写 wiki 模块和相关插件 1. 使用 `pydantic` 重写了 wiki 模块所使用的 model 2. 添加了 weapon_level.json 用于后续计算武器升级所需的经验 3. 修改了 wiki 插件，以适应新的 model 2022-08-28 14:37:31 +00:00			`import re`
			`from typing import List, Optional`

			`from bs4 import BeautifulSoup`
			`from httpx import URL`

♻ 更新V3版本 ♻️ 重构插件系统 ⚙️ 重写插件 🎨 改进代码结构 📝 完善文档 Co-authored-by: zhxy-CN <admin@owo.cab> Co-authored-by: 洛水居室 <luoshuijs@outlook.com> Co-authored-by: xtaodada <xtao@xtaolink.cn> Co-authored-by: Li Chuangbo <im@chuangbo.li> 2022-09-08 01:08:37 +00:00			`from modules.wiki.base import Model, SCRAPE_HOST`
			`from modules.wiki.base import WikiModel`
			`from modules.wiki.other import Association, Element, WeaponType`
♻️ 重写 wiki 模块和相关插件 1. 使用 `pydantic` 重写了 wiki 模块所使用的 model 2. 添加了 weapon_level.json 用于后续计算武器升级所需的经验 3. 修改了 wiki 插件，以适应新的 model 2022-08-28 14:37:31 +00:00

			`class Birth(Model):`
			`"""生日`
			`Attributes:`
			`day: 天`
			`month: 月`
			`"""`
			`day: int`
			`month: int`


			`class CharacterAscension(Model):`
			`"""角色的突破材料`

			`Attributes:`
			`level: 等级突破材料`
			`skill: 技能/天赋培养材料`
			`"""`
			`level: List[str] = []`
			`skill: List[str] = []`


			`class CharacterState(Model):`
			`"""角色属性值`

			`Attributes:`
			`level: 等级`
			`HP: 生命`
			`ATK: 攻击力`
			`DEF: 防御力`
			`CR: 暴击率`
			`CD: 暴击伤害`
			`bonus: 突破属性`
			`"""`
			`level: str`
			`HP: int`
			`ATK: float`
			`DEF: float`
			`CR: str`
			`CD: str`
			`bonus: str`


			`class CharacterIcon(Model):`
			`icon: str`
			`side: str`
			`gacha: str`
			`splash: Optional[str]`


			`class Character(WikiModel):`
			`"""角色`
			`Attributes:`
			`title: 称号`
			`occupation: 所属`
			`association: 地区`
			`weapon_type: 武器类型`
			`element: 元素`
			`birth: 生日`
			`constellation: 命之座`
			`cn_cv: 中配`
			`jp_cv: 日配`
			`en_cv: 英配`
			`kr_cv: 韩配`
			`description: 描述`
			`"""`

			`id: str`
			`title: str`
			`occupation: str`
			`association: Association`
			`weapon_type: WeaponType`
			`element: Element`
			`birth: Optional[Birth]`
			`constellation: str`
			`cn_cv: str`
			`jp_cv: str`
			`en_cv: str`
			`kr_cv: str`
			`description: str`
			`ascension: CharacterAscension`

			`stats: List[CharacterState]`

			`@classmethod`
			`def scrape_urls(cls) -> List[URL]:`
			`return [SCRAPE_HOST.join("fam_chars/?lang=CHS")]`

			`@classmethod`
			`async def _parse_soup(cls, soup: BeautifulSoup) -> 'Character':`
			`"""解析角色页"""`
			`soup = soup.select('.wp-block-post-content')[0]`
			`tables = soup.find_all('table')`
			`table_rows = tables[0].find_all('tr')`

			`def get_table_text(row_num: int) -> str:`
			`"""一个快捷函数，用于返回表格对应行的最后一个单元格中的文本"""`
			`return table_rows[row_num].find_all('td')[-1].text.replace('\xa0', '')`

			`id_ = re.findall(r'img/(.*?_\d+)_.*', table_rows[0].find('img').attrs['src'])[0]`
			`name = get_table_text(0)`
			`if name != '旅行者': # 如果角色名不是旅行者`
			`title = get_table_text(1)`
			`occupation = get_table_text(2)`
			`association = Association.convert(get_table_text(3).lower().title())`
			`rarity = len(table_rows[4].find_all('img'))`
			`weapon_type = WeaponType[get_table_text(5)]`
			`element = Element[get_table_text(6)]`
			`birth = Birth(day=int(get_table_text(7)), month=int(get_table_text(8)))`
			`constellation = get_table_text(10)`
			`cn_cv = get_table_text(11)`
			`jp_cv = get_table_text(12)`
			`en_cv = get_table_text(13)`
			`kr_cv = get_table_text(14)`
			`else:`
			`name = '空' if id_.endswith('5') else '荧'`
			`title = get_table_text(0)`
			`occupation = get_table_text(1)`
			`association = Association.convert(get_table_text(2).lower().title())`
			`rarity = len(table_rows[3].find_all('img'))`
			`weapon_type = WeaponType[get_table_text(4)]`
			`element = Element[get_table_text(5)]`
			`birth = None`
			`constellation = get_table_text(7)`
			`cn_cv = get_table_text(8)`
			`jp_cv = get_table_text(9)`
			`en_cv = get_table_text(10)`
			`kr_cv = get_table_text(11)`
			`description = get_table_text(-3)`
			`ascension = CharacterAscension(`
			`level=[`
			`target[0] for i in table_rows[-2].find_all('a')`
			`if (target := re.findall(r'/(.*)/', i.attrs['href'])) # 过滤掉错误的材料(honey网页的bug)`
			`],`
			`skill=[re.findall(r'/(.*)/', i.attrs['href'])[0] for i in table_rows[-1].find_all('a')]`
			`)`
			`stats = []`
			`for row in tables[2].find_all('tr')[1:]:`
			`cells = row.find_all('td')`
			`stats.append(`
			`CharacterState(`
			`level=cells[0].text, HP=cells[1].text, ATK=cells[2].text, DEF=cells[3].text,`
			`CR=cells[4].text, CD=cells[5].text, bonus=cells[6].text`
			`)`
			`)`
			`return Character(`
			`id=id_, name=name, title=title, occupation=occupation, association=association, weapon_type=weapon_type,`
			`element=element, birth=birth, constellation=constellation, cn_cv=cn_cv, jp_cv=jp_cv, rarity=rarity,`
			`en_cv=en_cv, kr_cv=kr_cv, description=description, ascension=ascension, stats=stats`
			`)`

			`@classmethod`
			`async def get_url_by_name(cls, name: str) -> Optional[URL]:`
			`# 重写此函数的目的是处理主角名字的 ID`
			`_map = {'荧': "playergirl_007", '空': "playerboy_005"}`
♻ 更新V3版本 ♻️ 重构插件系统 ⚙️ 重写插件 🎨 改进代码结构 📝 完善文档 Co-authored-by: zhxy-CN <admin@owo.cab> Co-authored-by: 洛水居室 <luoshuijs@outlook.com> Co-authored-by: xtaodada <xtao@xtaolink.cn> Co-authored-by: Li Chuangbo <im@chuangbo.li> 2022-09-08 01:08:37 +00:00			`if (id_ := _map.get(name)) is not None:`
♻️ 重写 wiki 模块和相关插件 1. 使用 `pydantic` 重写了 wiki 模块所使用的 model 2. 添加了 weapon_level.json 用于后续计算武器升级所需的经验 3. 修改了 wiki 插件，以适应新的 model 2022-08-28 14:37:31 +00:00			`return await cls.get_url_by_id(id_)`
			`return await super(Character, cls).get_url_by_name(name)`

			`@property`
			`def icon(self) -> CharacterIcon:`
			`return CharacterIcon(`
🐛 修复爬虫图片类型错误的问题 2022-09-01 04:20:00 +00:00			`icon=str(SCRAPE_HOST.join(f'/img/{self.id}_icon.webp')),`
			`side=str(SCRAPE_HOST.join(f'/img/{self.id}_side_icon.webp')),`
			`gacha=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_card.webp')),`
			`splash=str(SCRAPE_HOST.join(f'/img/{self.id}_gacha_splash.webp'))`
♻️ 重写 wiki 模块和相关插件 1. 使用 `pydantic` 重写了 wiki 模块所使用的 model 2. 添加了 weapon_level.json 用于后续计算武器升级所需的经验 3. 修改了 wiki 插件，以适应新的 model 2022-08-28 14:37:31 +00:00			`)`