239 lines
8.7 KiB
Python
239 lines
8.7 KiB
Python
""" PagerMaid features that uses external HTTP APIs other than Telegram. """
|
||
|
||
from googletrans import Translator, LANGUAGES
|
||
from os import remove
|
||
from urllib import request, parse
|
||
from math import ceil
|
||
from time import sleep
|
||
from threading import Thread
|
||
from bs4 import BeautifulSoup
|
||
from gtts import gTTS
|
||
from re import compile as regex_compile
|
||
from re import search, sub
|
||
from collections import deque
|
||
from pagermaid import log
|
||
from pagermaid.listener import listener, config
|
||
from pagermaid.utils import clear_emojis, attach_log, fetch_youtube_audio
|
||
|
||
|
||
@listener(outgoing=True, command="translate",
          description="通过 Google 翻译将目标消息翻译成指定的语言。(支持回复)",
          parameters="<文本>")
async def translate(context):
    """ Translate the command arguments, or the replied-to message, via Google Translate.

    The destination language is read from ``config['application_language']``.
    Command arguments take precedence over the text of the replied-to message.
    The translation replaces the command message; when the formatted output is
    longer than 4096 characters it is handed to ``attach_log`` as
    ``translation.txt`` instead.

    :param context: the outgoing command message supplied by the listener.
    """
    translator = Translator()
    reply = await context.get_reply_message()
    message = context.arguments
    lang = config['application_language']
    if not message and reply:
        message = reply.text
    # Also covers a reply that carries no text at all (e.g. bare media).
    if not message:
        await context.edit("出错了呜呜呜 ~ 无效的参数。")
        return

    try:
        await context.edit("正在生成翻译中 . . .")
        result = translator.translate(clear_emojis(message), dest=lang)
    except ValueError:
        await context.edit("出错了呜呜呜 ~ 找不到目标语言,请更正配置文件中的错误。")
        return

    # Fall back to the raw language code when it is missing from the
    # LANGUAGES table instead of failing with KeyError after the
    # translation has already succeeded.
    source_lang = LANGUAGES.get(result.src.lower(), result.src)
    trans_lang = LANGUAGES.get(result.dest.lower(), result.dest)
    output = f"**文本翻译** 源语言 {source_lang.title()}:\n{result.text}"

    if len(output) > 4096:
        await context.edit("输出超出 TG 限制,正在尝试上传文件。")
        await attach_log(output, context.chat_id, "translation.txt", context.id)
        # Over-length output: log without quoting the message. This branch
        # was unreachable before because of the early return.
        await log(f"把一条消息从 {source_lang} 翻译到了 {trans_lang}.")
        return
    await context.edit(output)
    await log(f"把 `{message}` 从 {source_lang} 翻译到了 {trans_lang}")
|
||
|
||
|
||
@listener(outgoing=True, command="tts",
          description="通过 Google文本到语音 基于字符串生成语音消息。",
          parameters="<string>")
async def tts(context):
    """ Send the command arguments, or the replied-to message, as a TTS voice note.

    The voice language is read from ``config['application_tts']``. The audio
    is written to ``vocals.mp3`` in the working directory, sent to the current
    chat as a voice note, and the file is removed afterwards even when
    generation or sending fails. The command message is deleted on success.

    :param context: the outgoing command message supplied by the listener.
    """
    reply = await context.get_reply_message()
    message = context.arguments
    lang = config['application_tts']
    if message:
        pass
    elif reply:
        message = reply.text
    else:
        await context.edit("出错了呜呜呜 ~ 无效的参数。")
        return

    try:
        await context.edit("生成语音中 . . .")
        # Build the gTTS object once; it is reused for the first save below.
        google_tts = gTTS(message, lang=lang)
    except AssertionError:
        await context.edit("出错了呜呜呜 ~ 无效的参数。")
        return
    except ValueError:
        await context.edit('出错了呜呜呜 ~ 找不到目标语言,请更正配置文件中的错误。')
        return
    except RuntimeError:
        await context.edit('出错了呜呜呜 ~ 加载语言数组时出错。')
        return

    audio_path = "vocals.mp3"
    try:
        google_tts.save(audio_path)
        with open(audio_path, "rb") as audio:
            line_count = sum(1 for _ in audio)
        # NOTE(review): a file that reads back as a single "line" is treated
        # as a failed download and generated once more; presumably a
        # workaround for truncated responses, so confirm it is still needed.
        if line_count == 1:
            gTTS(message, lang=lang).save(audio_path)
        await context.client.send_file(context.chat_id, audio_path, voice_note=True)
    finally:
        # Remove the temp file on every path, and only after all handles
        # are closed (removing an open file fails on Windows).
        try:
            remove(audio_path)
        except FileNotFoundError:
            pass

    if len(message) <= 4096:
        await log(f"生成了一条文本到语音的音频消息 : `{message}`.")
    else:
        await log("生成了一条文本到语音的音频消息。")
    await context.delete()
|
||
|
||
|
||
@listener(outgoing=True, command="google",
          description="使用 Google 查询",
          parameters="<query>")
async def google(context):
    """ Look up the command arguments on Google and show the leading hits.

    At most ``config['result_length']`` results are listed, each rendered as a
    Markdown link followed by its snippet. The listing replaces the command
    message with link previews disabled.

    :param context: the outgoing command message supplied by the listener.
    """
    query = context.arguments
    if query == "":
        await context.edit("出错了呜呜呜 ~ 无效的参数。")
        return

    await context.edit("正在拉取结果 . . .")
    response = GoogleSearch().search(query=query)

    entries = []
    for shown, hit in enumerate(response.results):
        # Stop once the configured number of hits has been collected.
        if shown == int(config['result_length']):
            break
        entries.append(f"\n[{hit.title}]({hit.url}) \n`{hit.text}`\n")
    listing = "".join(entries)

    await context.edit(f"**Google** |`{query}`| 🎙 🔍 \n"
                       f"{listing}",
                       link_preview=False)
    await log(f"在Google搜索引擎上查询了 `{query}`")
|
||
|
||
|
||
@listener(outgoing=True, command="fetchaudio",
          description="从多个平台获取音频文件。",
          parameters="<url>,<string>")
async def fetchaudio(context):
    """ Fetches audio from provided URL.

    The arguments have the form ``<url>[,<caption>]``; the caption defaults to
    ``"#audio "``. Only URLs matching the YouTube pattern are handled; the
    download and upload are delegated to ``fetch_youtube_audio``, whose falsy
    return value is treated as failure. When the command replies to a message,
    that message's id is passed along as the reply target.

    :param context: the outgoing command message supplied by the listener.
    """
    if not context.arguments:
        await context.edit("出错了呜呜呜 ~ 错误的语法。")
        return
    if ',' in context.arguments:
        url, string_2 = context.arguments.split(',', 1)
    else:
        url, string_2 = context.arguments, "#audio "
    # Whitespace around the URL would defeat the anchored pattern below.
    url = url.strip()

    reply = await context.get_reply_message()
    reply_id = reply.id if reply else None
    await context.edit("拉取音频中 . . .")

    youtube_pattern = regex_compile(r"^(http(s)?://)?((w){3}.)?youtu(be|.be)?(\.com)?/.+")
    if not youtube_pattern.match(url):
        # Unsupported or empty URL: report it rather than leaving the
        # "fetching" status on screen forever.
        await context.edit("出错了呜呜呜 ~ 无效的参数。")
        return
    if not await fetch_youtube_audio(url, context.chat_id, reply_id, string_2):
        await context.edit("出错了呜呜呜 ~ 原声带下载失败。")
        # Keep the error visible; do not log a success or delete the message.
        return
    await log(f"从链接中获取了一条音频,链接: {url}.")
    await context.delete()
|
||
|
||
class GoogleSearch:
    """ Scraper for Google's HTML search result pages.

    Pages are fetched with ``urllib`` using a desktop Firefox user agent and
    parsed with BeautifulSoup (``lxml`` parser) using the CSS selectors below.
    """

    USER_AGENT = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.14; rv:69.0) Gecko/20100101 Firefox/69.0"
    SEARCH_URL = "https://google.com/search"
    RESULT_SELECTOR = "div.r > a"
    TOTAL_SELECTOR = "#resultStats"
    RESULTS_PER_PAGE = 10
    DEFAULT_HEADERS = [
        ('User-Agent', USER_AGENT),
        ("Accept-Language", "en-US,en;q=0.5"),
    ]

    def search(self, query, num_results=10, prefetch_pages=True, prefetch_threads=10):
        """ Run a search and return a ``SearchResponse``.

        :param query: search string; it is URL-quoted before being sent.
        :param num_results: maximum number of results to return; enough
            pages of ``RESULTS_PER_PAGE`` are requested to cover it.
        :param prefetch_pages: when true, ``get_text`` of every result is
            invoked on a background thread before returning.
        :param prefetch_threads: upper bound on concurrently running
            prefetch threads.
        :return: ``SearchResponse`` with the collected results and the total
            hit count reported by the page (``None`` when it cannot be found).
        """
        search_results = []
        pages = int(ceil(num_results / float(GoogleSearch.RESULTS_PER_PAGE)))
        fetcher_threads = deque()
        total = None
        for page in range(pages):
            start = page * GoogleSearch.RESULTS_PER_PAGE
            url = GoogleSearch.SEARCH_URL + "?q=" + parse.quote(query)
            if start != 0:
                url += "&start=" + str(start)
            opener = request.build_opener()
            opener.addheaders = GoogleSearch.DEFAULT_HEADERS
            # The context manager closes the response even if read() raises.
            with opener.open(url) as response:
                soup = BeautifulSoup(response.read(), "lxml")
            if total is None:
                total = self._parse_total(soup)
            results = self.parse_results(soup.select(GoogleSearch.RESULT_SELECTOR))
            # Trim the last page so no more than num_results are returned.
            if len(search_results) + len(results) > num_results:
                del results[num_results - len(search_results):]
            search_results += results
            if prefetch_pages:
                for result in results:
                    # Wait until fewer than prefetch_threads are running.
                    while sum(thread.is_alive() for thread in fetcher_threads) >= prefetch_threads:
                        sleep(1)
                    fetcher_thread = Thread(target=result.get_text)
                    fetcher_thread.start()
                    fetcher_threads.append(fetcher_thread)
        for thread in fetcher_threads:
            thread.join()
        return SearchResponse(search_results, total)

    @staticmethod
    def _parse_total(soup):
        """ Return the hit count shown in the stats element, or ``None`` if absent. """
        stats = soup.select(GoogleSearch.TOTAL_SELECTOR)
        if not stats:
            return None
        total_text = next(iter(stats[0].children), None)
        if total_text is None:
            return None
        match = search("(([0-9]+[', ])*[0-9]+)", str(total_text))
        if match is None:
            return None
        # Strip the thousands separators before converting.
        return int(sub("[', ]", "", match.group(1)))

    @staticmethod
    def parse_results(results):
        """ Convert result anchor elements into ``SearchResult`` objects.

        Anchors without an ``href`` or an ``<h3>`` title are skipped so that
        one malformed entry does not abort the whole search; a missing
        snippet yields an empty description.

        :param results: iterable of anchor elements matched by
            ``RESULT_SELECTOR``.
        :return: list of ``SearchResult``.
        """
        search_results = []
        for result in results:
            url = result.get("href")
            headings = result.find_all('h3')
            if not url or not headings:
                continue
            snippets = result.parent.parent.find_all('div', {'class': 's'})
            text = snippets[0].text if snippets else ""
            search_results.append(SearchResult(headings[0].text, url, text))
        return search_results
|
||
|
||
|
||
class SearchResponse:
    """ Container pairing a list of search results with the reported total. """

    def __init__(self, results, total):
        # results: the collected result objects; total: the reported hit count.
        self.results, self.total = results, total
|
||
|
||
|
||
class SearchResult:
    """ A single search hit: its title, target URL and snippet text. """

    def __init__(self, title, url, text):
        self.title, self.url, self.text = title, url, text

    def get_text(self):
        """ Return the snippet text stored for this result. """
        return self.text

    def __str__(self):
        # Rendered as the dict of instance attributes.
        return str(vars(self))

    def __repr__(self):
        return str(self)
|