增加网页截图,移除未使用到的依赖

This commit is contained in:
CMHopeSunshine 2022-09-25 16:27:45 +08:00
parent 3ee1bfb0c4
commit d5e9ffd890
3 changed files with 207 additions and 4 deletions

View File

@ -0,0 +1,34 @@
from nonebot import on_command
from nonebot.params import CommandArg
from nonebot.adapters.onebot.v11 import Message, MessageEvent
from nonebot.plugin import PluginMetadata
from LittlePaimon.utils.brower import AsyncPlaywright
# Plugin-level metadata object; `extra` carries free-form author/version/priority fields.
__plugin_meta__ = PluginMetadata(
    name='实用工具',
    description='一些实用的工具插件',
    usage='',
    extra=dict(
        author='惜月',
        version='3.0',
        priority=99,
    ),
)
# Matcher for the "网页截图" command. The `pm_*` entries are stored in the matcher's
# default state; presumably they are read by the project's plugin manager/help
# system (not visible here) — TODO confirm.
screenshot_cmd = on_command(
    '网页截图',
    priority=10,
    block=True,
    state=dict(
        pm_name='网页截图',
        pm_description='对指定链接页面进行截图【网页截图www.baidu.com】可选指定网页元素',
        pm_usage='网页截图<链接> [元素]',
        pm_priority=1,
    ),
)
@screenshot_cmd.handle()
async def _(event: MessageEvent, msg: Message = CommandArg()):
    """Handle the screenshot command: ``<url> [selector ...]``.

    The first whitespace-separated token of the command argument is the URL;
    any remaining tokens are passed on as a list of element selectors.

    :param event: the triggering message event (unused, injected by NoneBot)
    :param msg: the command argument, i.e. the message text after the command name
    """
    # split() without an argument collapses runs of whitespace, so repeated
    # spaces never produce empty-string "selectors" (split(' ') would).
    args = msg.extract_plain_text().split()
    if not args:
        # Nothing to screenshot: answer right away instead of launching the
        # browser against an empty URL.
        await screenshot_cmd.finish('请给出要截图的链接,例如:网页截图www.baidu.com')
    await screenshot_cmd.send('正在尝试截图,请稍等...')
    url, *selectors = args
    img = await AsyncPlaywright.screenshot(url, element=selectors or None)
    await screenshot_cmd.finish(img)

View File

@ -0,0 +1,172 @@
# https://github.com/HibiKier/zhenxun_bot/blob/main/utils
import asyncio
from pathlib import Path
from typing import Optional, Literal, Union, List, Dict
from nonebot import logger
from nonebot.adapters.onebot.v11 import MessageSegment
from playwright.async_api import Browser, async_playwright, Page, BrowserContext
# Module-level browser handle: None until init() assigns a launched Chromium
# instance; get_browser() returns it when set instead of launching again.
_browser: Optional[Browser] = None
async def init(**kwargs) -> Optional[Browser]:
    """Start Playwright, launch Chromium and store it in the module-level ``_browser``.

    If the first launch fails (typically because the Chromium binary is not
    installed yet), ``install()`` is run in a worker thread and the launch is
    retried once. An error from the retry propagates to the caller.

    :param kwargs: keyword arguments forwarded to ``chromium.launch``
    :return: the launched browser
    """
    global _browser
    playwright = await async_playwright().start()
    try:
        _browser = await playwright.chromium.launch(**kwargs)
    except Exception:
        # install() is blocking, so keep it off the event loop.
        await asyncio.get_running_loop().run_in_executor(None, install)
        _browser = await playwright.chromium.launch(**kwargs)
    # Return the browser on BOTH paths: the retry path used to return None,
    # which made the first get_browser() call after an install report failure
    # even though the browser had been launched.
    return _browser
async def get_browser(**kwargs) -> Browser:
    """Return the cached browser, launching one through ``init`` if none is set.

    :param kwargs: forwarded to ``init`` only when a launch is needed
    """
    if _browser:
        return _browser
    return await init(**kwargs)
def install():
    """Install or update Chromium by invoking Playwright's command-line entry point.

    Equivalent to running ``playwright install chromium``. The CLI reads its
    arguments from ``sys.argv`` and ends with ``SystemExit``, which is
    swallowed here so the host process keeps running.
    """
    logger.info("正在检查 Chromium 更新")
    import sys

    from playwright.__main__ import main

    saved_argv = sys.argv
    sys.argv = ["", "install", "chromium"]
    try:
        main()
    except SystemExit:
        pass
    finally:
        # sys.argv is process-wide state; put the original value back so the
        # rest of the application does not see the fake CLI arguments.
        sys.argv = saved_argv
class AsyncPlaywright:
    """Class-method helpers for opening pages and taking screenshots with the shared browser."""

    @classmethod
    async def _new_page(cls, user_agent: Optional[str] = None, **kwargs) -> Page:
        """Open a new page on the shared browser.

        :param user_agent: User-Agent value forwarded to ``browser.new_page``
        :param kwargs: extra keyword arguments forwarded to ``browser.new_page``
        :raises BrowserIsNone: if ``get_browser`` did not yield a browser
        """
        browser = await get_browser()
        if not browser:
            logger.info('获取浏览器失败')
            raise BrowserIsNone('获取浏览器失败')
        return await browser.new_page(user_agent=user_agent, **kwargs)

    @classmethod
    async def new_context(cls, user_agent: Optional[str] = None, **kwargs) -> BrowserContext:
        """Create a new browser context on the shared browser.

        :param user_agent: User-Agent value forwarded to ``browser.new_context``
        :param kwargs: extra keyword arguments forwarded to ``browser.new_context``
        :raises BrowserIsNone: if ``get_browser`` did not yield a browser
        """
        browser = await get_browser()
        if not browser:
            logger.info('获取浏览器失败')
            raise BrowserIsNone('获取浏览器失败')
        return await browser.new_context(user_agent=user_agent, **kwargs)

    @classmethod
    async def goto(
        cls,
        url: str,
        *,
        timeout: Optional[float] = 100000,
        wait_until: Optional[
            Literal["domcontentloaded", "load", "networkidle"]
        ] = "networkidle",
        referer: Optional[str] = None,
        **kwargs
    ) -> Optional[Page]:
        """Open a new page and navigate it to ``url``.

        :param url: address to load
        :param timeout: navigation timeout forwarded to ``page.goto``
            (milliseconds in Playwright's API)
        :param wait_until: load state to wait for, forwarded to ``page.goto``
        :param referer: Referer value forwarded to ``page.goto``
        :param kwargs: forwarded to ``_new_page``
        :return: the loaded page, or ``None`` if opening or navigating failed;
            the error is logged and a half-opened page is closed
        """
        page = None
        try:
            page = await cls._new_page(**kwargs)
            await page.goto(url, timeout=timeout, wait_until=wait_until, referer=referer)
            return page
        except Exception as e:
            logger.warning(f"Playwright 访问 url{url} 发生错误 {type(e)}{e}")
            if page:
                await page.close()
        return None

    @classmethod
    async def _locate(cls, page, element, wait_time):
        """Resolve ``element`` to the object that should be screenshotted.

        A single selector string is looked up on the page; a list of selectors
        is resolved as a chain, each one searched inside the previous match.

        :return: ``page`` itself when no element is requested, the matched
            element handle otherwise, or ``None`` if any selector matched nothing
        """
        if not element:
            return page
        selectors = [element] if isinstance(element, str) else element
        target = page
        for selector in selectors:
            if wait_time:
                # wait_time is multiplied by 1000 before being passed as the
                # Playwright timeout (i.e. seconds -> milliseconds).
                target = await target.wait_for_selector(selector, timeout=wait_time * 1000)
            else:
                target = await target.query_selector(selector)
            if target is None:
                return None
        return target

    @classmethod
    async def screenshot(
        cls,
        url: str,
        *,
        element: Optional[Union[str, List[str]]] = None,
        path: Optional[Union[Path, str]] = None,
        wait_time: Optional[int] = None,
        viewport_size: Optional[Dict[str, int]] = None,
        wait_until: Optional[
            Literal["domcontentloaded", "load", "networkidle"]
        ] = "networkidle",
        timeout: Optional[float] = None,
        **kwargs
    ) -> Optional[MessageSegment]:
        """Take a quick screenshot of a page or of one element on it.

        Intended for simple cases only; for anything more involved, drive a
        page directly.

        :param url: address to capture; ``https://`` is prepended when no
            http/https scheme is present
        :param element: a selector, or a list of selectors resolved as a
            nested chain; the whole page is captured when omitted
        :param path: optional file path the image is also written to
        :param wait_time: if set, wait up to this long for each selector to
            appear (value is multiplied by 1000 for Playwright)
        :param viewport_size: ``{'width': ..., 'height': ...}``; defaults to 1920x1080
        :param wait_until: load state to wait for during navigation
        :param timeout: timeout forwarded to the ``screenshot`` call itself
        :param kwargs: forwarded to ``goto``
        :return: an image segment on success, otherwise a text segment
            describing the failure
        """
        if not url.startswith(('https://', 'http://')):
            url = f'https://{url}'
        if viewport_size is None:
            viewport_size = dict(width=1920, height=1080)
        if path and isinstance(path, str):
            path = Path(path)
        page = await cls.goto(url, wait_until=wait_until, **kwargs)
        if page is None:
            # goto() already logged the cause and cleaned up; report it plainly
            # instead of letting a NoneType AttributeError reach the user.
            return MessageSegment.text(f'截图失败,报错信息:无法访问 {url}')
        try:
            await page.set_viewport_size(viewport_size)
            card = await cls._locate(page, element, wait_time)
            if card is None:
                logger.warning(f"Playwright 截图 url{url} element{element} 发生错误 未找到元素")
                return MessageSegment.text(f'截图失败,报错信息:未找到元素 {element}')
            # path=None is Playwright's default, so one call covers both cases.
            img = await card.screenshot(path=path, timeout=timeout)
            return MessageSegment.image(img)
        except Exception as e:
            logger.warning(f"Playwright 截图 url{url} element{element} 发生错误 {type(e)}{e}")
            return MessageSegment.text(f'截图失败,报错信息:{e}')
        finally:
            await page.close()
class UrlPathNumberNotEqual(Exception):
    """Error type not raised anywhere in the visible code.

    NOTE(review): the name suggests a mismatch between the number of URLs and
    the number of output paths — confirm against callers.
    """
class BrowserIsNone(Exception):
    """Raised when no browser instance could be obtained for a new page or context."""

View File

@ -1,6 +1,6 @@
[tool.poetry]
name = "LittlePaimon"
version = "3.0.0beta1"
version = "3.0.0beta7"
description = "小派蒙原神qq群机器人基于NoneBot2的UID查询、抽卡导出分析、模拟抽卡、实时便签、札记等多功能小助手。"
authors = ["惜月 <277073121@qq.com>"]
license = "AGPL"
@ -21,9 +21,6 @@ httpx = "^0.23.0"
lxml = "^4.8.0"
Pillow = "^9.1.0"
matplotlib = "^3.5.1"
pypinyin = "^0.46.0"
xlsxwriter = "^3.0.3"
aiofiles = "^0.8.0"
tortoise-orm = "^0.19.2"
tqdm = "^4.64.0"
"ruamel.yaml" = "^0.17.21"