// Miao-Yunzai/renderers/puppeteer/lib/puppeteer.js
import Renderer from "../../../lib/renderer/Renderer.js"
import os from "node:os"
import lodash from "lodash"
import puppeteer from "puppeteer"
// Kept for now to stay compatible with the legacy config
import cfg from "../../../lib/config/config.js"

// Working directory of the process; template paths are resolved against it
const _path = process.cwd()
// MAC address of this host with the colons stripped; empty until first looked up
let mac = ""
/**
 * Screenshot renderer backed by a Chromium instance driven through puppeteer.
 *
 * Relies on `logger` and `redis` being available as globals (they are not
 * imported in this file) and on `dealTpl` being provided by the `Renderer`
 * base class — NOTE(review): confirm against the rest of the project.
 */
export default class Puppeteer extends Renderer {
  /**
   * @param {object} [config] renderer options; every field is optional
   * @param {boolean|string} [config.headless] puppeteer `headless` option; any falsy value falls back to "new"
   * @param {string[]} [config.args] Chromium command line arguments
   * @param {string} [config.chromiumPath] path of the Chromium executable to launch
   * @param {string} [config.puppeteerWS] websocket endpoint of an already running browser
   * @param {number} [config.puppeteerTimeout] screenshot timeout in milliseconds, 0 disables it
   */
  constructor(config = {}) {
    super({
      id: "puppeteer",
      type: "image",
      render: "screenshot"
    })
    /** Active browser instance, or false while none is available */
    this.browser = false
    /** True while browserInit() is connecting / launching */
    this.lock = false
    /** Names of the screenshots currently in progress */
    this.shoting = []
    /** Restart the browser after this many screenshots so rendering does not keep getting slower */
    this.restartNum = 100
    /** Number of screenshots taken so far */
    this.renderNum = 0
    /** Value of renderNum at the time of the most recent restart */
    this.lastRestartNum = 0

    this.config = {
      headless: config.headless || "new",
      args: config.args || [
        "--disable-gpu",
        "--disable-setuid-sandbox",
        "--no-sandbox",
        "--no-zygote"
      ]
    }

    /** Custom Chromium executable path (explicit config wins over the legacy bot config) */
    const executablePath = config.chromiumPath || cfg?.bot?.chromium_path
    if (executablePath) this.config.executablePath = executablePath

    /** Websocket endpoint of an existing browser to connect to */
    const wsEndpoint = config.puppeteerWS || cfg?.bot?.puppeteer_ws
    if (wsEndpoint) this.config.wsEndpoint = wsEndpoint

    /** Screenshot timeout in milliseconds; 0 means no timeout */
    this.puppeteerTimeout = config.puppeteerTimeout || cfg?.bot?.puppeteer_timeout || 0
  }

  /**
   * Initialise Chromium: reuse the current browser, connect to a cached or
   * configured websocket endpoint, or launch a new instance.
   * @returns {Promise<object|false>} the browser, or false when another
   *   initialisation is already running or the launch failed
   */
  async browserInit() {
    if (this.browser) return this.browser
    if (this.lock) return false
    this.lock = true

    logger.info("puppeteer Chromium 启动中...")

    let connectFlag = false
    try {
      // The MAC address is cached at module level, but the redis key is per
      // instance, so it must be set even when the address is already known.
      if (!mac) mac = await this.getMac()
      if (!this.browserMacKey) this.browserMacKey = `Yz:chromium:browserWSEndpoint:${mac}`

      // Prefer an endpoint cached in redis, then the configured one
      const browserUrl = (await redis.get(this.browserMacKey)) || this.config.wsEndpoint
      if (browserUrl) {
        try {
          const connected = await puppeteer.connect({ browserWSEndpoint: browserUrl })
          if (connected) {
            this.browser = connected
            connectFlag = true
            logger.info(`puppeteer Chromium 连接成功 ${browserUrl}`)
          }
        } catch (err) {
          // The endpoint is stale or unreachable: drop the cached value and launch instead
          await redis.del(this.browserMacKey)
        }
      }
    } catch (err) {
      // Reusing an instance is best-effort; report the problem and fall through to launching
      logger.error("puppeteer Chromium 连接已有实例失败", err)
    }

    if (!this.browser || !connectFlag) {
      // No reusable instance: launch a new browser
      this.browser = await puppeteer.launch(this.config).catch(err => {
        const errMsg = String(err)
        if (errMsg.includes("Could not find Chromium")) {
          logger.error("没有正确安装 Chromium可以尝试执行安装命令node node_modules/puppeteer/install.js")
        } else if (errMsg.includes("cannot open shared object file")) {
          logger.error("没有正确安装 Chromium 运行库")
        }
        logger.error(err)
        return false
      })
    }

    this.lock = false

    const browser = this.browser
    if (!browser) {
      logger.error("puppeteer Chromium 启动失败")
      return false
    }

    if (!connectFlag) {
      logger.info(`puppeteer Chromium 启动成功 ${browser.wsEndpoint()}`)
      if (this.browserMacKey) {
        // Cache the endpoint for 30 days; a cache failure must not fail the launch
        const expireTime = 60 * 60 * 24 * 30
        try {
          await redis.set(this.browserMacKey, browser.wsEndpoint(), { EX: expireTime })
        } catch (err) {
          logger.error("puppeteer Chromium 缓存实例地址失败", err)
        }
      }
    }

    /**
     * Watch for the Chromium instance disconnecting. Only react when the
     * disconnected browser is still the active one, so that the close event of
     * a browser we replaced ourselves cannot take down its successor.
     */
    browser.on("disconnected", () => {
      if (this.browser === browser) this.restart(true)
    })

    return browser
  }

  /**
   * Look up the MAC address of this host.
   * @returns {string} the first MAC address that is set and not all zeros,
   *   with the colons removed; "000000000000" when none is found
   */
  getMac() {
    const emptyMac = "00:00:00:00:00:00"
    let found = emptyMac
    try {
      for (const addresses of Object.values(os.networkInterfaces())) {
        const hit = addresses.find(item => item.mac && item.mac !== emptyMac)
        if (hit) {
          found = hit.mac
          break
        }
      }
    } catch (err) {
      // Deliberately ignored: fall back to the all-zero address
    }
    return found.replace(/:/g, "")
  }

  /**
   * Take a screenshot with `chromium`
   * @param name template name, used for logging and handed to dealTpl
   * @param data template parameters
   * @param data.tplFile template path, required
   * @param data.saveId name of the generated html; name is used when empty
   * @param data.imgType screenshot option: image type, jpeg or png
   * @param data.quality screenshot option: image quality 0-100, jpeg only, default 90
   * @param data.omitBackground screenshot option: hide the default white background so the image is transparent; default opaque
   * @param data.path screenshot option: where to save the image; nothing is written to disk when omitted
   * @param data.multiPage whether to split the screenshot into pages, default false
   * @param data.multiPageHeight page height when splitting, default 4000
   * @param data.pageGotoParams options passed to page.goto
   * @return the image buffer (an array of buffers when multiPage is set), not
   *   wrapped in a segment; false on failure
   */
  async screenshot(name, data = {}) {
    if (!await this.browserInit()) return false

    const pageHeight = data.multiPageHeight || 4000

    const savePath = this.dealTpl(name, data)
    if (!savePath) return false

    const start = Date.now()
    const ret = []
    this.shoting.push(name)

    const puppeteerTimeout = this.puppeteerTimeout
    let overtime
    if (puppeteerTimeout > 0) {
      // On timeout, force a browser restart and clear the waiting queue
      overtime = setTimeout(() => {
        if (this.shoting.length) {
          logger.error(`[图片生成][${name}] 截图超时,当前等待队列:${this.shoting.join(",")}`)
          this.restart(true)
          this.shoting = []
        }
      }, puppeteerTimeout)
    }

    try {
      const page = await this.browser.newPage()
      const pageGotoParams = lodash.extend({ timeout: 120000 }, data.pageGotoParams || {})
      await page.goto(`file://${_path}${lodash.trim(savePath, ".")}`, pageGotoParams)
      const body = await page.$("#container") || await page.$("body")

      // Size of the element that is going to be captured
      const boundingBox = await body.boundingBox()

      const randData = {
        type: data.imgType || "jpeg",
        omitBackground: data.omitBackground || false,
        quality: data.quality || 90,
        path: data.path || ""
      }

      // Number of pages
      let num = 1
      if (data.multiPage) {
        randData.type = "jpeg"
        num = Math.round(boundingBox.height / pageHeight) || 1
      }

      // quality is a jpeg-only option; decide on the effective type, which
      // multi-page mode may have forced to jpeg
      if (randData.type === "png") delete randData.quality

      if (!data.multiPage) {
        const buff = await body.screenshot(randData)
        this.renderNum++

        /** Image size */
        const kb = (buff.length / 1024).toFixed(2) + "KB"
        logger.mark(`[图片生成][${name}][${this.renderNum}次] ${kb} ${logger.green(`${Date.now() - start}ms`)}`)
        ret.push(buff)
      } else {
        // Paged screenshot
        if (num > 1) {
          await page.setViewport({
            width: boundingBox.width,
            height: pageHeight + 100
          })
        }

        for (let i = 1; i <= num; i++) {
          // Shrink the viewport on the last page to whatever height is left
          if (i !== 1 && i === num) {
            await page.setViewport({
              width: boundingBox.width,
              height: Math.trunc(boundingBox.height) - pageHeight * (num - 1)
            })
          }

          // Scroll down one page for every page after the first
          if (i !== 1) {
            await page.evaluate(pageHeight => window.scrollBy(0, pageHeight), pageHeight)
          }

          const buff = num === 1
            ? await body.screenshot(randData)
            : await page.screenshot(randData)

          if (num > 2) {
            await new Promise(resolve => setTimeout(resolve, 200))
          }

          this.renderNum++

          /** Image size */
          const kb = (buff.length / 1024).toFixed(2) + "KB"
          logger.mark(`[图片生成][${name}][${i}/${num}] ${kb}`)
          ret.push(buff)
        }

        if (num > 1) {
          logger.mark(`[图片生成][${name}] 处理完成`)
        }
      }

      page.close().catch(err => logger.error(err))
    } catch (err) {
      logger.error(`[图片生成][${name}] 图片生成失败`, err)
      /** Close the browser and start a new one */
      this.restart(true)
      return false
    } finally {
      if (overtime) clearTimeout(overtime)
      // Always take this job out of the queue, on success and on failure;
      // a leftover entry would block every later non-forced restart
      const index = this.shoting.indexOf(name)
      if (index !== -1) this.shoting.splice(index, 1)
    }

    if (ret.length === 0 || !ret[0]) {
      logger.error(`[图片生成][${name}] 图片生成为空`)
      return false
    }

    this.restart()

    return data.multiPage ? ret : ret[0]
  }

  /**
   * Close the current browser and start a new one.
   *
   * Without `force` this only happens once at least `restartNum` screenshots
   * were taken since the previous restart and no screenshot is in progress,
   * which keeps rendering from getting slower and slower.
   * @param {boolean} [force=false] restart regardless of counter and queue
   * @returns {Promise<object|false>|undefined} the browserInit() promise, or
   *   undefined when no restart was performed
   */
  restart(force = false) {
    if (!this.browser?.close || this.lock) return

    if (!force) {
      // Count since the last restart instead of testing for an exact
      // multiple: multi-page screenshots advance renderNum by more than one
      const rendersSinceRestart = this.renderNum - (this.lastRestartNum || 0)
      if (rendersSinceRestart < this.restartNum || this.shoting.length > 0) return
    }

    logger.info(`puppeteer Chromium ${force ? "强制" : ""}关闭重启...`)
    this.lastRestartNum = this.renderNum
    this.stop(this.browser)
    this.browser = false
    return this.browserInit()
  }

  /**
   * Close a browser; a failure to close is logged instead of thrown.
   * @param browser the browser instance to close
   */
  async stop(browser) {
    try {
      await browser.close()
    } catch (err) {
      logger.error("puppeteer Chromium 关闭错误", err)
    }
  }
}