stacker.news/capture/index.js

116 lines
3.5 KiB
JavaScript
Raw Normal View History

2023-07-15 16:17:16 +00:00
import express from 'express'
import puppeteer from 'puppeteer'
/**
 * Read a numeric setting from the environment.
 *
 * Environment variables are always strings, so the raw value is converted
 * with Number(). The fallback is used when the variable is unset, blank, or
 * does not parse to a finite number. An explicit "0" is kept as 0.
 *
 * @param {string} name - environment variable name
 * @param {number} fallback - value to use when the variable is unusable
 * @returns {number}
 */
function envNumber (name, fallback) {
  const raw = process.env[name]
  if (raw === undefined || raw.trim() === '') return fallback
  const parsed = Number(raw)
  return Number.isFinite(parsed) ? parsed : fallback
}

// Base URL that incoming request paths are resolved against before capture.
const captureUrl = process.env.CAPTURE_URL || 'http://host.docker.internal:3000/'
// Port the HTTP server listens on.
const port = process.env.PORT || 5678
// Page-count threshold used by the capture route to reject requests with 503.
const maxPages = Number(process.env.MAX_PAGES) || 5
// Timeout (ms) used for page navigation and as puppeteer's protocolTimeout.
const timeout = Number(process.env.TIMEOUT) || 10000
// Interpolated into the Cache-Control header (max-age, and x24 for the stale-* directives).
const cache = envNumber('CACHE', 60000)
// Viewport settings; coerced to numbers because puppeteer's viewport options are numeric.
const width = envNumber('WIDTH', 600)
const height = envNumber('HEIGHT', 315)
const deviceScaleFactor = envNumber('SCALE_FACTOR', 2)
2024-02-04 02:14:54 +00:00
// Chrome command-line switches handed to puppeteer.launch() through `args`.
// List taken from https://www.bannerbear.com/blog/ways-to-speed-up-puppeteer-screenshots/
// Kept in alphabetical order, one switch per line.
const args = [
  '--autoplay-policy=user-gesture-required',
  '--disable-background-networking',
  '--disable-background-timer-throttling',
  '--disable-backgrounding-occluded-windows',
  '--disable-breakpad',
  '--disable-client-side-phishing-detection',
  '--disable-component-update',
  '--disable-default-apps',
  '--disable-dev-shm-usage',
  '--disable-domain-reliability',
  '--disable-extensions',
  '--disable-features=AudioServiceOutOfProcess',
  '--disable-hang-monitor',
  '--disable-ipc-flooding-protection',
  '--disable-notifications',
  '--disable-offer-store-unmasked-wallet-cards',
  '--disable-popup-blocking',
  '--disable-print-preview',
  '--disable-prompt-on-repost',
  '--disable-renderer-backgrounding',
  '--disable-setuid-sandbox',
  '--disable-speech-api',
  '--disable-sync',
  '--hide-scrollbars',
  '--ignore-gpu-blacklist',
  '--metrics-recording-only',
  '--mute-audio',
  '--no-default-browser-check',
  '--no-first-run',
  '--no-pings',
  '--no-sandbox',
  '--no-zygote',
  '--password-store=basic',
  '--use-gl=swiftshader',
  '--use-mock-keychain'
]
2023-07-15 16:17:16 +00:00
// Shared Chrome instance; stays undefined until the capture route launches it.
let browser

const app = express()

// Health endpoint: always answers 200 with an empty body.
app.get('/health', (_req, res) => {
  res.status(200)
  res.end()
})
// In-flight or completed launch promise. Caching the promise (rather than the
// resolved browser) lets concurrent first requests share one Chrome instance
// instead of each launching, and leaking, their own.
let browserLaunch

/**
 * Launch Chrome, record it in the module-level `browser`, and forget it again
 * when it disconnects so the next request starts a fresh instance.
 *
 * @returns {Promise<import('puppeteer').Browser>}
 */
async function launchBrowser () {
  const launched = await puppeteer.launch({
    headless: 'new',
    // Previously misspelled `useDataDir`, which puppeteer silently ignores.
    userDataDir: './data',
    executablePath: 'google-chrome-stable',
    args,
    protocolTimeout: timeout,
    defaultViewport: { width, height, deviceScaleFactor }
  })
  browser = launched
  launched.once('disconnected', () => {
    // Only clear state that still refers to this instance.
    if (browser !== launched) return
    browser = undefined
    browserLaunch = undefined
  })
  return launched
}

/**
 * Return the shared browser, launching it on first use.
 * A failed launch is not cached, so a later request can retry.
 *
 * @returns {Promise<import('puppeteer').Browser>}
 */
function getBrowser () {
  browserLaunch ||= launchBrowser().catch(err => {
    browserLaunch = undefined
    throw err
  })
  return browserLaunch
}

/**
 * Resolve a raw request target against `captureUrl`.
 *
 * Protocol-relative ("//host/...") and absolute-form request targets would
 * otherwise resolve to a different origin and make the browser load an
 * arbitrary site, so anything that leaves the configured origin is rejected.
 *
 * @param {string} originalUrl - request target as received by Express
 * @returns {URL|null} the URL to capture, or null if it is invalid or off-origin
 */
function resolveCaptureTarget (originalUrl) {
  const base = new URL(captureUrl)
  let target
  try {
    target = new URL(originalUrl, base)
  } catch {
    return null
  }
  return target.origin === base.origin ? target : null
}

/**
 * Capture route: loads the requested path on `captureUrl` in headless Chrome
 * (dark color scheme) and responds with a PNG screenshot of the viewport.
 *
 * Responses: 200 image/png on success, 400 for targets outside `captureUrl`'s
 * origin, 503 with Retry-After when too many pages are open, 500 on any error.
 */
app.get('/*', async (req, res) => {
  const url = resolveCaptureTarget(req.originalUrl)
  if (!url) {
    return res.status(400).end()
  }

  // Label for console.time/timeLog/timeEnd entries belonging to this request.
  const timeLabel = `${Date.now()}-${url.href}`
  const commentId = url.searchParams.get('commentId')

  let page, pages

  try {
    console.time(timeLabel)
    const activeBrowser = await getBrowser()

    pages = (await activeBrowser.pages()).length
    console.timeLog(timeLabel, 'capturing', 'current pages', pages)

    // limit number of active pages
    // NOTE(review): the +1 presumably accounts for the browser's initial blank
    // tab being included in pages() - confirm the intended limit.
    if (pages > maxPages + 1) {
      console.timeLog(timeLabel, 'too many pages')
      return res.writeHead(503, {
        'Retry-After': 1
      }).end()
    }

    page = await activeBrowser.newPage()
    await page.emulateMediaFeatures([{ name: 'prefers-color-scheme', value: 'dark' }])
    await page.goto(url.href, { waitUntil: 'load', timeout })
    console.timeLog(timeLabel, 'page loaded')

    if (commentId) {
      // Wait for the element carrying the `outline-it` class before capturing.
      console.timeLog(timeLabel, 'scrolling to comment')
      await page.waitForSelector('.outline-it')
    }

    const file = await page.screenshot({ type: 'png', captureBeyondViewport: false })
    console.timeLog(timeLabel, 'screenshot complete')

    res.setHeader('Content-Type', 'image/png')
    res.setHeader('Cache-Control', `public, max-age=${cache}, immutable, stale-while-revalidate=${cache * 24}, stale-if-error=${cache * 24}`)
    return res.status(200).end(file)
  } catch (err) {
    console.timeLog(timeLabel, 'error', err)
    return res.status(500).end()
  } finally {
    // console.timeEnd() only accepts the label, so the extra data goes through
    // timeLog() first.
    console.timeLog(timeLabel, 'pages at start', pages)
    console.timeEnd(timeLabel)
    // Best-effort cleanup; a failed close is logged but never fails the request.
    page?.close().catch(console.error)
  }
})
// Start the HTTP server and log the port once it is listening.
app.listen(port, () => {
  console.log(`Screenshot listen on http://:${port}`)
})