add scraping route with headless chrome

This commit is contained in:
sjwie 2024-04-12 11:28:25 +09:00
parent bf503e548d
commit b5df196d96
3 changed files with 798 additions and 23 deletions

25
app/scrap/route.ts Normal file
View File

@ -0,0 +1,25 @@
// import chromium from "@sparticuz/chromium";
// import chromium from "chrome-aws-lambda";
const chromium = require("chrome-aws-lambda");
import { NextRequest, NextResponse } from "next/server";
// import * as puppeteer from "puppeteer-core";
import puppeteer from "puppeteer";
export default async function getBrowser() {
return puppeteer.launch({
args: [...chromium.args, "--hide-scrollbars", "--disable-web-security"],
defaultViewport: chromium.defaultViewport,
headless: false,
// ignoreHTTPSErrors: true,
});
}
export async function GET(request: NextRequest) {
const browser = await getBrowser();
const page = await browser.newPage();
await page.goto("https://naver.com");
const buffer = await page.screenshot({ type: "png" });
await browser.close();
const base64Image = buffer.toString("base64");
return NextResponse.json({ image: base64Image });
}

View File

@ -9,9 +9,14 @@
"lint": "next lint"
},
"dependencies": {
"@sparticuz/chromium": "^122.0.0",
"@sparticuz/chromium-min": "^122.0.0",
"@vercel/analytics": "^1.1.3",
"@vercel/speed-insights": "^1.0.9",
"chrome-aws-lambda": "^10.1.0",
"next": "14.1.0",
"puppeteer": "^22.4.0",
"puppeteer-core": "^22.3.0",
"react": "^18",
"react-dom": "^18",
"react-drawio": "^0.1.2",

791
yarn.lock

File diff suppressed because it is too large Load Diff