Node.js 爬虫 Puppeteer 的基本使用

const puppeteer = require("puppeteer");

/**
 * Returns a promise that fulfills (with `undefined`) after a delay.
 *
 * @param {number} [ms=3000] - Delay in milliseconds; defaults to the
 *   3-second pause this helper originally hard-coded, so `timeout()` callers
 *   keep the same behavior.
 * @returns {Promise<void>} Promise that fulfills once the delay has elapsed.
 */
function timeout(ms = 3000) {
  // The promise never rejects, so only `resolve` is needed.
  return new Promise((resolve) => {
    setTimeout(resolve, ms);
  });
}

module.exports = async (url) => {
 //打开浏览器chrome 路由
  const browser = await puppeteer.launch({
    executablePath: "/Applications/Google Chrome.app/Contents/MacOS/Google\ Chrome",
    headless: true
  });
// 创建自页面
  const page = await browser.newPage();
// 打开一个网页
  await page.goto(url, {waitUtil: "networkidle2"});

  await timeout();
 // 在页面中执行js
  let results = await page.evaluate(() => {
    const tmp = [];
    
    return tmp;
  })
// 返货js执行结构
  return results;
// 关闭chrmoe
  await browser.close();
}
This entry was posted in node.js. Bookmark the permalink.

发表回复