2017-12-15 03:13:27 +00:00
|
|
|
/**
|
2024-01-03 10:11:33 +00:00
|
|
|
* @license
|
|
|
|
* Copyright 2017 Google Inc.
|
|
|
|
* SPDX-License-Identifier: Apache-2.0
|
2017-12-15 03:13:27 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
/**
 * @fileoverview Search developers.google.com/web for articles tagged
 * "Headless Chrome" and scrape results from the results page.
 */
|
|
|
|
|
|
|
|
'use strict';
|
|
|
|
|
|
|
|
const puppeteer = require('puppeteer');
|
|
|
|
|
2020-05-07 10:54:55 +00:00
|
|
|
/**
 * Entry point: launches a browser, searches developers.google.com/web for
 * "Headless Chrome", and prints one "<title> - <url>" line per search result.
 *
 * The browser is closed in a `finally` block so that a failed navigation or a
 * selector timeout does not leave the launched browser process running. Any
 * error is reported on stderr and the process exit code is set to 1.
 */
(async () => {
  const browser = await puppeteer.launch();

  try {
    const page = await browser.newPage();

    await page.goto('https://developers.google.com/web/');

    // Type into search box.
    await page.type('.devsite-search-field', 'Headless Chrome');

    // Wait for suggest overlay to appear and click "show all results".
    const allResultsSelector = '.devsite-suggest-all-results';
    await page.waitForSelector(allResultsSelector);
    await page.click(allResultsSelector);

    // Wait for the results page to load and display the results.
    const resultsSelector = '.gsc-table-result a.gs-title[href]';
    await page.waitForSelector(resultsSelector);

    // Extract the results from the page. The callback runs inside the page
    // context, so the selector has to be passed in as an argument rather than
    // captured from the enclosing scope.
    const links = await page.evaluate(selector => {
      const anchors = Array.from(document.querySelectorAll(selector));
      return anchors.map(anchor => {
        // Keep only the text before the first '|' in the anchor text.
        const title = anchor.textContent.split('|')[0].trim();
        return `${title} - ${anchor.href}`;
      });
    }, resultsSelector);

    console.log(links.join('\n'));
  } finally {
    // Always release the browser, even when a step above throws.
    await browser.close();
  }
})().catch(err => {
  // Do not leave the promise floating: report the failure and signal it to
  // the caller through a non-zero exit code.
  console.error(err);
  process.exitCode = 1;
});
|