mirror of
https://github.com/puppeteer/puppeteer
synced 2024-06-14 14:02:48 +00:00
463 lines
11 KiB
TypeScript
463 lines
11 KiB
TypeScript
/**
|
|
* Copyright 2017 Google Inc. All rights reserved.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
import type {Readable} from 'stream';
|
|
|
|
import type {Protocol} from 'devtools-protocol';
|
|
|
|
import type {ElementHandle} from '../api/ElementHandle.js';
|
|
import type {JSHandle} from '../api/JSHandle.js';
|
|
import {Page} from '../api/Page.js';
|
|
import {isNode} from '../environment.js';
|
|
import {assert} from '../util/assert.js';
|
|
import {isErrorLike} from '../util/ErrorLike.js';
|
|
|
|
import type {CDPSession} from './Connection.js';
|
|
import {debug} from './Debug.js';
|
|
import {CDPElementHandle} from './ElementHandle.js';
|
|
import {TimeoutError} from './Errors.js';
|
|
import type {CommonEventEmitter} from './EventEmitter.js';
|
|
import type {ExecutionContext} from './ExecutionContext.js';
|
|
import {CDPJSHandle} from './JSHandle.js';
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const debugError = debug('puppeteer:error');
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function getExceptionMessage(
|
|
exceptionDetails: Protocol.Runtime.ExceptionDetails
|
|
): string {
|
|
if (exceptionDetails.exception) {
|
|
return (
|
|
exceptionDetails.exception.description || exceptionDetails.exception.value
|
|
);
|
|
}
|
|
let message = exceptionDetails.text;
|
|
if (exceptionDetails.stackTrace) {
|
|
for (const callframe of exceptionDetails.stackTrace.callFrames) {
|
|
const location =
|
|
callframe.url +
|
|
':' +
|
|
callframe.lineNumber +
|
|
':' +
|
|
callframe.columnNumber;
|
|
const functionName = callframe.functionName || '<anonymous>';
|
|
message += `\n at ${functionName} (${location})`;
|
|
}
|
|
}
|
|
return message;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function valueFromRemoteObject(
|
|
remoteObject: Protocol.Runtime.RemoteObject
|
|
): any {
|
|
assert(!remoteObject.objectId, 'Cannot extract value when objectId is given');
|
|
if (remoteObject.unserializableValue) {
|
|
if (remoteObject.type === 'bigint') {
|
|
return BigInt(remoteObject.unserializableValue.replace('n', ''));
|
|
}
|
|
switch (remoteObject.unserializableValue) {
|
|
case '-0':
|
|
return -0;
|
|
case 'NaN':
|
|
return NaN;
|
|
case 'Infinity':
|
|
return Infinity;
|
|
case '-Infinity':
|
|
return -Infinity;
|
|
default:
|
|
throw new Error(
|
|
'Unsupported unserializable value: ' +
|
|
remoteObject.unserializableValue
|
|
);
|
|
}
|
|
}
|
|
return remoteObject.value;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function releaseObject(
|
|
client: CDPSession,
|
|
remoteObject: Protocol.Runtime.RemoteObject
|
|
): Promise<void> {
|
|
if (!remoteObject.objectId) {
|
|
return;
|
|
}
|
|
await client
|
|
.send('Runtime.releaseObject', {objectId: remoteObject.objectId})
|
|
.catch(error => {
|
|
// Exceptions might happen in case of a page been navigated or closed.
|
|
// Swallow these since they are harmless and we don't leak anything in this case.
|
|
debugError(error);
|
|
});
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export interface PuppeteerEventListener {
|
|
emitter: CommonEventEmitter;
|
|
eventName: string | symbol;
|
|
handler: (...args: any[]) => void;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function addEventListener(
|
|
emitter: CommonEventEmitter,
|
|
eventName: string | symbol,
|
|
handler: (...args: any[]) => void
|
|
): PuppeteerEventListener {
|
|
emitter.on(eventName, handler);
|
|
return {emitter, eventName, handler};
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function removeEventListeners(
|
|
listeners: Array<{
|
|
emitter: CommonEventEmitter;
|
|
eventName: string | symbol;
|
|
handler: (...args: any[]) => void;
|
|
}>
|
|
): void {
|
|
for (const listener of listeners) {
|
|
listener.emitter.removeListener(listener.eventName, listener.handler);
|
|
}
|
|
listeners.length = 0;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const isString = (obj: unknown): obj is string => {
|
|
return typeof obj === 'string' || obj instanceof String;
|
|
};
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const isNumber = (obj: unknown): obj is number => {
|
|
return typeof obj === 'number' || obj instanceof Number;
|
|
};
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const isPlainObject = (obj: unknown): obj is Record<any, unknown> => {
|
|
return typeof obj === 'object' && obj?.constructor === Object;
|
|
};
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const isRegExp = (obj: unknown): obj is RegExp => {
|
|
return typeof obj === 'object' && obj?.constructor === RegExp;
|
|
};
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export const isDate = (obj: unknown): obj is Date => {
|
|
return typeof obj === 'object' && obj?.constructor === Date;
|
|
};
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function waitForEvent<T>(
|
|
emitter: CommonEventEmitter,
|
|
eventName: string | symbol,
|
|
predicate: (event: T) => Promise<boolean> | boolean,
|
|
timeout: number,
|
|
abortPromise: Promise<Error>
|
|
): Promise<T> {
|
|
let eventTimeout: NodeJS.Timeout;
|
|
let resolveCallback: (value: T | PromiseLike<T>) => void;
|
|
let rejectCallback: (value: Error) => void;
|
|
const promise = new Promise<T>((resolve, reject) => {
|
|
resolveCallback = resolve;
|
|
rejectCallback = reject;
|
|
});
|
|
const listener = addEventListener(emitter, eventName, async event => {
|
|
if (!(await predicate(event))) {
|
|
return;
|
|
}
|
|
resolveCallback(event);
|
|
});
|
|
if (timeout) {
|
|
eventTimeout = setTimeout(() => {
|
|
rejectCallback(
|
|
new TimeoutError('Timeout exceeded while waiting for event')
|
|
);
|
|
}, timeout);
|
|
}
|
|
function cleanup(): void {
|
|
removeEventListeners([listener]);
|
|
clearTimeout(eventTimeout);
|
|
}
|
|
const result = await Promise.race([promise, abortPromise]).then(
|
|
r => {
|
|
cleanup();
|
|
return r;
|
|
},
|
|
error => {
|
|
cleanup();
|
|
throw error;
|
|
}
|
|
);
|
|
if (isErrorLike(result)) {
|
|
throw result;
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function createJSHandle(
|
|
context: ExecutionContext,
|
|
remoteObject: Protocol.Runtime.RemoteObject
|
|
): JSHandle | ElementHandle<Node> {
|
|
if (remoteObject.subtype === 'node' && context._world) {
|
|
return new CDPElementHandle(context, remoteObject, context._world.frame());
|
|
}
|
|
return new CDPJSHandle(context, remoteObject);
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function evaluationString(
|
|
fun: Function | string,
|
|
...args: unknown[]
|
|
): string {
|
|
if (isString(fun)) {
|
|
assert(args.length === 0, 'Cannot evaluate a string with arguments');
|
|
return fun;
|
|
}
|
|
|
|
function serializeArgument(arg: unknown): string {
|
|
if (Object.is(arg, undefined)) {
|
|
return 'undefined';
|
|
}
|
|
return JSON.stringify(arg);
|
|
}
|
|
|
|
return `(${fun})(${args.map(serializeArgument).join(',')})`;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function addPageBinding(type: string, name: string): void {
|
|
// This is the CDP binding.
|
|
// @ts-expect-error: In a different context.
|
|
const callCDP = globalThis[name];
|
|
|
|
// We replace the CDP binding with a Puppeteer binding.
|
|
Object.assign(globalThis, {
|
|
[name](...args: unknown[]): Promise<unknown> {
|
|
// This is the Puppeteer binding.
|
|
// @ts-expect-error: In a different context.
|
|
const callPuppeteer = globalThis[name];
|
|
callPuppeteer.args ??= new Map();
|
|
callPuppeteer.callbacks ??= new Map();
|
|
|
|
const seq = (callPuppeteer.lastSeq ?? 0) + 1;
|
|
callPuppeteer.lastSeq = seq;
|
|
callPuppeteer.args.set(seq, args);
|
|
|
|
callCDP(
|
|
JSON.stringify({
|
|
type,
|
|
name,
|
|
seq,
|
|
args,
|
|
isTrivial: !args.some(value => {
|
|
return value instanceof Node;
|
|
}),
|
|
})
|
|
);
|
|
|
|
return new Promise((resolve, reject) => {
|
|
callPuppeteer.callbacks.set(seq, {
|
|
resolve(value: unknown) {
|
|
callPuppeteer.args.delete(seq);
|
|
resolve(value);
|
|
},
|
|
reject(value?: unknown) {
|
|
callPuppeteer.args.delete(seq);
|
|
reject(value);
|
|
},
|
|
});
|
|
});
|
|
},
|
|
});
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export function pageBindingInitString(type: string, name: string): string {
|
|
return evaluationString(addPageBinding, type, name);
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function waitWithTimeout<T>(
|
|
promise: Promise<T>,
|
|
taskName: string,
|
|
timeout: number
|
|
): Promise<T> {
|
|
let reject: (reason?: Error) => void;
|
|
const timeoutError = new TimeoutError(
|
|
`waiting for ${taskName} failed: timeout ${timeout}ms exceeded`
|
|
);
|
|
const timeoutPromise = new Promise<never>((_, rej) => {
|
|
return (reject = rej);
|
|
});
|
|
let timeoutTimer = null;
|
|
if (timeout) {
|
|
timeoutTimer = setTimeout(() => {
|
|
return reject(timeoutError);
|
|
}, timeout);
|
|
}
|
|
try {
|
|
return await Promise.race([promise, timeoutPromise]);
|
|
} finally {
|
|
if (timeoutTimer) {
|
|
clearTimeout(timeoutTimer);
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
let fs: typeof import('fs/promises') | null = null;
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function importFSPromises(): Promise<
|
|
typeof import('fs/promises')
|
|
> {
|
|
if (!fs) {
|
|
fs = await import('fs/promises');
|
|
}
|
|
return fs;
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function getReadableAsBuffer(
|
|
readable: Readable,
|
|
path?: string
|
|
): Promise<Buffer | null> {
|
|
const buffers = [];
|
|
if (path) {
|
|
let fs: typeof import('fs/promises');
|
|
try {
|
|
fs = await importFSPromises();
|
|
} catch (error) {
|
|
if (error instanceof TypeError) {
|
|
throw new Error(
|
|
'Cannot write to a path outside of a Node-like environment.'
|
|
);
|
|
}
|
|
throw error;
|
|
}
|
|
const fileHandle = await fs.open(path, 'w+');
|
|
for await (const chunk of readable) {
|
|
buffers.push(chunk);
|
|
await fileHandle.writeFile(chunk);
|
|
}
|
|
await fileHandle.close();
|
|
} else {
|
|
for await (const chunk of readable) {
|
|
buffers.push(chunk);
|
|
}
|
|
}
|
|
try {
|
|
return Buffer.concat(buffers);
|
|
} catch (error) {
|
|
return null;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function getReadableFromProtocolStream(
|
|
client: CDPSession,
|
|
handle: string
|
|
): Promise<Readable> {
|
|
// TODO: Once Node 18 becomes the lowest supported version, we can migrate to
|
|
// ReadableStream.
|
|
if (!isNode) {
|
|
throw new Error('Cannot create a stream outside of Node.js environment.');
|
|
}
|
|
|
|
const {Readable} = await import('stream');
|
|
|
|
let eof = false;
|
|
return new Readable({
|
|
async read(size: number) {
|
|
if (eof) {
|
|
return;
|
|
}
|
|
|
|
const response = await client.send('IO.read', {handle, size});
|
|
this.push(response.data, response.base64Encoded ? 'base64' : undefined);
|
|
if (response.eof) {
|
|
eof = true;
|
|
await client.send('IO.close', {handle});
|
|
this.push(null);
|
|
}
|
|
},
|
|
});
|
|
}
|
|
|
|
/**
|
|
* @internal
|
|
*/
|
|
export async function setPageContent(
|
|
page: Pick<Page, 'evaluate'>,
|
|
content: string
|
|
): Promise<void> {
|
|
// We rely upon the fact that document.open() will reset frame lifecycle with "init"
|
|
// lifecycle event. @see https://crrev.com/608658
|
|
return page.evaluate(html => {
|
|
document.open();
|
|
document.write(html);
|
|
document.close();
|
|
}, content);
|
|
}
|