/** * Copyright 2019 Google Inc. All rights reserved. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import { assert } from './assert.js'; import { helper, debugError } from './helper.js'; import { LifecycleWatcher, PuppeteerLifeCycleEvent, } from './LifecycleWatcher.js'; import { TimeoutError } from './Errors.js'; import { JSHandle, ElementHandle } from './JSHandle.js'; import { ExecutionContext } from './ExecutionContext.js'; import { TimeoutSettings } from './TimeoutSettings.js'; import { MouseButton } from './Input.js'; import { FrameManager, Frame } from './FrameManager.js'; import { getQueryHandlerAndSelector } from './QueryHandler.js'; import { SerializableOrJSHandle, EvaluateHandleFn, WrapElementHandle, EvaluateFn, EvaluateFnReturnType, UnwrapPromiseLike, } from './EvalTypes.js'; import { isNode } from '../environment.js'; import { Protocol } from 'devtools-protocol'; // predicateQueryHandler and checkWaitForOptions are declared here so that // TypeScript knows about them when used in the predicate function below. 
declare const predicateQueryHandler: (
  element: Element | Document,
  selector: string
) => Promise<Element | Element[] | NodeListOf<Element>>;
declare const checkWaitForOptions: (
  node: Node,
  waitForVisible: boolean,
  waitForHidden: boolean
) => Element | null | boolean;

/**
 * Options accepted by the `waitForSelector` / `waitForXPath` family.
 *
 * @public
 */
export interface WaitForSelectorOptions {
  /** Wait until the matched node passes the visibility check. */
  visible?: boolean;
  /** Wait until the matched node passes the hidden check. */
  hidden?: boolean;
  /** Maximum time to wait in milliseconds; a falsy value disables the timer. */
  timeout?: number;
}

/**
 * Wraps the execution context of a frame and exposes DOM-level helpers
 * (querying, evaluating, waiting, injecting tags) that run inside it.
 *
 * The execution context is replaced whenever `_setContext` is called, so all
 * helpers obtain it through the `executionContext()` promise.
 *
 * @internal
 */
export class DOMWorld {
  private _frameManager: FrameManager;
  private _frame: Frame;
  private _timeoutSettings: TimeoutSettings;
  private _documentPromise?: Promise<ElementHandle> = null;
  private _contextPromise?: Promise<ExecutionContext> = null;

  // Resolver of the pending `_contextPromise`; null once a context is set.
  private _contextResolveCallback?: (x?: ExecutionContext) => void = null;

  private _detached = false;
  /**
   * Wait tasks that are still pending in this world.
   *
   * @internal
   */
  _waitTasks = new Set<WaitTask>();

  // Contains mapping from functions that should be bound to Puppeteer functions.
  private _boundFunctions = new Map<string, Function>();
  // Set of bindings that have been registered in the current context.
  private _ctxBindings = new Set<string>();

  constructor(
    frameManager: FrameManager,
    frame: Frame,
    timeoutSettings: TimeoutSettings
  ) {
    this._frameManager = frameManager;
    this._frame = frame;
    this._timeoutSettings = timeoutSettings;
    // Start without a context: this creates the pending context promise.
    this._setContext(null);
    frameManager._client.on('Runtime.bindingCalled', (event) =>
      this._onBindingCalled(event)
    );
  }

  /** Returns the frame this world belongs to. */
  frame(): Frame {
    return this._frame;
  }

  /**
   * Installs a new execution context, or clears the current one.
   *
   * With a context: resolves the pending context promise, re-registers every
   * known binding in the new context and reruns all pending wait tasks.
   * Without a context: drops the cached document and creates a fresh pending
   * context promise.
   */
  async _setContext(context?: ExecutionContext): Promise<void> {
    if (context) {
      this._contextResolveCallback.call(null, context);
      this._contextResolveCallback = null;
      // Bindings live in a context, so they must be added again.
      this._ctxBindings.clear();
      for (const name of this._boundFunctions.keys()) {
        await this.addBindingToContext(name);
      }
      for (const waitTask of this._waitTasks) waitTask.rerun();
    } else {
      this._documentPromise = null;
      this._contextPromise = new Promise((fulfill) => {
        this._contextResolveCallback = fulfill;
      });
    }
  }

  /** True when a context has been set (no resolver is pending). */
  _hasContext(): boolean {
    return !this._contextResolveCallback;
  }

  /** Marks the world as detached and terminates every pending wait task. */
  _detach(): void {
    this._detached = true;
    for (const waitTask of this._waitTasks)
      waitTask.terminate(
        new Error('waitForFunction failed: frame got detached.')
      );
  }

  /**
   * Returns the promise for the current execution context.
   *
   * @throws Error synchronously when the world has been detached.
   */
  executionContext(): Promise<ExecutionContext> {
    if (this._detached)
      throw new Error(
        `Execution context is not available in detached frame "${this._frame.url()}" (are you trying to evaluate?)`
      );
    return this._contextPromise;
  }

  /** Evaluates `pageFunction` in the current context and returns a handle. */
  async evaluateHandle<HandlerType extends JSHandle = JSHandle>(
    pageFunction: EvaluateHandleFn,
    ...args: SerializableOrJSHandle[]
  ): Promise<HandlerType> {
    const context = await this.executionContext();
    return context.evaluateHandle(pageFunction, ...args);
  }

  /** Evaluates `pageFunction` in the current context and returns its value. */
  async evaluate<T extends EvaluateFn>(
    pageFunction: T,
    ...args: SerializableOrJSHandle[]
  ): Promise<UnwrapPromiseLike<EvaluateFnReturnType<T>>> {
    const context = await this.executionContext();
    return context.evaluate<UnwrapPromiseLike<EvaluateFnReturnType<T>>>(
      pageFunction,
      ...args
    );
  }

  /** Queries the document for `selector` via the document handle's `$`. */
  async $(selector: string): Promise<ElementHandle | null> {
    const document = await this._document();
    const value = await document.$(selector);
    return value;
  }

  /**
   * Returns a handle to `document` in the current context. The promise is
   * cached until the context is cleared by `_setContext(null)`.
   */
  async _document(): Promise<ElementHandle> {
    if (this._documentPromise) return this._documentPromise;
    this._documentPromise = this.executionContext().then(async (context) => {
      const document = await context.evaluateHandle('document');
      return document.asElement();
    });
    return this._documentPromise;
  }

  /** Evaluates the XPath `expression` against the document handle. */
  async $x(expression: string): Promise<ElementHandle[]> {
    const document = await this._document();
    const value = await document.$x(expression);
    return value;
  }

  /** Delegates to the document handle's `$eval`. */
  async $eval<ReturnType>(
    selector: string,
    pageFunction: (
      element: Element,
      ...args: unknown[]
    ) => ReturnType | Promise<ReturnType>,
    ...args: SerializableOrJSHandle[]
  ): Promise<WrapElementHandle<ReturnType>> {
    const document = await this._document();
    return document.$eval<ReturnType>(selector, pageFunction, ...args);
  }

  /** Delegates to the document handle's `$$eval`. */
  async $$eval<ReturnType>(
    selector: string,
    pageFunction: (
      elements: Element[],
      ...args: unknown[]
    ) => ReturnType | Promise<ReturnType>,
    ...args: SerializableOrJSHandle[]
  ): Promise<WrapElementHandle<ReturnType>> {
    const document = await this._document();
    const value = await document.$$eval<ReturnType>(
      selector,
      pageFunction,
      ...args
    );
    return value;
  }

  /** Delegates to the document handle's `$$`. */
  async $$(selector: string): Promise<ElementHandle[]> {
    const document = await this._document();
    const value = await document.$$(selector);
    return value;
  }

  /**
   * Returns the serialized doctype (when present) followed by the outer HTML
   * of the document element (when present).
   */
  async content(): Promise<string> {
    return await this.evaluate(() => {
      let retVal = '';
      if (document.doctype)
        retVal = new XMLSerializer().serializeToString(document.doctype);
      if (document.documentElement)
        retVal += document.documentElement.outerHTML;
      return retVal;
    });
  }

  /**
   * Replaces the document with `html` and waits for the requested lifecycle
   * events (default `load`) or the navigation timeout.
   *
   * @throws the error produced by the lifecycle watcher on timeout or
   * termination.
   */
  async setContent(
    html: string,
    options: {
      timeout?: number;
      waitUntil?: PuppeteerLifeCycleEvent | PuppeteerLifeCycleEvent[];
    } = {}
  ): Promise<void> {
    const {
      waitUntil = ['load'],
      timeout = this._timeoutSettings.navigationTimeout(),
    } = options;
    // We rely upon the fact that document.open() will reset frame lifecycle with "init"
    // lifecycle event. @see https://crrev.com/608658
    await this.evaluate<(x: string) => void>((html) => {
      document.open();
      document.write(html);
      document.close();
    }, html);
    const watcher = new LifecycleWatcher(
      this._frameManager,
      this._frame,
      waitUntil,
      timeout
    );
    const error = await Promise.race([
      watcher.timeoutOrTerminationPromise(),
      watcher.lifecyclePromise(),
    ]);
    watcher.dispose();
    if (error) throw error;
  }

  /**
   * Adds a script tag into the current context.
   *
   * @remarks
   *
   * You can pass a URL, filepath or string of contents. Note that when running Puppeteer
   * in a browser environment you cannot pass a filepath and should use either
   * `url` or `content`.
   */
  async addScriptTag(options: {
    url?: string;
    path?: string;
    content?: string;
    type?: string;
  }): Promise<ElementHandle> {
    const { url = null, path = null, content = null, type = '' } = options;
    if (url !== null) {
      try {
        const context = await this.executionContext();
        return (
          await context.evaluateHandle(addScriptUrl, url, type)
        ).asElement();
      } catch (error) {
        throw new Error(`Loading script from ${url} failed`);
      }
    }

    if (path !== null) {
      if (!isNode) {
        throw new Error(
          'Cannot pass a filepath to addScriptTag in the browser environment.'
        );
      }
      const fs = await import('fs');
      let contents = await fs.promises.readFile(path, 'utf8');
      // Name the injected script after its file; newlines are stripped from
      // the path before it is appended.
      contents += '//# sourceURL=' + path.replace(/\n/g, '');
      const context = await this.executionContext();
      return (
        await context.evaluateHandle(addScriptContent, contents, type)
      ).asElement();
    }

    if (content !== null) {
      const context = await this.executionContext();
      return (
        await context.evaluateHandle(addScriptContent, content, type)
      ).asElement();
    }

    throw new Error(
      'Provide an object with a `url`, `path` or `content` property'
    );

    // The two helpers below are passed to `evaluateHandle`; they only touch
    // page globals and their own arguments.
    async function addScriptUrl(
      url: string,
      type: string
    ): Promise<HTMLElement> {
      const script = document.createElement('script');
      script.src = url;
      if (type) script.type = type;
      const promise = new Promise((res, rej) => {
        script.onload = res;
        script.onerror = rej;
      });
      document.head.appendChild(script);
      await promise;
      return script;
    }

    function addScriptContent(
      content: string,
      type = 'text/javascript'
    ): HTMLElement {
      const script = document.createElement('script');
      script.type = type;
      script.text = content;
      let error = null;
      script.onerror = (e) => (error = e);
      document.head.appendChild(script);
      if (error) throw error;
      return script;
    }
  }

  /**
   * Adds a style tag into the current context.
   *
   * @remarks
   *
   * You can pass a URL, filepath or string of contents. Note that when running Puppeteer
   * in a browser environment you cannot pass a filepath and should use either
   * `url` or `content`.
   *
   */
  async addStyleTag(options: {
    url?: string;
    path?: string;
    content?: string;
  }): Promise<ElementHandle> {
    const { url = null, path = null, content = null } = options;
    if (url !== null) {
      try {
        const context = await this.executionContext();
        return (await context.evaluateHandle(addStyleUrl, url)).asElement();
      } catch (error) {
        throw new Error(`Loading style from ${url} failed`);
      }
    }

    if (path !== null) {
      if (!isNode) {
        throw new Error(
          'Cannot pass a filepath to addStyleTag in the browser environment.'
        );
      }
      const fs = await import('fs');
      let contents = await fs.promises.readFile(path, 'utf8');
      contents += '/*# sourceURL=' + path.replace(/\n/g, '') + '*/';
      const context = await this.executionContext();
      return (
        await context.evaluateHandle(addStyleContent, contents)
      ).asElement();
    }

    if (content !== null) {
      const context = await this.executionContext();
      return (
        await context.evaluateHandle(addStyleContent, content)
      ).asElement();
    }

    throw new Error(
      'Provide an object with a `url`, `path` or `content` property'
    );

    // The two helpers below are passed to `evaluateHandle`; they only touch
    // page globals and their own arguments.
    async function addStyleUrl(url: string): Promise<HTMLElement> {
      const link = document.createElement('link');
      link.rel = 'stylesheet';
      link.href = url;
      const promise = new Promise((res, rej) => {
        link.onload = res;
        link.onerror = rej;
      });
      document.head.appendChild(link);
      await promise;
      return link;
    }

    async function addStyleContent(content: string): Promise<HTMLElement> {
      const style = document.createElement('style');
      style.type = 'text/css';
      style.appendChild(document.createTextNode(content));
      const promise = new Promise((res, rej) => {
        style.onload = res;
        style.onerror = rej;
      });
      document.head.appendChild(style);
      await promise;
      return style;
    }
  }

  /**
   * Clicks the first element matching `selector`.
   *
   * @throws when no element matches.
   */
  async click(
    selector: string,
    options: { delay?: number; button?: MouseButton; clickCount?: number }
  ): Promise<void> {
    const handle = await this.$(selector);
    assert(handle, 'No node found for selector: ' + selector);
    await handle.click(options);
    await handle.dispose();
  }

  /**
   * Focuses the first element matching `selector`.
   *
   * @throws when no element matches.
   */
  async focus(selector: string): Promise<void> {
    const handle = await this.$(selector);
    assert(handle, 'No node found for selector: ' + selector);
    await handle.focus();
    await handle.dispose();
  }

  /**
   * Hovers over the first element matching `selector`.
   *
   * @throws when no element matches.
   */
  async hover(selector: string): Promise<void> {
    const handle = await this.$(selector);
    assert(handle, 'No node found for selector: ' + selector);
    await handle.hover();
    await handle.dispose();
  }

  /**
   * Calls `select(...values)` on the first element matching `selector` and
   * returns its result.
   *
   * @throws when no element matches.
   */
  async select(selector: string, ...values: string[]): Promise<string[]> {
    const handle = await this.$(selector);
    assert(handle, 'No node found for selector: ' + selector);
    const result = await handle.select(...values);
    await handle.dispose();
    return result;
  }

  /**
   * Taps the first element matching `selector`.
   *
   * @throws when no element matches.
   */
  async tap(selector: string): Promise<void> {
    const handle = await this.$(selector);
    // Same guard as click/focus/hover/select/type: fail with a descriptive
    // message instead of a TypeError on `null`.
    assert(handle, 'No node found for selector: ' + selector);
    await handle.tap();
    await handle.dispose();
  }

  /**
   * Types `text` into the first element matching `selector`.
   *
   * @throws when no element matches.
   */
  async type(
    selector: string,
    text: string,
    options?: { delay: number }
  ): Promise<void> {
    const handle = await this.$(selector);
    assert(handle, 'No node found for selector: ' + selector);
    await handle.type(text, options);
    await handle.dispose();
  }

  /**
   * Resolves the query handler for `selector` and delegates the wait to it.
   */
  async waitForSelector(
    selector: string,
    options: WaitForSelectorOptions
  ): Promise<ElementHandle | null> {
    const { updatedSelector, queryHandler } = getQueryHandlerAndSelector(
      selector
    );
    return queryHandler.waitFor(this, updatedSelector, options);
  }

  // If multiple waitFor are set up asynchronously, we need to wait for the
  // first one to set up the binding in the page before running the others.
  private _settingUpBinding: Promise<void> | null = null;

  /**
   * Registers the binding `name` in the current execution context unless it
   * is already registered there. Concurrent callers are serialized through
   * `_settingUpBinding`.
   *
   * @internal
   */
  async addBindingToContext(name: string) {
    // Previous operation added the binding so we are done.
    if (this._ctxBindings.has(name)) return;
    // Wait for other operation to finish
    if (this._settingUpBinding) {
      await this._settingUpBinding;
      return this.addBindingToContext(name);
    }

    const bind = async (name: string) => {
      const expression = helper.pageBindingInitString('internal', name);
      try {
        const context = await this.executionContext();
        await context._client.send('Runtime.addBinding', {
          name,
          executionContextId: context._contextId,
        });
        await context.evaluate(expression);
      } catch (error) {
        // We could have tried to evaluate in a context which was already
        // destroyed. This happens, for example, if the page is navigated while
        // we are trying to add the binding
        const ctxDestroyed = error.message.includes(
          'Execution context was destroyed'
        );
        const ctxNotFound = error.message.includes(
          'Cannot find context with specified id'
        );
        if (ctxDestroyed || ctxNotFound) {
          // Retry adding the binding in the next context
          await bind(name);
        } else {
          debugError(error);
          return;
        }
      }
      this._ctxBindings.add(name);
    };

    this._settingUpBinding = bind(name);
    try {
      await this._settingUpBinding;
    } finally {
      // Always release the slot; otherwise a rejected setup promise would be
      // awaited (and rethrown) by every later caller.
      this._settingUpBinding = null;
    }
  }

  /**
   * Remembers `puppeteerFunction` under `name` and registers the binding in
   * the current context.
   *
   * @internal
   */
  async addBinding(name: string, puppeteerFunction: Function): Promise<void> {
    this._boundFunctions.set(name, puppeteerFunction);
    await this.addBindingToContext(name);
  }

  /**
   * Handles `Runtime.bindingCalled`: runs the bound function for internal
   * bindings of this world's current context and delivers the result back
   * into the page.
   */
  private async _onBindingCalled(
    event: Protocol.Runtime.BindingCalledEvent
  ): Promise<void> {
    let payload: { type: string; name: string; seq: number; args: unknown[] };
    try {
      payload = JSON.parse(event.payload);
    } catch {
      // The payload is an arbitrary string chosen by whoever called the
      // binding; anything that is not JSON is not one of our internal calls.
      return;
    }
    // JSON such as `null` or `42` parses fine but cannot be destructured.
    if (!payload || typeof payload !== 'object') return;
    const { type, name, seq, args } = payload;
    if (type !== 'internal' || !this._ctxBindings.has(name)) return;
    if (!this._hasContext()) return;
    const context = await this.executionContext();
    if (context._contextId !== event.executionContextId) return;
    try {
      const result = await this._boundFunctions.get(name)(...args);
      await context.evaluate(deliverResult, name, seq, result);
    } catch (error) {
      // The WaitTask may already have been resolved by timing out, or the
      // execution context may have been destroyed.
      // In both cases, the promises above are rejected with a protocol error.
      // We can safely ignore these, as the WaitTask is re-installed in
      // the next execution context if needed.
      if (error.message.includes('Protocol error')) return;
      debugError(error);
    }
    // Evaluated in the page: resolves the pending callback for this call.
    function deliverResult(name: string, seq: number, result: unknown): void {
      globalThis[name].callbacks.get(seq).resolve(result);
      globalThis[name].callbacks.delete(seq);
    }
  }

  /**
   * Waits until `selector` matches (using `queryOne` as the in-page query
   * handler) and the match satisfies the visible/hidden options.
   *
   * @returns the element handle, or null when the wait resolved with a
   * non-element value.
   *
   * @internal
   */
  async waitForSelectorInPage(
    queryOne: Function,
    selector: string,
    options: WaitForSelectorOptions
  ): Promise<ElementHandle | null> {
    const {
      visible: waitForVisible = false,
      hidden: waitForHidden = false,
      timeout = this._timeoutSettings.timeout(),
    } = options;
    const polling = waitForVisible || waitForHidden ? 'raf' : 'mutation';
    const title = `selector \`${selector}\`${
      waitForHidden ? ' to be hidden' : ''
    }`;
    // Turned into a string by `helper.makePredicateString`, so it may only
    // reference its arguments and the names declared at the top of this file.
    async function predicate(
      selector: string,
      waitForVisible: boolean,
      waitForHidden: boolean
    ): Promise<Node | null | boolean> {
      const node = predicateQueryHandler
        ? ((await predicateQueryHandler(document, selector)) as Element)
        : document.querySelector(selector);
      return checkWaitForOptions(node, waitForVisible, waitForHidden);
    }
    const waitTask = new WaitTask(
      this,
      helper.makePredicateString(predicate, queryOne),
      title,
      polling,
      timeout,
      selector,
      waitForVisible,
      waitForHidden
    );
    const jsHandle = await waitTask.promise;
    const elementHandle = jsHandle.asElement();
    if (!elementHandle) {
      await jsHandle.dispose();
      return null;
    }
    return elementHandle;
  }

  /**
   * Waits until the XPath expression matches a node that satisfies the
   * visible/hidden options.
   *
   * @returns the element handle, or null when the wait resolved with a
   * non-element value.
   */
  async waitForXPath(
    xpath: string,
    options: WaitForSelectorOptions
  ): Promise<ElementHandle | null> {
    const {
      visible: waitForVisible = false,
      hidden: waitForHidden = false,
      timeout = this._timeoutSettings.timeout(),
    } = options;
    const polling = waitForVisible || waitForHidden ? 'raf' : 'mutation';
    const title = `XPath \`${xpath}\`${waitForHidden ? ' to be hidden' : ''}`;
    // Turned into a string by `helper.makePredicateString`.
    function predicate(
      xpath: string,
      waitForVisible: boolean,
      waitForHidden: boolean
    ): Node | null | boolean {
      const node = document.evaluate(
        xpath,
        document,
        null,
        XPathResult.FIRST_ORDERED_NODE_TYPE,
        null
      ).singleNodeValue;
      return checkWaitForOptions(node, waitForVisible, waitForHidden);
    }
    const waitTask = new WaitTask(
      this,
      helper.makePredicateString(predicate),
      title,
      polling,
      timeout,
      xpath,
      waitForVisible,
      waitForHidden
    );
    const jsHandle = await waitTask.promise;
    const elementHandle = jsHandle.asElement();
    if (!elementHandle) {
      await jsHandle.dispose();
      return null;
    }
    return elementHandle;
  }

  /**
   * Waits until `pageFunction` returns a truthy value in the page.
   * Defaults: `raf` polling and the world's default timeout.
   */
  waitForFunction(
    pageFunction: Function | string,
    options: { polling?: string | number; timeout?: number } = {},
    ...args: SerializableOrJSHandle[]
  ): Promise<JSHandle> {
    const {
      polling = 'raf',
      timeout = this._timeoutSettings.timeout(),
    } = options;
    return new WaitTask(
      this,
      pageFunction,
      'function',
      polling,
      timeout,
      ...args
    ).promise;
  }

  /** Returns `document.title` of the page. */
  async title(): Promise<string> {
    return this.evaluate(() => document.title);
  }
}

/**
 * A single pending wait. It evaluates the predicate in the page through
 * `waitForPredicatePageFunction`, is rerun by the DOMWorld whenever a new
 * execution context is set, and tracks its own timeout on the Node side.
 *
 * @internal
 */
export class WaitTask {
  _domWorld: DOMWorld;
  _polling: string | number;
  _timeout: number;
  _predicateBody: string;
  _args: SerializableOrJSHandle[];
  // Incremented on every rerun so that stale runs can detect they were superseded.
  _runCount = 0;
  promise: Promise<JSHandle>;
  _resolve: (x: JSHandle) => void;
  _reject: (x: Error) => void;
  _timeoutTimer?: NodeJS.Timeout;
  _terminated = false;

  /**
   * @param polling - `'raf'`, `'mutation'` or a positive interval in ms.
   * @param timeout - milliseconds; a falsy value disables the timeout timer.
   * @throws when `polling` is not one of the accepted values.
   */
  constructor(
    domWorld: DOMWorld,
    predicateBody: Function | string,
    title: string,
    polling: string | number,
    timeout: number,
    ...args: SerializableOrJSHandle[]
  ) {
    if (helper.isString(polling))
      assert(
        polling === 'raf' || polling === 'mutation',
        'Unknown polling option: ' + polling
      );
    else if (helper.isNumber(polling))
      assert(polling > 0, 'Cannot poll with non-positive interval: ' + polling);
    else throw new Error('Unknown polling options: ' + polling);

    // A string predicate is treated as an expression; a function is called
    // with the task's arguments.
    function getPredicateBody(predicateBody: Function | string) {
      if (helper.isString(predicateBody)) return `return (${predicateBody});`;
      return `return (${predicateBody})(...args);`;
    }

    this._domWorld = domWorld;
    this._polling = polling;
    this._timeout = timeout;
    this._predicateBody = getPredicateBody(predicateBody);
    this._args = args;
    this._runCount = 0;
    domWorld._waitTasks.add(this);
    this.promise = new Promise<JSHandle>((resolve, reject) => {
      this._resolve = resolve;
      this._reject = reject;
    });
    // Since page navigation requires us to re-install the pageScript, we should track
    // timeout on our end.
    if (timeout) {
      const timeoutError = new TimeoutError(
        `waiting for ${title} failed: timeout ${timeout}ms exceeded`
      );
      this._timeoutTimer = setTimeout(
        () => this.terminate(timeoutError),
        timeout
      );
    }
    this.rerun();
  }

  /** Rejects the task with `error` and unregisters it. */
  terminate(error: Error): void {
    this._terminated = true;
    this._reject(error);
    this._cleanup();
  }

  /**
   * Evaluates the predicate in the current execution context and settles the
   * task, unless the run was superseded, the task was terminated, or the
   * context went away (in which case a later rerun is expected).
   */
  async rerun(): Promise<void> {
    const runCount = ++this._runCount;
    let success: JSHandle | null = null;
    let error: Error | null = null;
    try {
      success = await (await this._domWorld.executionContext()).evaluateHandle(
        waitForPredicatePageFunction,
        this._predicateBody,
        this._polling,
        this._timeout,
        ...this._args
      );
    } catch (error_) {
      error = error_;
    }

    // A newer run (or termination) owns the outcome; just release the handle.
    if (this._terminated || runCount !== this._runCount) {
      if (success) await success.dispose();
      return;
    }

    // Ignore timeouts in pageScript - we track timeouts ourselves.
    // If the frame's execution context has already changed, `frame.evaluate` will
    // throw an error - ignore this predicate run altogether.
    if (
      !error &&
      (await this._domWorld.evaluate((s) => !s, success).catch(() => true))
    ) {
      await success.dispose();
      return;
    }

    // When frame is detached the task should have been terminated by the DOMWorld.
    // This can fail if we were adding this task while the frame was detached,
    // so we terminate here instead.
    if (error) {
      if (
        error.message.includes(
          'Execution context is not available in detached frame'
        )
      ) {
        this.terminate(
          new Error('waitForFunction failed: frame got detached.')
        );
        return;
      }

      // When the page is navigated, the promise is rejected.
      // We will try again in the new execution context.
      if (error.message.includes('Execution context was destroyed')) return;

      // We could have tried to evaluate in a context which was already
      // destroyed.
      if (error.message.includes('Cannot find context with specified id'))
        return;

      this._reject(error);
    } else {
      this._resolve(success);
    }

    this._cleanup();
  }

  /** Clears the timeout timer and removes the task from its DOMWorld. */
  _cleanup(): void {
    clearTimeout(this._timeoutTimer);
    this._domWorld._waitTasks.delete(this);
  }
}

/**
 * Polls a predicate until it returns a truthy value or the timeout elapses.
 * WaitTask passes this function to `evaluateHandle`, so it must stay
 * self-contained: it may only use its arguments and page globals.
 *
 * @param predicateBody - function body compiled with `new Function('...args', body)`.
 * @param polling - `'raf'`, `'mutation'` or an interval in milliseconds.
 * @param timeout - milliseconds; a falsy value means no timeout.
 * @returns the truthy predicate result, or undefined on timeout or when
 * `polling` is not recognised.
 */
async function waitForPredicatePageFunction(
  predicateBody: string,
  polling: string | number,
  timeout: number,
  ...args: unknown[]
): Promise<unknown> {
  const predicate = new Function('...args', predicateBody);
  let timedOut = false;
  if (timeout) setTimeout(() => (timedOut = true), timeout);
  if (polling === 'raf') return await pollRaf();
  if (polling === 'mutation') return await pollMutation();
  if (typeof polling === 'number') return await pollInterval(polling);

  // Re-evaluates the predicate on every observed DOM mutation.
  async function pollMutation(): Promise<unknown> {
    const success = await predicate(...args);
    if (success) return Promise.resolve(success);

    let fulfill;
    const result = new Promise((x) => (fulfill = x));
    const observer = new MutationObserver(async () => {
      if (timedOut) {
        observer.disconnect();
        fulfill();
        // The wait is over: do not evaluate the predicate again.
        return;
      }
      const success = await predicate(...args);
      if (success) {
        observer.disconnect();
        fulfill(success);
      }
    });
    observer.observe(document, {
      childList: true,
      subtree: true,
      attributes: true,
    });
    return result;
  }

  // Re-evaluates the predicate once per animation frame.
  async function pollRaf(): Promise<unknown> {
    let fulfill;
    const result = new Promise((x) => (fulfill = x));
    await onRaf();
    return result;

    async function onRaf(): Promise<unknown> {
      if (timedOut) {
        fulfill();
        return;
      }
      const success = await predicate(...args);
      if (success) fulfill(success);
      else requestAnimationFrame(onRaf);
    }
  }

  // Re-evaluates the predicate every `pollInterval` milliseconds.
  async function pollInterval(pollInterval: number): Promise<unknown> {
    let fulfill;
    const result = new Promise((x) => (fulfill = x));
    await onTimeout();
    return result;

    async function onTimeout(): Promise<unknown> {
      if (timedOut) {
        fulfill();
        return;
      }
      const success = await predicate(...args);
      if (success) fulfill(success);
      else setTimeout(onTimeout, pollInterval);
    }
  }
}