mirror of
https://github.com/puppeteer/puppeteer
synced 2024-06-14 14:02:48 +00:00
517 lines
18 KiB
TypeScript
517 lines
18 KiB
TypeScript
/**
|
|
* Copyright 2017 Google Inc. All rights reserved.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
import * as EventEmitter from 'events';
|
|
import {helper, assert, debugError} from './helper';
|
|
import {Events} from './Events';
|
|
import {ExecutionContext, EVALUATION_SCRIPT_URL} from './ExecutionContext';
|
|
import {LifecycleWatcher, PuppeteerLifeCycleEvent} from './LifecycleWatcher';
|
|
import {DOMWorld, WaitForSelectorOptions} from './DOMWorld';
|
|
import {NetworkManager} from './NetworkManager';
|
|
import {TimeoutSettings} from './TimeoutSettings';
|
|
import {CDPSession} from './Connection';
|
|
import {JSHandle, ElementHandle} from './JSHandle';
|
|
import {MouseButtonInput} from './Input';
|
|
|
|
const UTILITY_WORLD_NAME = '__puppeteer_utility_world__';
|
|
|
|
export class FrameManager extends EventEmitter {
|
|
_client: CDPSession;
|
|
_page: Puppeteer.Page;
|
|
_networkManager: Puppeteer.NetworkManager;
|
|
_timeoutSettings: TimeoutSettings;
|
|
_frames = new Map<string, Frame>();
|
|
_contextIdToContext = new Map<number, ExecutionContext>();
|
|
_isolatedWorlds = new Set<string>();
|
|
_mainFrame: Frame;
|
|
|
|
constructor(client: CDPSession, page: Puppeteer.Page, ignoreHTTPSErrors: boolean, timeoutSettings: TimeoutSettings) {
|
|
super();
|
|
this._client = client;
|
|
this._page = page;
|
|
this._networkManager = new NetworkManager(client, ignoreHTTPSErrors, this);
|
|
this._timeoutSettings = timeoutSettings;
|
|
this._client.on('Page.frameAttached', event => this._onFrameAttached(event.frameId, event.parentFrameId));
|
|
this._client.on('Page.frameNavigated', event => this._onFrameNavigated(event.frame));
|
|
this._client.on('Page.navigatedWithinDocument', event => this._onFrameNavigatedWithinDocument(event.frameId, event.url));
|
|
this._client.on('Page.frameDetached', event => this._onFrameDetached(event.frameId));
|
|
this._client.on('Page.frameStoppedLoading', event => this._onFrameStoppedLoading(event.frameId));
|
|
this._client.on('Runtime.executionContextCreated', event => this._onExecutionContextCreated(event.context));
|
|
this._client.on('Runtime.executionContextDestroyed', event => this._onExecutionContextDestroyed(event.executionContextId));
|
|
this._client.on('Runtime.executionContextsCleared', () => this._onExecutionContextsCleared());
|
|
this._client.on('Page.lifecycleEvent', event => this._onLifecycleEvent(event));
|
|
}
|
|
|
|
async initialize(): Promise<void> {
|
|
const result = await Promise.all<Protocol.Page.enableReturnValue, Protocol.Page.getFrameTreeReturnValue>([
|
|
this._client.send('Page.enable'),
|
|
this._client.send('Page.getFrameTree'),
|
|
]);
|
|
|
|
const {frameTree} = result[1];
|
|
this._handleFrameTree(frameTree);
|
|
await Promise.all([
|
|
this._client.send('Page.setLifecycleEventsEnabled', {enabled: true}),
|
|
this._client.send('Runtime.enable', {}).then(() => this._ensureIsolatedWorld(UTILITY_WORLD_NAME)),
|
|
this._networkManager.initialize(),
|
|
]);
|
|
}
|
|
|
|
networkManager(): Puppeteer.NetworkManager {
|
|
return this._networkManager;
|
|
}
|
|
|
|
async navigateFrame(frame: Frame, url: string, options: {referer?: string; timeout?: number; waitUntil?: PuppeteerLifeCycleEvent|PuppeteerLifeCycleEvent[]} = {}): Promise<Puppeteer.Response | null> {
|
|
assertNoLegacyNavigationOptions(options);
|
|
const {
|
|
referer = this._networkManager.extraHTTPHeaders()['referer'],
|
|
waitUntil = ['load'],
|
|
timeout = this._timeoutSettings.navigationTimeout(),
|
|
} = options;
|
|
|
|
const watcher = new LifecycleWatcher(this, frame, waitUntil, timeout);
|
|
let ensureNewDocumentNavigation = false;
|
|
let error = await Promise.race([
|
|
navigate(this._client, url, referer, frame._id),
|
|
watcher.timeoutOrTerminationPromise(),
|
|
]);
|
|
if (!error) {
|
|
error = await Promise.race([
|
|
watcher.timeoutOrTerminationPromise(),
|
|
ensureNewDocumentNavigation ? watcher.newDocumentNavigationPromise() : watcher.sameDocumentNavigationPromise(),
|
|
]);
|
|
}
|
|
watcher.dispose();
|
|
if (error)
|
|
throw error;
|
|
return watcher.navigationResponse();
|
|
|
|
async function navigate(client: CDPSession, url: string, referrer: string, frameId: string): Promise<Error | null> {
|
|
try {
|
|
const response = await client.send('Page.navigate', {url, referrer, frameId});
|
|
ensureNewDocumentNavigation = !!response.loaderId;
|
|
return response.errorText ? new Error(`${response.errorText} at ${url}`) : null;
|
|
} catch (error) {
|
|
return error;
|
|
}
|
|
}
|
|
}
|
|
|
|
async waitForFrameNavigation(frame: Frame, options: {timeout?: number; waitUntil?: PuppeteerLifeCycleEvent|PuppeteerLifeCycleEvent[]} = {}): Promise<Puppeteer.Response | null> {
|
|
assertNoLegacyNavigationOptions(options);
|
|
const {
|
|
waitUntil = ['load'],
|
|
timeout = this._timeoutSettings.navigationTimeout(),
|
|
} = options;
|
|
const watcher = new LifecycleWatcher(this, frame, waitUntil, timeout);
|
|
const error = await Promise.race([
|
|
watcher.timeoutOrTerminationPromise(),
|
|
watcher.sameDocumentNavigationPromise(),
|
|
watcher.newDocumentNavigationPromise()
|
|
]);
|
|
watcher.dispose();
|
|
if (error)
|
|
throw error;
|
|
return watcher.navigationResponse();
|
|
}
|
|
|
|
_onLifecycleEvent(event: Protocol.Page.lifecycleEventPayload): void {
|
|
const frame = this._frames.get(event.frameId);
|
|
if (!frame)
|
|
return;
|
|
frame._onLifecycleEvent(event.loaderId, event.name);
|
|
this.emit(Events.FrameManager.LifecycleEvent, frame);
|
|
}
|
|
|
|
_onFrameStoppedLoading(frameId: string): void {
|
|
const frame = this._frames.get(frameId);
|
|
if (!frame)
|
|
return;
|
|
frame._onLoadingStopped();
|
|
this.emit(Events.FrameManager.LifecycleEvent, frame);
|
|
}
|
|
|
|
_handleFrameTree(frameTree: Protocol.Page.FrameTree): void {
|
|
if (frameTree.frame.parentId)
|
|
this._onFrameAttached(frameTree.frame.id, frameTree.frame.parentId);
|
|
this._onFrameNavigated(frameTree.frame);
|
|
if (!frameTree.childFrames)
|
|
return;
|
|
|
|
for (const child of frameTree.childFrames)
|
|
this._handleFrameTree(child);
|
|
}
|
|
|
|
page(): Puppeteer.Page {
|
|
return this._page;
|
|
}
|
|
|
|
mainFrame(): Frame {
|
|
return this._mainFrame;
|
|
}
|
|
|
|
frames(): Frame[] {
|
|
return Array.from(this._frames.values());
|
|
}
|
|
|
|
frame(frameId: string): Frame | null {
|
|
return this._frames.get(frameId) || null;
|
|
}
|
|
|
|
_onFrameAttached(frameId: string, parentFrameId?: string): void {
|
|
if (this._frames.has(frameId))
|
|
return;
|
|
assert(parentFrameId);
|
|
const parentFrame = this._frames.get(parentFrameId);
|
|
const frame = new Frame(this, this._client, parentFrame, frameId);
|
|
this._frames.set(frame._id, frame);
|
|
this.emit(Events.FrameManager.FrameAttached, frame);
|
|
}
|
|
|
|
_onFrameNavigated(framePayload: Protocol.Page.Frame): void {
|
|
const isMainFrame = !framePayload.parentId;
|
|
let frame = isMainFrame ? this._mainFrame : this._frames.get(framePayload.id);
|
|
assert(isMainFrame || frame, 'We either navigate top level or have old version of the navigated frame');
|
|
|
|
// Detach all child frames first.
|
|
if (frame) {
|
|
for (const child of frame.childFrames())
|
|
this._removeFramesRecursively(child);
|
|
}
|
|
|
|
// Update or create main frame.
|
|
if (isMainFrame) {
|
|
if (frame) {
|
|
// Update frame id to retain frame identity on cross-process navigation.
|
|
this._frames.delete(frame._id);
|
|
frame._id = framePayload.id;
|
|
} else {
|
|
// Initial main frame navigation.
|
|
frame = new Frame(this, this._client, null, framePayload.id);
|
|
}
|
|
this._frames.set(framePayload.id, frame);
|
|
this._mainFrame = frame;
|
|
}
|
|
|
|
// Update frame payload.
|
|
frame._navigated(framePayload);
|
|
|
|
this.emit(Events.FrameManager.FrameNavigated, frame);
|
|
}
|
|
|
|
async _ensureIsolatedWorld(name: string): Promise<void> {
|
|
if (this._isolatedWorlds.has(name))
|
|
return;
|
|
this._isolatedWorlds.add(name);
|
|
await this._client.send('Page.addScriptToEvaluateOnNewDocument', {
|
|
source: `//# sourceURL=${EVALUATION_SCRIPT_URL}`,
|
|
worldName: name,
|
|
}),
|
|
await Promise.all(this.frames().map(frame => this._client.send('Page.createIsolatedWorld', {
|
|
frameId: frame._id,
|
|
grantUniveralAccess: true,
|
|
worldName: name,
|
|
}).catch(debugError))); // frames might be removed before we send this
|
|
}
|
|
|
|
_onFrameNavigatedWithinDocument(frameId: string, url: string): void {
|
|
const frame = this._frames.get(frameId);
|
|
if (!frame)
|
|
return;
|
|
frame._navigatedWithinDocument(url);
|
|
this.emit(Events.FrameManager.FrameNavigatedWithinDocument, frame);
|
|
this.emit(Events.FrameManager.FrameNavigated, frame);
|
|
}
|
|
|
|
_onFrameDetached(frameId: string): void {
|
|
const frame = this._frames.get(frameId);
|
|
if (frame)
|
|
this._removeFramesRecursively(frame);
|
|
}
|
|
|
|
_onExecutionContextCreated(contextPayload: Protocol.Runtime.ExecutionContextDescription): void {
|
|
const auxData = contextPayload.auxData as { frameId?: string};
|
|
const frameId = auxData ? auxData.frameId : null;
|
|
const frame = this._frames.get(frameId) || null;
|
|
let world = null;
|
|
if (frame) {
|
|
if (contextPayload.auxData && !!contextPayload.auxData['isDefault']) {
|
|
world = frame._mainWorld;
|
|
} else if (contextPayload.name === UTILITY_WORLD_NAME && !frame._secondaryWorld._hasContext()) {
|
|
// In case of multiple sessions to the same target, there's a race between
|
|
// connections so we might end up creating multiple isolated worlds.
|
|
// We can use either.
|
|
world = frame._secondaryWorld;
|
|
}
|
|
}
|
|
if (contextPayload.auxData && contextPayload.auxData['type'] === 'isolated')
|
|
this._isolatedWorlds.add(contextPayload.name);
|
|
const context = new ExecutionContext(this._client, contextPayload, world);
|
|
if (world)
|
|
world._setContext(context);
|
|
this._contextIdToContext.set(contextPayload.id, context);
|
|
}
|
|
|
|
/**
|
|
* @param {number} executionContextId
|
|
*/
|
|
_onExecutionContextDestroyed(executionContextId: number): void {
|
|
const context = this._contextIdToContext.get(executionContextId);
|
|
if (!context)
|
|
return;
|
|
this._contextIdToContext.delete(executionContextId);
|
|
if (context._world)
|
|
context._world._setContext(null);
|
|
}
|
|
|
|
_onExecutionContextsCleared(): void {
|
|
for (const context of this._contextIdToContext.values()) {
|
|
if (context._world)
|
|
context._world._setContext(null);
|
|
}
|
|
this._contextIdToContext.clear();
|
|
}
|
|
|
|
executionContextById(contextId: number): ExecutionContext {
|
|
const context = this._contextIdToContext.get(contextId);
|
|
assert(context, 'INTERNAL ERROR: missing context with id = ' + contextId);
|
|
return context;
|
|
}
|
|
|
|
_removeFramesRecursively(frame: Frame): void {
|
|
for (const child of frame.childFrames())
|
|
this._removeFramesRecursively(child);
|
|
frame._detach();
|
|
this._frames.delete(frame._id);
|
|
this.emit(Events.FrameManager.FrameDetached, frame);
|
|
}
|
|
}
|
|
|
|
export class Frame {
|
|
_frameManager: FrameManager;
|
|
_client: CDPSession;
|
|
_parentFrame?: Frame;
|
|
_id: string;
|
|
|
|
_url = '';
|
|
_detached = false;
|
|
_loaderId = '';
|
|
_name?: string;
|
|
|
|
_lifecycleEvents = new Set<string>();
|
|
_mainWorld: DOMWorld;
|
|
_secondaryWorld: DOMWorld;
|
|
_childFrames: Set<Frame>;
|
|
|
|
constructor(frameManager: FrameManager, client: CDPSession, parentFrame: Frame | null, frameId: string) {
|
|
this._frameManager = frameManager;
|
|
this._client = client;
|
|
this._parentFrame = parentFrame;
|
|
this._url = '';
|
|
this._id = frameId;
|
|
this._detached = false;
|
|
|
|
this._loaderId = '';
|
|
this._mainWorld = new DOMWorld(frameManager, this, frameManager._timeoutSettings);
|
|
this._secondaryWorld = new DOMWorld(frameManager, this, frameManager._timeoutSettings);
|
|
|
|
this._childFrames = new Set();
|
|
if (this._parentFrame)
|
|
this._parentFrame._childFrames.add(this);
|
|
}
|
|
|
|
async goto(url: string, options: {referer?: string; timeout?: number; waitUntil?: PuppeteerLifeCycleEvent | PuppeteerLifeCycleEvent[]}): Promise<Puppeteer.Response | null> {
|
|
return await this._frameManager.navigateFrame(this, url, options);
|
|
}
|
|
|
|
async waitForNavigation(options: {timeout?: number; waitUntil?: PuppeteerLifeCycleEvent|PuppeteerLifeCycleEvent[]}): Promise<Puppeteer.Response | null> {
|
|
return await this._frameManager.waitForFrameNavigation(this, options);
|
|
}
|
|
|
|
executionContext(): Promise<ExecutionContext> {
|
|
return this._mainWorld.executionContext();
|
|
}
|
|
|
|
async evaluateHandle(pageFunction: Function|string, ...args: unknown[]): Promise<JSHandle> {
|
|
return this._mainWorld.evaluateHandle(pageFunction, ...args);
|
|
}
|
|
|
|
async evaluate<ReturnType extends any>(pageFunction: Function|string, ...args: unknown[]): Promise<ReturnType> {
|
|
return this._mainWorld.evaluate<ReturnType>(pageFunction, ...args);
|
|
}
|
|
|
|
async $(selector: string): Promise<ElementHandle | null> {
|
|
return this._mainWorld.$(selector);
|
|
}
|
|
|
|
async $x(expression: string): Promise<ElementHandle[]> {
|
|
return this._mainWorld.$x(expression);
|
|
}
|
|
|
|
async $eval<ReturnType extends any>(selector: string, pageFunction: Function | string, ...args: unknown[]): Promise<ReturnType> {
|
|
return this._mainWorld.$eval<ReturnType>(selector, pageFunction, ...args);
|
|
}
|
|
|
|
async $$eval<ReturnType extends any>(selector: string, pageFunction: Function | string, ...args: unknown[]): Promise<ReturnType> {
|
|
return this._mainWorld.$$eval<ReturnType>(selector, pageFunction, ...args);
|
|
}
|
|
|
|
async $$(selector: string): Promise<ElementHandle[]> {
|
|
return this._mainWorld.$$(selector);
|
|
}
|
|
|
|
async content(): Promise<string> {
|
|
return this._secondaryWorld.content();
|
|
}
|
|
|
|
async setContent(html: string, options: {timeout?: number; waitUntil?: PuppeteerLifeCycleEvent|PuppeteerLifeCycleEvent[]} = {}): Promise<void> {
|
|
return this._secondaryWorld.setContent(html, options);
|
|
}
|
|
|
|
name(): string {
|
|
return this._name || '';
|
|
}
|
|
|
|
url(): string {
|
|
return this._url;
|
|
}
|
|
|
|
parentFrame(): Frame | null {
|
|
return this._parentFrame;
|
|
}
|
|
|
|
childFrames(): Frame[] {
|
|
return Array.from(this._childFrames);
|
|
}
|
|
|
|
isDetached(): boolean {
|
|
return this._detached;
|
|
}
|
|
|
|
async addScriptTag(options: {url?: string; path?: string; content?: string; type?: string}): Promise<ElementHandle> {
|
|
return this._mainWorld.addScriptTag(options);
|
|
}
|
|
|
|
async addStyleTag(options: {url?: string; path?: string; content?: string}): Promise<ElementHandle> {
|
|
return this._mainWorld.addStyleTag(options);
|
|
}
|
|
|
|
async click(selector: string, options: {delay?: number; button?: MouseButtonInput; clickCount?: number}): Promise<void> {
|
|
return this._secondaryWorld.click(selector, options);
|
|
}
|
|
|
|
async focus(selector: string): Promise<void> {
|
|
return this._secondaryWorld.focus(selector);
|
|
}
|
|
|
|
async hover(selector: string): Promise<void> {
|
|
return this._secondaryWorld.hover(selector);
|
|
}
|
|
|
|
select(selector: string, ...values: string[]): Promise<string[]> {
|
|
return this._secondaryWorld.select(selector, ...values);
|
|
}
|
|
|
|
async tap(selector: string): Promise<void> {
|
|
return this._secondaryWorld.tap(selector);
|
|
}
|
|
|
|
async type(selector: string, text: string, options?: {delay: number}): Promise<void> {
|
|
return this._mainWorld.type(selector, text, options);
|
|
}
|
|
|
|
waitFor(selectorOrFunctionOrTimeout: string|number|Function, options: {} = {}, ...args: unknown[]): Promise<JSHandle | null> {
|
|
const xPathPattern = '//';
|
|
|
|
if (helper.isString(selectorOrFunctionOrTimeout)) {
|
|
const string = selectorOrFunctionOrTimeout;
|
|
if (string.startsWith(xPathPattern))
|
|
return this.waitForXPath(string, options);
|
|
return this.waitForSelector(string, options);
|
|
}
|
|
if (helper.isNumber(selectorOrFunctionOrTimeout))
|
|
return new Promise(fulfill => setTimeout(fulfill, selectorOrFunctionOrTimeout));
|
|
if (typeof selectorOrFunctionOrTimeout === 'function')
|
|
return this.waitForFunction(selectorOrFunctionOrTimeout, options, ...args);
|
|
return Promise.reject(new Error('Unsupported target type: ' + (typeof selectorOrFunctionOrTimeout)));
|
|
}
|
|
|
|
async waitForSelector(selector: string, options: WaitForSelectorOptions): Promise<ElementHandle | null> {
|
|
const handle = await this._secondaryWorld.waitForSelector(selector, options);
|
|
if (!handle)
|
|
return null;
|
|
const mainExecutionContext = await this._mainWorld.executionContext();
|
|
const result = await mainExecutionContext._adoptElementHandle(handle);
|
|
await handle.dispose();
|
|
return result;
|
|
}
|
|
|
|
async waitForXPath(xpath: string, options: WaitForSelectorOptions): Promise<ElementHandle | null> {
|
|
const handle = await this._secondaryWorld.waitForXPath(xpath, options);
|
|
if (!handle)
|
|
return null;
|
|
const mainExecutionContext = await this._mainWorld.executionContext();
|
|
const result = await mainExecutionContext._adoptElementHandle(handle);
|
|
await handle.dispose();
|
|
return result;
|
|
}
|
|
|
|
waitForFunction(pageFunction: Function|string, options: {polling?: string|number; timeout?: number} = {}, ...args: unknown[]): Promise<JSHandle> {
|
|
return this._mainWorld.waitForFunction(pageFunction, options, ...args);
|
|
}
|
|
|
|
async title(): Promise<string> {
|
|
return this._secondaryWorld.title();
|
|
}
|
|
|
|
_navigated(framePayload: Protocol.Page.Frame): void {
|
|
this._name = framePayload.name;
|
|
this._url = framePayload.url;
|
|
}
|
|
|
|
_navigatedWithinDocument(url: string): void {
|
|
this._url = url;
|
|
}
|
|
|
|
_onLifecycleEvent(loaderId: string, name: string): void {
|
|
if (name === 'init') {
|
|
this._loaderId = loaderId;
|
|
this._lifecycleEvents.clear();
|
|
}
|
|
this._lifecycleEvents.add(name);
|
|
}
|
|
|
|
_onLoadingStopped(): void {
|
|
this._lifecycleEvents.add('DOMContentLoaded');
|
|
this._lifecycleEvents.add('load');
|
|
}
|
|
|
|
_detach(): void {
|
|
this._detached = true;
|
|
this._mainWorld._detach();
|
|
this._secondaryWorld._detach();
|
|
if (this._parentFrame)
|
|
this._parentFrame._childFrames.delete(this);
|
|
this._parentFrame = null;
|
|
}
|
|
}
|
|
|
|
function assertNoLegacyNavigationOptions(options: {[optionName: string]: unknown}): void {
|
|
assert(options['networkIdleTimeout'] === undefined, 'ERROR: networkIdleTimeout option is no longer supported.');
|
|
assert(options['networkIdleInflight'] === undefined, 'ERROR: networkIdleInflight option is no longer supported.');
|
|
assert(options.waitUntil !== 'networkidle', 'ERROR: "networkidle" option is no longer supported. Use "networkidle2" instead');
|
|
}
|