apify · nikitachapovskii-dev · Apr 28, 2026 · Apr 22, 2026 · Apr 24, 2026 · Apr 27, 2026
diff --git a/packages/playwright-crawler/src/internals/playwright-crawler.ts b/packages/playwright-crawler/src/internals/playwright-crawler.ts
@@ -8,7 +8,7 @@ import type {
     RouterRoutes,
 } from '@crawlee/browser';
 import { BrowserCrawler, Configuration, Router } from '@crawlee/browser';
-import type { BrowserPoolOptions, PlaywrightController, PlaywrightPlugin } from '@crawlee/browser-pool';
+import type { BrowserPoolOptions, CommonPage, PlaywrightController, PlaywrightPlugin } from '@crawlee/browser-pool';
 import type { Dictionary } from '@crawlee/types';
 import ow from 'ow';
 import type { LaunchOptions, Page, Response } from 'playwright';
@@ -238,6 +238,15 @@ export class PlaywrightCrawler extends BrowserCrawler<
         super({ ...browserCrawlerOptions, launchContext, browserPoolOptions }, config);
     }
 
+    protected override _enhanceCrawlingContextWithPageInfo( // base page setup, plus download capture
+        crawlingContext: PlaywrightCrawlingContext, // its `downloads` array collects this page's Download objects
+        page: CommonPage, // treated as a Playwright `Page` below to subscribe to 'download'
+        createNewSession?: boolean, // passed through unchanged to the base implementation
+    ): void { // NOTE(review): assumes `downloads` is already an array when the event fires — confirm
+        super._enhanceCrawlingContextWithPageInfo(crawlingContext, page, createNewSession);
+        (page as Page).on('download', (download) => crawlingContext.downloads.push(download));
+    }
+
     protected override async _runRequestHandler(context: PlaywrightCrawlingContext) {
         registerUtilsToContext(context, this.options);
         await super._runRequestHandler(context);

diff --git a/packages/playwright-crawler/src/internals/utils/playwright-utils.ts b/packages/playwright-crawler/src/internals/utils/playwright-utils.ts
@@ -34,7 +34,7 @@ import type { BatchAddRequestsResult } from '@crawlee/types';
 import { type CheerioRoot, type Dictionary, expandShadowRoots, sleep } from '@crawlee/utils';
 import * as cheerio from 'cheerio';
 import ow from 'ow';
-import type { Page, Response, Route } from 'playwright';
+import type { Download, Page, Response, Route } from 'playwright';
 
 import { LruCache } from '@apify/datastructures';
 import log_ from '@apify/log';
@@ -1062,12 +1062,40 @@ export interface PlaywrightContextUtils {
      * @param [options]
      */
     handleCloudflareChallenge(options?: HandleCloudflareChallengeOptions): Promise<void>;
+
+    /**
+     * A list of {@link https://playwright.dev/docs/api/class-download | Download} objects
+     * emitted by the current page's `download` event, e.g. when a navigation starts a file download.
+     *
+     * Playwright intercepts downloads before they complete, so the objects are available
+     * as soon as the browser starts the download — including inside `errorHandler` when
+     * `page.goto` throws `"Download is starting"`.
+     *
+     * > **Note:** Playwright saves download data to a temporary file on disk. For very large
+     * > files this may be a concern; prefer re-enqueueing the URL to a streaming downloader
+     * > when file size is unpredictable.
 const browserContext = await this.library 
     .launchPersistentContext(userDataDir, launchOptions) 
     .catch((error) => { 
         return this._throwOnFailedLaunch(launchContext, error); 
     }); 
 if (this.launchContext.useIncognitoPages) { 
     // Each page requires to have all the context options applied 
     contextOptions = { 
         ...this.launchContext.launchOptions, 
         ...contextOptions, 
     }; 
 const browserContext = await this.library 
     .launchPersistentContext(userDataDir, launchOptions) 
     .catch((error) => { 
         return this._throwOnFailedLaunch(launchContext, error); 
     }); 
 if (this.launchContext.useIncognitoPages) { 
     // Each page requires to have all the context options applied 
     contextOptions = { 
         ...this.launchContext.launchOptions, 
         ...contextOptions, 
     }; 
+     *
+     * **Example usage**
+     * ```ts
+     * errorHandler: async ({ downloads, request }, error) => {
+     *     if (error.message.includes('Download is starting')) {
+     *         for (const download of downloads) {
+     *             const stream = await download.createReadStream();
+     *             // stream to storage...
+     *         }
+     *     }
+     * },
+     * ```
+     */
+    downloads: Download[];
 }
 
 export function registerUtilsToContext(
     context: PlaywrightCrawlingContext,
     crawlerOptions: PlaywrightCrawlerOptions,
 ): void {
+    context.downloads = [];
+
     context.injectFile = async (filePath: string, options?: InjectFileOptions) =>
         injectFile(context.page, filePath, options);
     context.injectJQuery = async () => {