From ff4cabcb0323ce677e117d5f4e903242cc6e4c0e Mon Sep 17 00:00:00 2001
From: "stainless-app[bot]"
 <142633134+stainless-app[bot]@users.noreply.github.com>
Date: Sun, 7 Jun 2026 22:02:57 +0000
Subject: [PATCH 1/2] feat(api): api update

---
 .stats.yml                                   |  4 +-
 packages/mcp-server/src/local-docs-search.ts | 12 ++++--
 src/resources/web.ts                         | 43 ++++++++++++++++++++
 tests/api-resources/web.test.ts              |  6 +++
 4 files changed, 60 insertions(+), 5 deletions(-)

diff --git a/.stats.yml b/.stats.yml
index 27382d2..f1634d6 100644
--- a/.stats.yml
+++ b/.stats.yml
@@ -1,4 +1,4 @@
 configured_endpoints: 25
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/context-dev/context.dev-de0ba2ed18ec7265b0b20d9639b3da207dd33e354f0a856091902291c6661830.yml
-openapi_spec_hash: ae25efc2ac6bcab54bc3f4efaab73a55
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/context-dev/context.dev-8f6bc62256b5a4aa44e82389bfefee1d73172856c407567bba11a82fd4203641.yml
+openapi_spec_hash: 8b7230de56ecbec4712fa1e81067a75c
 config_hash: f86a4e06ae5ed725aa79d58d7a8dc27c
diff --git a/packages/mcp-server/src/local-docs-search.ts b/packages/mcp-server/src/local-docs-search.ts
index ff0dac0..92cd926 100644
--- a/packages/mcp-server/src/local-docs-search.ts
+++ b/packages/mcp-server/src/local-docs-search.ts
@@ -60,8 +60,10 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     qualified: 'client.web.webScrapeHTML',
     params: [
       'url: string;',
+      'excludeSelectors?: string[];',
       'headers?: object;',
       'includeFrames?: boolean;',
+      'includeSelectors?: string[];',
       'maxAgeMs?: number;',
       'pdf?: { end?: number; shouldParse?: boolean; start?: number; };',
       'timeoutMS?: number;',
@@ -70,7 +72,7 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     response:
       "{ html: string; success: true; type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'; url: string; }",
     markdown:
-      "## web_scrape_html\n\n`client.web.webScrapeHTML(url: string, headers?: object, includeFrames?: boolean, maxAgeMs?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, timeoutMS?: number, waitForMs?: number): { html: string; success: true; type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'; url: string; }`\n\n**get** `/web/scrape/html`\n\nScrapes the given URL and returns the raw HTML content of the page.\n\n### Parameters\n\n- `url: string`\n  Full URL to scrape (must include http:// or https:// protocol)\n\n- `headers?: object`\n  Optional outbound HTTP headers forwarded only to the target URL, sent as deep-object query params such as headers[X-Custom]=value. When provided, caching is bypassed: the result is neither read from nor written to cache.\n\n- `includeFrames?: boolean`\n  When true, iframes are rendered inline into the returned HTML.\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF URLs are fetched and parsed. When false, PDF URLs are skipped and a 400 WEBSITE_ACCESS_ERROR is returned.\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ html: string; success: true; type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'; url: string; }`\n\n  - `html: string`\n  - `success: true`\n  - `type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'`\n  - `url: string`\n\n### Example\n\n```typescript\nimport ContextDev from 'context.dev';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webScrapeHTML({ url: 'https://example.com' });\n\nconsole.log(response);\n```",
+      "## web_scrape_html\n\n`client.web.webScrapeHTML(url: string, excludeSelectors?: string[], headers?: object, includeFrames?: boolean, includeSelectors?: string[], maxAgeMs?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, timeoutMS?: number, waitForMs?: number): { html: string; success: true; type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'; url: string; }`\n\n**get** `/web/scrape/html`\n\nScrapes the given URL and returns the raw HTML content of the page.\n\n### Parameters\n\n- `url: string`\n  Full URL to scrape (must include http:// or https:// protocol)\n\n- `excludeSelectors?: string[]`\n  CSS selectors to remove from the result. Applied after includeSelectors. Exclusion takes precedence: an element matching both is removed. Examples: \"nav\", \"footer\", \".ad-banner\", \"[aria-hidden=true]\".\n\n- `headers?: object`\n  Optional outbound HTTP headers forwarded only to the target URL, sent as deep-object query params such as headers[X-Custom]=value. When provided, caching is bypassed: the result is neither read from nor written to cache.\n\n- `includeFrames?: boolean`\n  When true, iframes are rendered inline into the returned HTML.\n\n- `includeSelectors?: string[]`\n  CSS selectors. When provided, only matching subtrees (and their descendants) are kept and everything else is dropped. When omitted, the entire document is kept. Examples: \"article.main\", \"#content\", \"[role=main]\".\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF URLs are fetched and parsed. When false, PDF URLs are skipped and a 400 WEBSITE_ACCESS_ERROR is returned.\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ html: string; success: true; type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'; url: string; }`\n\n  - `html: string`\n  - `success: true`\n  - `type: 'html' | 'xml' | 'json' | 'text' | 'csv' | 'markdown' | 'svg' | 'pdf'`\n  - `url: string`\n\n### Example\n\n```typescript\nimport ContextDev from 'context.dev';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webScrapeHTML({ url: 'https://example.com' });\n\nconsole.log(response);\n```",
     perLanguage: {
       typescript: {
         method: 'client.web.webScrapeHTML',
@@ -108,10 +110,12 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     qualified: 'client.web.webScrapeMd',
     params: [
       'url: string;',
+      'excludeSelectors?: string[];',
       'headers?: object;',
       'includeFrames?: boolean;',
       'includeImages?: boolean;',
       'includeLinks?: boolean;',
+      'includeSelectors?: string[];',
       'maxAgeMs?: number;',
       'pdf?: { end?: number; shouldParse?: boolean; start?: number; };',
       'shortenBase64Images?: boolean;',
@@ -121,7 +125,7 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     ],
     response: '{ markdown: string; success: true; url: string; }',
     markdown:
-      "## web_scrape_md\n\n`client.web.webScrapeMd(url: string, headers?: object, includeFrames?: boolean, includeImages?: boolean, includeLinks?: boolean, maxAgeMs?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, shortenBase64Images?: boolean, timeoutMS?: number, useMainContentOnly?: boolean, waitForMs?: number): { markdown: string; success: true; url: string; }`\n\n**get** `/web/scrape/markdown`\n\nScrapes the given URL into LLM usable Markdown.\n\n### Parameters\n\n- `url: string`\n  Full URL to scrape into LLM usable Markdown (must include http:// or https:// protocol)\n\n- `headers?: object`\n  Optional outbound HTTP headers forwarded only to the target URL, sent as deep-object query params such as headers[X-Custom]=value. When provided, caching is bypassed: the result is neither read from nor written to cache.\n\n- `includeFrames?: boolean`\n  When true, the contents of iframes are rendered to Markdown.\n\n- `includeImages?: boolean`\n  Include image references in Markdown output\n\n- `includeLinks?: boolean`\n  Preserve hyperlinks in Markdown output\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF URLs are fetched and parsed. When false, PDF URLs are skipped and a 400 WEBSITE_ACCESS_ERROR is returned.\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `shortenBase64Images?: boolean`\n  Shorten base64-encoded image data in the Markdown output\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `useMainContentOnly?: boolean`\n  Extract only the main content of the page, excluding headers, footers, sidebars, and navigation\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load before converting the page to Markdown. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ markdown: string; success: true; url: string; }`\n\n  - `markdown: string`\n  - `success: true`\n  - `url: string`\n\n### Example\n\n```typescript\nimport ContextDev from 'context.dev';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webScrapeMd({ url: 'https://example.com' });\n\nconsole.log(response);\n```",
+      '## web_scrape_md\n\n`client.web.webScrapeMd(url: string, excludeSelectors?: string[], headers?: object, includeFrames?: boolean, includeImages?: boolean, includeLinks?: boolean, includeSelectors?: string[], maxAgeMs?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, shortenBase64Images?: boolean, timeoutMS?: number, useMainContentOnly?: boolean, waitForMs?: number): { markdown: string; success: true; url: string; }`\n\n**get** `/web/scrape/markdown`\n\nScrapes the given URL into LLM usable Markdown.\n\n### Parameters\n\n- `url: string`\n  Full URL to scrape into LLM usable Markdown (must include http:// or https:// protocol)\n\n- `excludeSelectors?: string[]`\n  CSS selectors to remove before conversion to Markdown. Applied after includeSelectors. Exclusion takes precedence: an element matching both is removed. Examples: "nav", "footer", ".ad-banner", "[aria-hidden=true]".\n\n- `headers?: object`\n  Optional outbound HTTP headers forwarded only to the target URL, sent as deep-object query params such as headers[X-Custom]=value. When provided, caching is bypassed: the result is neither read from nor written to cache.\n\n- `includeFrames?: boolean`\n  When true, the contents of iframes are rendered to Markdown.\n\n- `includeImages?: boolean`\n  Include image references in Markdown output\n\n- `includeLinks?: boolean`\n  Preserve hyperlinks in Markdown output\n\n- `includeSelectors?: string[]`\n  CSS selectors. When provided, only matching HTML subtrees (and their descendants) are kept before conversion to Markdown. When omitted, the entire document is kept. Examples: "article.main", "#content", "[role=main]".\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF URLs are fetched and parsed. When false, PDF URLs are skipped and a 400 WEBSITE_ACCESS_ERROR is returned.\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `shortenBase64Images?: boolean`\n  Shorten base64-encoded image data in the Markdown output\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `useMainContentOnly?: boolean`\n  Extract only the main content of the page, excluding headers, footers, sidebars, and navigation\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load before converting the page to Markdown. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ markdown: string; success: true; url: string; }`\n\n  - `markdown: string`\n  - `success: true`\n  - `url: string`\n\n### Example\n\n```typescript\nimport ContextDev from \'context.dev\';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webScrapeMd({ url: \'https://example.com\' });\n\nconsole.log(response);\n```',
     perLanguage: {
       typescript: {
         method: 'client.web.webScrapeMd',
@@ -304,10 +308,12 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     qualified: 'client.web.webCrawlMd',
     params: [
       'url: string;',
+      'excludeSelectors?: string[];',
       'followSubdomains?: boolean;',
       'includeFrames?: boolean;',
       'includeImages?: boolean;',
       'includeLinks?: boolean;',
+      'includeSelectors?: string[];',
       'maxAgeMs?: number;',
       'maxDepth?: number;',
       'maxPages?: number;',
@@ -322,7 +328,7 @@ const EMBEDDED_METHODS: MethodEntry[] = [
     response:
       '{ metadata: { maxCrawlDepth: number; numFailed: number; numSkipped: number; numSucceeded: number; numUrls: number; }; results: { markdown: string; metadata: { crawlDepth: number; statusCode: number; success: boolean; title: string; url: string; }; }[]; }',
     markdown:
-      "## web_crawl_md\n\n`client.web.webCrawlMd(url: string, followSubdomains?: boolean, includeFrames?: boolean, includeImages?: boolean, includeLinks?: boolean, maxAgeMs?: number, maxDepth?: number, maxPages?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, shortenBase64Images?: boolean, stopAfterMs?: number, timeoutMS?: number, urlRegex?: string, useMainContentOnly?: boolean, waitForMs?: number): { metadata: object; results: object[]; }`\n\n**post** `/web/crawl`\n\nPerforms a crawl starting from a given URL, extracts page content as Markdown, and returns results for all crawled pages.\n\n### Parameters\n\n- `url: string`\n  The starting URL for the crawl (must include http:// or https:// protocol)\n\n- `followSubdomains?: boolean`\n  When true, follow links on subdomains of the starting URL's domain (e.g. docs.example.com when starting from example.com). www and apex are always treated as equivalent.\n\n- `includeFrames?: boolean`\n  When true, the contents of iframes are rendered to Markdown for each crawled page.\n\n- `includeImages?: boolean`\n  Include image references in the Markdown output\n\n- `includeLinks?: boolean`\n  Preserve hyperlinks in the Markdown output\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `maxDepth?: number`\n  Maximum link depth from the starting URL (0 = only the starting page)\n\n- `maxPages?: number`\n  Maximum number of pages to crawl. Hard cap: 500.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF pages are fetched and parsed. When false, PDF pages are skipped entirely (not included in results and not counted as failures).\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `shortenBase64Images?: boolean`\n  Truncate base64-encoded image data in the Markdown output\n\n- `stopAfterMs?: number`\n  Soft time budget for the crawl in milliseconds. After each scrape, the crawler checks the elapsed time and, if exceeded, returns the pages collected so far instead of continuing. Min: 10000 (10s). Max: 240000 (4 min). Default: 120000 (2 min).\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `urlRegex?: string`\n  Regex pattern. Only URLs matching this pattern will be followed and scraped.\n\n- `useMainContentOnly?: boolean`\n  Extract only the main content, stripping headers, footers, sidebars, and navigation\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load for each crawled page. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ metadata: { maxCrawlDepth: number; numFailed: number; numSkipped: number; numSucceeded: number; numUrls: number; }; results: { markdown: string; metadata: { crawlDepth: number; statusCode: number; success: boolean; title: string; url: string; }; }[]; }`\n\n  - `metadata: { maxCrawlDepth: number; numFailed: number; numSkipped: number; numSucceeded: number; numUrls: number; }`\n  - `results: { markdown: string; metadata: { crawlDepth: number; statusCode: number; success: boolean; title: string; url: string; }; }[]`\n\n### Example\n\n```typescript\nimport ContextDev from 'context.dev';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webCrawlMd({ url: 'https://example.com' });\n\nconsole.log(response);\n```",
+      '## web_crawl_md\n\n`client.web.webCrawlMd(url: string, excludeSelectors?: string[], followSubdomains?: boolean, includeFrames?: boolean, includeImages?: boolean, includeLinks?: boolean, includeSelectors?: string[], maxAgeMs?: number, maxDepth?: number, maxPages?: number, pdf?: { end?: number; shouldParse?: boolean; start?: number; }, shortenBase64Images?: boolean, stopAfterMs?: number, timeoutMS?: number, urlRegex?: string, useMainContentOnly?: boolean, waitForMs?: number): { metadata: object; results: object[]; }`\n\n**post** `/web/crawl`\n\nPerforms a crawl starting from a given URL, extracts page content as Markdown, and returns results for all crawled pages.\n\n### Parameters\n\n- `url: string`\n  The starting URL for the crawl (must include http:// or https:// protocol)\n\n- `excludeSelectors?: string[]`\n  CSS selectors to remove before each crawled page is converted to Markdown. Applied after includeSelectors. Exclusion takes precedence: an element matching both is removed. Examples: "nav", "footer", ".ad-banner", "[aria-hidden=true]".\n\n- `followSubdomains?: boolean`\n  When true, follow links on subdomains of the starting URL\'s domain (e.g. docs.example.com when starting from example.com). www and apex are always treated as equivalent.\n\n- `includeFrames?: boolean`\n  When true, the contents of iframes are rendered to Markdown for each crawled page.\n\n- `includeImages?: boolean`\n  Include image references in the Markdown output\n\n- `includeLinks?: boolean`\n  Preserve hyperlinks in the Markdown output\n\n- `includeSelectors?: string[]`\n  CSS selectors. When provided, only matching HTML subtrees (and their descendants) are kept before each crawled page is converted to Markdown. When omitted, the entire document is kept. Examples: "article.main", "#content", "[role=main]".\n\n- `maxAgeMs?: number`\n  Return a cached result if a prior scrape for the same parameters exists and is younger than this many milliseconds. Defaults to 1 day (86400000 ms) when omitted. Max is 30 days (2592000000 ms). Set to 0 to always scrape fresh.\n\n- `maxDepth?: number`\n  Maximum link depth from the starting URL (0 = only the starting page)\n\n- `maxPages?: number`\n  Maximum number of pages to crawl. Hard cap: 500.\n\n- `pdf?: { end?: number; shouldParse?: boolean; start?: number; }`\n  PDF parsing controls. Use start/end to limit text extraction and OCR to an inclusive 1-based page range.\n  - `end?: number`\n    Last 1-based PDF page to parse. When omitted, parsing ends at the last page. Must be greater than or equal to start when both are provided.\n  - `shouldParse?: boolean`\n    When true, PDF pages are fetched and parsed. When false, PDF pages are skipped entirely (not included in results and not counted as failures).\n  - `start?: number`\n    First 1-based PDF page to parse. When omitted, parsing starts at the first page.\n\n- `shortenBase64Images?: boolean`\n  Truncate base64-encoded image data in the Markdown output\n\n- `stopAfterMs?: number`\n  Soft time budget for the crawl in milliseconds. After each scrape, the crawler checks the elapsed time and, if exceeded, returns the pages collected so far instead of continuing. Min: 10000 (10s). Max: 240000 (4 min). Default: 120000 (2 min).\n\n- `timeoutMS?: number`\n  Optional timeout in milliseconds for the request. If the request takes longer than this value, it will be aborted with a 408 status code. Maximum allowed value is 300000ms (5 minutes).\n\n- `urlRegex?: string`\n  Regex pattern. Only URLs matching this pattern will be followed and scraped.\n\n- `useMainContentOnly?: boolean`\n  Extract only the main content, stripping headers, footers, sidebars, and navigation\n\n- `waitForMs?: number`\n  Optional browser wait time in milliseconds after initial page load for each crawled page. Min: 0. Max: 30000 (30 seconds). \n\n### Returns\n\n- `{ metadata: { maxCrawlDepth: number; numFailed: number; numSkipped: number; numSucceeded: number; numUrls: number; }; results: { markdown: string; metadata: { crawlDepth: number; statusCode: number; success: boolean; title: string; url: string; }; }[]; }`\n\n  - `metadata: { maxCrawlDepth: number; numFailed: number; numSkipped: number; numSucceeded: number; numUrls: number; }`\n  - `results: { markdown: string; metadata: { crawlDepth: number; statusCode: number; success: boolean; title: string; url: string; }; }[]`\n\n### Example\n\n```typescript\nimport ContextDev from \'context.dev\';\n\nconst client = new ContextDev();\n\nconst response = await client.web.webCrawlMd({ url: \'https://example.com\' });\n\nconsole.log(response);\n```',
     perLanguage: {
       typescript: {
         method: 'client.web.webCrawlMd',
diff --git a/src/resources/web.ts b/src/resources/web.ts
index aa0bdc0..124997f 100644
--- a/src/resources/web.ts
+++ b/src/resources/web.ts
@@ -1629,6 +1629,13 @@ export interface WebWebCrawlMdParams {
    */
   url: string;
 
+  /**
+   * CSS selectors to remove before each crawled page is converted to Markdown.
+   * Applied after includeSelectors. Exclusion takes precedence: an element matching
+   * both is removed. Examples: "nav", "footer", ".ad-banner", "[aria-hidden=true]".
+   */
+  excludeSelectors?: Array<string>;
+
   /**
    * When true, follow links on subdomains of the starting URL's domain (e.g.
    * docs.example.com when starting from example.com). www and apex are always
@@ -1652,6 +1659,14 @@ export interface WebWebCrawlMdParams {
    */
   includeLinks?: boolean;
 
+  /**
+   * CSS selectors. When provided, only matching HTML subtrees (and their
+   * descendants) are kept before each crawled page is converted to Markdown. When
+   * omitted, the entire document is kept. Examples: "article.main", "#content",
+   * "[role=main]".
+   */
+  includeSelectors?: Array<string>;
+
   /**
    * Return a cached result if a prior scrape for the same parameters exists and is
    * younger than this many milliseconds. Defaults to 1 day (86400000 ms) when
@@ -1744,6 +1759,13 @@ export interface WebWebScrapeHTMLParams {
    */
   url: string;
 
+  /**
+   * CSS selectors to remove from the result. Applied after includeSelectors.
+   * Exclusion takes precedence: an element matching both is removed. Examples:
+   * "nav", "footer", ".ad-banner", "[aria-hidden=true]".
+   */
+  excludeSelectors?: Array<string>;
+
   /**
    * Optional outbound HTTP headers forwarded only to the target URL, sent as
    * deep-object query params such as headers[X-Custom]=value. When provided, caching
@@ -1756,6 +1778,13 @@ export interface WebWebScrapeHTMLParams {
    */
   includeFrames?: boolean;
 
+  /**
+   * CSS selectors. When provided, only matching subtrees (and their descendants) are
+   * kept and everything else is dropped. When omitted, the entire document is kept.
+   * Examples: "article.main", "#content", "[role=main]".
+   */
+  includeSelectors?: Array<string>;
+
   /**
    * Return a cached result if a prior scrape for the same parameters exists and is
    * younger than this many milliseconds. Defaults to 1 day (86400000 ms) when
@@ -1883,6 +1912,13 @@ export interface WebWebScrapeMdParams {
    */
   url: string;
 
+  /**
+   * CSS selectors to remove before conversion to Markdown. Applied after
+   * includeSelectors. Exclusion takes precedence: an element matching both is
+   * removed. Examples: "nav", "footer", ".ad-banner", "[aria-hidden=true]".
+   */
+  excludeSelectors?: Array<string>;
+
   /**
    * Optional outbound HTTP headers forwarded only to the target URL, sent as
    * deep-object query params such as headers[X-Custom]=value. When provided, caching
@@ -1905,6 +1941,13 @@ export interface WebWebScrapeMdParams {
    */
   includeLinks?: boolean;
 
+  /**
+   * CSS selectors. When provided, only matching HTML subtrees (and their
+   * descendants) are kept before conversion to Markdown. When omitted, the entire
+   * document is kept. Examples: "article.main", "#content", "[role=main]".
+   */
+  includeSelectors?: Array<string>;
+
   /**
    * Return a cached result if a prior scrape for the same parameters exists and is
    * younger than this many milliseconds. Defaults to 1 day (86400000 ms) when
diff --git a/tests/api-resources/web.test.ts b/tests/api-resources/web.test.ts
index 1d69f42..837bf84 100644
--- a/tests/api-resources/web.test.ts
+++ b/tests/api-resources/web.test.ts
@@ -220,10 +220,12 @@ describe('resource web', () => {
   test.skip('webCrawlMd: required and optional params', async () => {
     const response = await client.web.webCrawlMd({
       url: 'https://example.com',
+      excludeSelectors: ['string'],
       followSubdomains: true,
       includeFrames: true,
       includeImages: true,
       includeLinks: true,
+      includeSelectors: ['string'],
       maxAgeMs: 0,
       maxDepth: 0,
       maxPages: 1,
@@ -257,8 +259,10 @@ describe('resource web', () => {
   test.skip('webScrapeHTML: required and optional params', async () => {
     const response = await client.web.webScrapeHTML({
       url: 'https://example.com',
+      excludeSelectors: ['string'],
       headers: { foo: 'J!' },
       includeFrames: true,
+      includeSelectors: ['string'],
       maxAgeMs: 0,
       pdf: {
         end: 1,
@@ -315,10 +319,12 @@ describe('resource web', () => {
   test.skip('webScrapeMd: required and optional params', async () => {
     const response = await client.web.webScrapeMd({
       url: 'https://example.com',
+      excludeSelectors: ['string'],
       headers: { foo: 'J!' },
       includeFrames: true,
       includeImages: true,
       includeLinks: true,
+      includeSelectors: ['string'],
       maxAgeMs: 0,
       pdf: {
         end: 1,

From 5d3982b3fa5fb45055eea15f5520cb314789202c Mon Sep 17 00:00:00 2001
From: "stainless-app[bot]"
 <142633134+stainless-app[bot]@users.noreply.github.com>
Date: Sun, 7 Jun 2026 22:03:19 +0000
Subject: [PATCH 2/2] release: 1.32.0

---
 .release-please-manifest.json     | 2 +-
 CHANGELOG.md                      | 8 ++++++++
 package.json                      | 2 +-
 packages/mcp-server/manifest.json | 2 +-
 packages/mcp-server/package.json  | 2 +-
 packages/mcp-server/src/server.ts | 2 +-
 src/version.ts                    | 2 +-
 7 files changed, 14 insertions(+), 6 deletions(-)

diff --git a/.release-please-manifest.json b/.release-please-manifest.json
index 306dc07..f16e9b1 100644
--- a/.release-please-manifest.json
+++ b/.release-please-manifest.json
@@ -1,3 +1,3 @@
 {
-  ".": "1.31.0"
+  ".": "1.32.0"
 }
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 526f7f1..3442c99 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,13 @@
 # Changelog
 
+## 1.32.0 (2026-06-07)
+
+Full Changelog: [v1.31.0...v1.32.0](https://github.com/context-dot-dev/context-typescript-sdk/compare/v1.31.0...v1.32.0)
+
+### Features
+
+* **api:** api update ([ff4cabc](https://github.com/context-dot-dev/context-typescript-sdk/commit/ff4cabcb0323ce677e117d5f4e903242cc6e4c0e))
+
 ## 1.31.0 (2026-06-07)
 
 Full Changelog: [v1.30.0...v1.31.0](https://github.com/context-dot-dev/context-typescript-sdk/compare/v1.30.0...v1.31.0)
diff --git a/package.json b/package.json
index 8a9b57c..7d4b61d 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "context.dev",
-  "version": "1.31.0",
+  "version": "1.32.0",
   "description": "The official TypeScript library for the Context Dev API",
   "author": "Context Dev <hello@context.dev>",
   "types": "dist/index.d.ts",
diff --git a/packages/mcp-server/manifest.json b/packages/mcp-server/manifest.json
index f842fd6..b5dd168 100644
--- a/packages/mcp-server/manifest.json
+++ b/packages/mcp-server/manifest.json
@@ -1,7 +1,7 @@
 {
   "dxt_version": "0.2",
   "name": "context.dev-mcp",
-  "version": "1.31.0",
+  "version": "1.32.0",
   "description": "The official MCP Server for the Context Dev API",
   "author": {
     "name": "Context Dev",
diff --git a/packages/mcp-server/package.json b/packages/mcp-server/package.json
index fccf0d4..50f4155 100644
--- a/packages/mcp-server/package.json
+++ b/packages/mcp-server/package.json
@@ -1,6 +1,6 @@
 {
   "name": "context.dev-mcp",
-  "version": "1.31.0",
+  "version": "1.32.0",
   "description": "The official MCP Server for the Context Dev API",
   "author": "Context Dev <hello@context.dev>",
   "types": "dist/index.d.ts",
diff --git a/packages/mcp-server/src/server.ts b/packages/mcp-server/src/server.ts
index 6c3c569..514204f 100644
--- a/packages/mcp-server/src/server.ts
+++ b/packages/mcp-server/src/server.ts
@@ -28,7 +28,7 @@ export const newMcpServer = async ({
   new McpServer(
     {
       name: 'context_dev_api',
-      version: '1.31.0',
+      version: '1.32.0',
     },
     {
       instructions: await getInstructions({ stainlessApiKey, customInstructionsPath }),
diff --git a/src/version.ts b/src/version.ts
index f3e3208..49bad0d 100644
--- a/src/version.ts
+++ b/src/version.ts
@@ -1 +1 @@
-export const VERSION = '1.31.0'; // x-release-please-version
+export const VERSION = '1.32.0'; // x-release-please-version