Merge pull request #29 from devdiv-microsoft/tyler/satisfied-peafowl

TylerLeonhardt · web-flow · commit 6e1169b54a0e · 2025-05-09T08:23:08.000-07:00
MSRC 96762 (CVE-2025-21264)
diff --git a/src/vs/workbench/contrib/chat/browser/chatMarkdownRenderer.ts b/src/vs/workbench/contrib/chat/browser/chatMarkdownRenderer.ts
@@ -16,7 +16,6 @@ import { IFileService } from '../../../../platform/files/common/files.js';
 import { IHoverService } from '../../../../platform/hover/browser/hover.js';
 import { IOpenerService } from '../../../../platform/opener/common/opener.js';
 import { REVEAL_IN_EXPLORER_COMMAND_ID } from '../../files/browser/fileConstants.js';
-import { ITrustedDomainService } from '../../url/browser/trustedDomainService.js';
 
 const allowedHtmlTags = [
 	'b',
@@ -63,7 +62,6 @@ export class ChatMarkdownRenderer extends MarkdownRenderer {
 		options: IMarkdownRendererOptions | undefined,
 		@ILanguageService languageService: ILanguageService,
 		@IOpenerService openerService: IOpenerService,
-		@ITrustedDomainService private readonly trustedDomainService: ITrustedDomainService,
 		@IHoverService private readonly hoverService: IHoverService,
 		@IFileService private readonly fileService: IFileService,
 		@ICommandService private readonly commandService: ICommandService,
@@ -74,7 +72,7 @@ export class ChatMarkdownRenderer extends MarkdownRenderer {
 	override render(markdown: IMarkdownString | undefined, options?: MarkdownRenderOptions, markedOptions?: MarkedOptions): IMarkdownRenderResult {
 		options = {
 			...options,
-			remoteImageIsAllowed: (uri) => this.trustedDomainService.isValid(uri),
+			remoteImageIsAllowed: (_uri) => false,
 			sanitizerOptions: {
 				replaceWithPlaintext: true,
 				allowedTags: allowedHtmlTags,
diff --git a/src/vs/workbench/contrib/chat/electron-sandbox/tools/fetchPageTool.ts b/src/vs/workbench/contrib/chat/electron-sandbox/tools/fetchPageTool.ts
@@ -5,10 +5,10 @@
 
 import { CancellationToken } from '../../../../../base/common/cancellation.js';
 import { MarkdownString } from '../../../../../base/common/htmlContent.js';
+import { ResourceSet } from '../../../../../base/common/map.js';
 import { URI } from '../../../../../base/common/uri.js';
 import { localize } from '../../../../../nls.js';
 import { IWebContentExtractorService } from '../../../../../platform/webContentExtractor/common/webContentExtractor.js';
-import { ITrustedDomainService } from '../../../url/browser/trustedDomainService.js';
 import { CountTokensCallback, IPreparedToolInvocation, IToolData, IToolImpl, IToolInvocation, IToolResult, IToolResultTextPart, ToolProgress } from '../../common/languageModelToolsService.js';
 import { InternalFetchWebPageToolId } from '../../common/tools/tools.js';
 
@@ -34,11 +34,10 @@ export const FetchWebPageToolData: IToolData = {
 };
 
 export class FetchWebPageTool implements IToolImpl {
-	private _alreadyApprovedDomains = new Set<string>();
+	private _alreadyApprovedDomains = new ResourceSet();
 
 	constructor(
 		@IWebContentExtractorService private readonly _readerModeService: IWebContentExtractorService,
-		@ITrustedDomainService private readonly _trustedDomainService: ITrustedDomainService,
 	) { }
 
 	async invoke(invocation: IToolInvocation, _countTokens: CountTokensCallback, _progress: ToolProgress, _token: CancellationToken): Promise<IToolResult> {
@@ -53,9 +52,7 @@ export class FetchWebPageTool implements IToolImpl {
 		// We approved these via confirmation, so mark them as "approved" in this session
 		// if they are not approved via the trusted domain service.
 		for (const uri of validUris) {
-			if (!this._trustedDomainService.isValid(uri)) {
-				this._alreadyApprovedDomains.add(uri.toString(true));
-			}
+			this._alreadyApprovedDomains.add(uri);
 		}
 
 		const contents = await this._readerModeService.extract(validUris);
@@ -89,7 +86,7 @@ export class FetchWebPageTool implements IToolImpl {
 				valid.push(uri);
 			}
 		});
-		const urlsNeedingConfirmation = valid.filter(url => !this._trustedDomainService.isValid(url) && !this._alreadyApprovedDomains.has(url.toString(true)));
+		const urlsNeedingConfirmation = valid.filter(url => !this._alreadyApprovedDomains.has(url));
 
 		const pastTenseMessage = invalid.length
 			? invalid.length > 1
@@ -138,32 +135,17 @@ export class FetchWebPageTool implements IToolImpl {
 
 		const result: IPreparedToolInvocation = { invocationMessage, pastTenseMessage };
 		if (urlsNeedingConfirmation.length) {
-			const confirmationTitle = urlsNeedingConfirmation.length > 1
-				? localize('fetchWebPage.confirmationTitle.plural', 'Fetch untrusted web pages?')
-				: localize('fetchWebPage.confirmationTitle.singular', 'Fetch untrusted web page?');
-
-			const managedTrustedDomainsCommand = 'workbench.action.manageTrustedDomain';
-			const confirmationMessage = new MarkdownString(
-				urlsNeedingConfirmation.length > 1
-					? urlsNeedingConfirmation.map(uri => `- ${uri.toString()}`).join('\n')
-					: urlsNeedingConfirmation[0].toString(),
-				{
-					isTrusted: { enabledCommands: [managedTrustedDomainsCommand] },
-					supportThemeIcons: true
-				}
-			);
-
-			confirmationMessage.appendMarkdown(
-				'\n\n$(info) ' + localize(
-					'fetchWebPage.confirmationMessageManageTrustedDomains',
-					'You can [manage your trusted domains]({0}) to skip this confirmation in the future.',
-					`command:${managedTrustedDomainsCommand}`
-				)
-			);
-
-			result.confirmationMessages = { title: confirmationTitle, message: confirmationMessage, allowAutoConfirm: false };
+			let confirmationTitle: string;
+			let confirmationMessage: string | MarkdownString;
+			if (urlsNeedingConfirmation.length === 1) {
+				confirmationTitle = localize('fetchWebPage.confirmationTitle.singular', 'Fetch untrusted web page?');
+				confirmationMessage = urlsNeedingConfirmation[0].toString();
+			} else {
+				confirmationTitle = localize('fetchWebPage.confirmationTitle.plural', 'Fetch untrusted web pages?');
+				confirmationMessage = new MarkdownString(urlsNeedingConfirmation.map(uri => `- ${uri.toString()}`).join('\n'));
+			}
+			result.confirmationMessages = { title: confirmationTitle, message: confirmationMessage, allowAutoConfirm: true };
 		}
-
 		return result;
 	}
 
diff --git a/src/vs/workbench/contrib/chat/test/browser/__snapshots__/ChatMarkdownRenderer_remote_images.0.snap b/src/vs/workbench/contrib/chat/test/browser/__snapshots__/ChatMarkdownRenderer_remote_images.0.snap
diff --git a/src/vs/workbench/contrib/chat/test/browser/__snapshots__/ChatMarkdownRenderer_remote_images_are_disallowed.0.snap b/src/vs/workbench/contrib/chat/test/browser/__snapshots__/ChatMarkdownRenderer_remote_images_are_disallowed.0.snap
@@ -0,0 +1 @@
+<div class="rendered-markdown"><p></p><div>&lt;img src="http://disallowed.com/image.jpg"&gt;</div><p></p></div>
diff --git a/src/vs/workbench/contrib/chat/test/browser/chatMarkdownRenderer.test.ts b/src/vs/workbench/contrib/chat/test/browser/chatMarkdownRenderer.test.ts
@@ -7,8 +7,6 @@ import { MarkdownString } from '../../../../../base/common/htmlContent.js';
 import { assertSnapshot } from '../../../../../base/test/common/snapshot.js';
 import { ensureNoDisposablesAreLeakedInTestSuite } from '../../../../../base/test/common/utils.js';
 import { ChatMarkdownRenderer } from '../../browser/chatMarkdownRenderer.js';
-import { ITrustedDomainService } from '../../../url/browser/trustedDomainService.js';
-import { MockTrustedDomainService } from '../../../url/test/browser/mockTrustedDomainService.js';
 import { workbenchInstantiationService } from '../../../../test/browser/workbenchTestServices.js';
 
 suite('ChatMarkdownRenderer', () => {
@@ -17,7 +15,6 @@ suite('ChatMarkdownRenderer', () => {
 	let testRenderer: ChatMarkdownRenderer;
 	setup(() => {
 		const instantiationService = store.add(workbenchInstantiationService(undefined, store));
-		instantiationService.stub(ITrustedDomainService, new MockTrustedDomainService(['http://allowed.com']));
 		testRenderer = instantiationService.createInstance(ChatMarkdownRenderer, {});
 	});
 
@@ -102,8 +99,8 @@ suite('ChatMarkdownRenderer', () => {
 		await assertSnapshot(result.element.outerHTML);
 	});
 
-	test('remote images', async () => {
-		const md = new MarkdownString('<img src="http://allowed.com/image.jpg"> <img src="http://disallowed.com/image.jpg">');
+	test('remote images are disallowed', async () => {
+		const md = new MarkdownString('<img src="http://disallowed.com/image.jpg">');
 		md.supportHtml = true;
 		const result = store.add(testRenderer.render(md));
 		await assertSnapshot(result.element.outerHTML);
diff --git a/src/vs/workbench/contrib/url/common/urlGlob.ts b/src/vs/workbench/contrib/url/common/urlGlob.ts
@@ -5,89 +5,154 @@
 
 import { URI } from '../../../../base/common/uri.js';
 
-// TODO: rewrite this to use URIs directly and validate each part individually
-// instead of relying on memoization of the stringified URI.
-export const testUrlMatchesGlob = (uri: URI, globUrl: string): boolean => {
-	let url = uri.with({ query: null, fragment: null }).toString(true);
-	const normalize = (url: string) => url.replace(/\/+$/, '');
-	globUrl = normalize(globUrl);
-	url = normalize(url);
-
-	const memo = Array.from({ length: url.length + 1 }).map(() =>
-		Array.from({ length: globUrl.length + 1 }).map(() => undefined),
-	);
+/**
+ * Normalizes a URL by removing trailing slashes and query/fragment components.
+ * @param url The URL to normalize.
+ * @returns URI - The normalized URI object.
+ */
+function normalizeURL(url: string | URI): URI {
+	const uri = typeof url === 'string' ? URI.parse(url) : url;
+	return uri.with({
+		// Remove trailing slashes
+		path: uri.path.replace(/\/+$/, ''),
+		// Remove query and fragment
+		query: null,
+		fragment: null,
+	});
+}
 
-	if (/^[^./:]*:\/\//.test(globUrl)) {
-		return doUrlMatch(memo, url, globUrl, 0, 0);
-	}
+/**
+ * Checks if a given URL matches a glob URL pattern.
+ * The glob URL pattern can contain wildcards (*) and subdomain matching (*.)
+ * @param uri The URL to check.
+ * @param globUrl The glob URL pattern to match against.
+ * @returns boolean - True if the URL matches the glob URL pattern, false otherwise.
+ */
+export function testUrlMatchesGlob(uri: string | URI, globUrl: string): boolean {
+	const normalizedUrl = normalizeURL(uri);
+	let normalizedGlobUrl = normalizeURL(globUrl);
 
-	const scheme = /^(https?):\/\//.exec(url)?.[1];
-	if (scheme) {
-		return doUrlMatch(memo, url, `${scheme}://${globUrl}`, 0, 0);
+	const globHasScheme = /^[^./:]*:\/\//.test(globUrl);
+	// if the glob does not have a scheme we assume the scheme is http or https
+	// so if the url doesn't have a scheme of http or https we return false
+	if (!globHasScheme) {
+		if (normalizedUrl.scheme !== 'http' && normalizedUrl.scheme !== 'https') {
+			return false;
+		}
+		normalizedGlobUrl = normalizeURL(`${normalizedUrl.scheme}://${globUrl}`);
 	}
 
-	return false;
-};
+	return (
+		doMemoUrlMatch(normalizedUrl.scheme, normalizedGlobUrl.scheme) &&
+		// The authority is the only thing that should do port logic.
+		doMemoUrlMatch(normalizedUrl.authority, normalizedGlobUrl.authority, true) &&
+		(
+			// A glob whose normalized path is just '/' places no restriction on the URL's path.
+			normalizedGlobUrl.path === '/' ||
+			doMemoUrlMatch(normalizedUrl.path, normalizedGlobUrl.path)
+		)
+	);
+}
+
+/**
+ * @param normalizedUrlPart The normalized URL part to match.
+ * @param normalizedGlobUrlPart The normalized glob URL part to match against.
+ * @param includePortLogic Whether to include port logic in the matching process.
+ * @returns boolean - True if the URL part matches the glob URL part, false otherwise.
+ */
+function doMemoUrlMatch(
+	normalizedUrlPart: string,
+	normalizedGlobUrlPart: string,
+	includePortLogic: boolean = false,
+) {
+	const memo = Array.from({ length: normalizedUrlPart.length + 1 }).map(() =>
+		Array.from({ length: normalizedGlobUrlPart.length + 1 }).map(() => undefined),
+	);
 
-const doUrlMatch = (
+	return doUrlPartMatch(memo, includePortLogic, normalizedUrlPart, normalizedGlobUrlPart, 0, 0);
+}
+
+/**
+ * Recursively checks if a URL part matches a glob URL part.
+ * This function uses memoization to avoid recomputing results for the same inputs.
+ * It handles various cases such as exact matches, wildcard matches, and port logic.
+ * @param memo A memoization table to avoid recomputing results for the same inputs.
+ * @param includePortLogic Whether to include port logic in the matching process.
+ * @param urlPart The URL part to match with.
+ * @param globUrlPart The glob URL part to match against.
+ * @param urlOffset The current offset in the URL part.
+ * @param globUrlOffset The current offset in the glob URL part.
+ * @returns boolean - True if the URL part matches the glob URL part, false otherwise.
+ */
+function doUrlPartMatch(
 	memo: (boolean | undefined)[][],
-	url: string,
-	globUrl: string,
+	includePortLogic: boolean,
+	urlPart: string,
+	globUrlPart: string,
 	urlOffset: number,
-	globUrlOffset: number,
-): boolean => {
+	globUrlOffset: number
+): boolean {
 	if (memo[urlOffset]?.[globUrlOffset] !== undefined) {
 		return memo[urlOffset][globUrlOffset]!;
 	}
 
 	const options = [];
 
-	// Endgame.
-	// Fully exact match
-	if (urlOffset === url.length) {
-		return globUrlOffset === globUrl.length;
+	// We've reached the end of the url.
+	if (urlOffset === urlPart.length) {
+		// We're also at the end of the glob url as well so we have an exact match.
+		if (globUrlOffset === globUrlPart.length) {
+			return true;
+		}
+
+		if (includePortLogic && globUrlPart[globUrlOffset] + globUrlPart[globUrlOffset + 1] === ':*') {
+			// any port match. Consume a port if it exists otherwise nothing. Always consume the base.
+			return globUrlOffset + 2 === globUrlPart.length;
+		}
+
+		return false;
 	}
 
 	// Some path remaining in url
-	if (globUrlOffset === globUrl.length) {
-		const remaining = url.slice(urlOffset);
+	if (globUrlOffset === globUrlPart.length) {
+		const remaining = urlPart.slice(urlOffset);
 		return remaining[0] === '/';
 	}
 
-	if (url[urlOffset] === globUrl[globUrlOffset]) {
+	if (urlPart[urlOffset] === globUrlPart[globUrlOffset]) {
 		// Exact match.
-		options.push(doUrlMatch(memo, url, globUrl, urlOffset + 1, globUrlOffset + 1));
+		options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset + 1, globUrlOffset + 1));
 	}
 
-	if (globUrl[globUrlOffset] + globUrl[globUrlOffset + 1] === '*.') {
+	if (globUrlPart[globUrlOffset] + globUrlPart[globUrlOffset + 1] === '*.') {
 		// Any subdomain match. Either consume one thing that's not a / or : and don't advance base or consume nothing and do.
-		if (!['/', ':'].includes(url[urlOffset])) {
-			options.push(doUrlMatch(memo, url, globUrl, urlOffset + 1, globUrlOffset));
+		if (!['/', ':'].includes(urlPart[urlOffset])) {
+			options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset + 1, globUrlOffset));
 		}
-		options.push(doUrlMatch(memo, url, globUrl, urlOffset, globUrlOffset + 2));
+		options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset, globUrlOffset + 2));
 	}
 
-	if (globUrl[globUrlOffset] === '*') {
+	if (globUrlPart[globUrlOffset] === '*') {
 		// Any match. Either consume one thing and don't advance base or consume nothing and do.
-		if (urlOffset + 1 === url.length) {
+		if (urlOffset + 1 === urlPart.length) {
 			// If we're at the end of the input url consume one from both.
-			options.push(doUrlMatch(memo, url, globUrl, urlOffset + 1, globUrlOffset + 1));
+			options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset + 1, globUrlOffset + 1));
 		} else {
-			options.push(doUrlMatch(memo, url, globUrl, urlOffset + 1, globUrlOffset));
+			options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset + 1, globUrlOffset));
 		}
-		options.push(doUrlMatch(memo, url, globUrl, urlOffset, globUrlOffset + 1));
+		options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset, globUrlOffset + 1));
 	}
 
-	if (globUrl[globUrlOffset] + globUrl[globUrlOffset + 1] === ':*') {
-		// any port match. Consume a port if it exists otherwise nothing. Always comsume the base.
-		if (url[urlOffset] === ':') {
+	if (includePortLogic && globUrlPart[globUrlOffset] + globUrlPart[globUrlOffset + 1] === ':*') {
+		// any port match. Consume a port if it exists otherwise nothing. Always consume the base.
+		if (urlPart[urlOffset] === ':') {
 			let endPortIndex = urlOffset + 1;
-			do { endPortIndex++; } while (/[0-9]/.test(url[endPortIndex]));
-			options.push(doUrlMatch(memo, url, globUrl, endPortIndex, globUrlOffset + 2));
+			do { endPortIndex++; } while (/[0-9]/.test(urlPart[endPortIndex]));
+			options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, endPortIndex, globUrlOffset + 2));
 		} else {
-			options.push(doUrlMatch(memo, url, globUrl, urlOffset, globUrlOffset + 2));
+			options.push(doUrlPartMatch(memo, includePortLogic, urlPart, globUrlPart, urlOffset, globUrlOffset + 2));
 		}
 	}
 
 	return (memo[urlOffset][globUrlOffset] = options.some(a => a === true));
-};
+}
diff --git a/src/vs/workbench/contrib/url/test/browser/trustedDomains.test.ts b/src/vs/workbench/contrib/url/test/browser/trustedDomains.test.ts
@@ -113,4 +113,9 @@ suite('Link protection domain matching', () => {
 		linkAllowedByRules('https://github.com/login/oauth/authorize?foo=4', ['https://github.com/login/oauth/authorize']);
 		linkAllowedByRules('https://github.com/login/oauth/authorize#foo', ['https://github.com/login/oauth/authorize']);
 	});
+
+	test('ensure individual parts of url are compared and wildcard does not leak out', () => {
+		linkNotAllowedByRules('https://x.org/github.com', ['https://*.github.com']);
+		linkNotAllowedByRules('https://x.org/y.github.com', ['https://*.github.com']);
+	});
 });

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+<div class="rendered-markdown"><p></p><div>&lt;img src="http://disallowed.com/image.jpg"&gt;</div><p></p></div>`