Implement Auto Model (#415)

lramos15 · web-flow · commit 78acc299df80 · 2025-07-31T19:16:55.000Z
* Auto mode work

* Implement auto mode

* Auto mode!
diff --git a/package-lock.json b/package-lock.json
diff --git a/package.json b/package.json
@@ -3667,7 +3667,7 @@
 		"@humanwhocodes/gitignore-to-minimatch": "1.0.2",
 		"@microsoft/tiktokenizer": "^1.0.10",
 		"@roamhq/mac-ca": "^1.0.7",
-		"@vscode/copilot-api": "^0.1.1",
+		"@vscode/copilot-api": "^0.1.3",
 		"@vscode/extension-telemetry": "^1.0.0",
 		"@vscode/l10n": "^0.0.18",
 		"@vscode/prompt-tsx": "^0.4.0-alpha.5",
diff --git a/src/extension/conversation/vscode-node/languageModelAccess.ts b/src/extension/conversation/vscode-node/languageModelAccess.ts
@@ -11,8 +11,9 @@ import { IBlockedExtensionService } from '../../../platform/chat/common/blockedE
 import { ChatFetchResponseType, ChatLocation, getErrorDetailsFromChatFetchError } from '../../../platform/chat/common/commonTypes';
 import { getTextPart } from '../../../platform/chat/common/globalStringUtils';
 import { EmbeddingType, getWellKnownEmbeddingTypeInfo, IEmbeddingsComputer } from '../../../platform/embeddings/common/embeddingsComputer';
+import { AutoChatEndpoint, isAutoModeEnabled } from '../../../platform/endpoint/common/autoChatEndpoint';
+import { IAutomodeService } from '../../../platform/endpoint/common/automodeService';
 import { IEndpointProvider } from '../../../platform/endpoint/common/endpointProvider';
-import { AutoChatEndpoint, isAutoModeEnabled } from '../../../platform/endpoint/node/autoChatEndpoint';
 import { IEnvService } from '../../../platform/env/common/envService';
 import { IVSCodeExtensionContext } from '../../../platform/extContext/common/extensionContext';
 import { ILogService } from '../../../platform/log/common/logService';
@@ -25,6 +26,7 @@ import { BaseTokensPerCompletion } from '../../../platform/tokenizer/node/tokeni
 import { Emitter } from '../../../util/vs/base/common/event';
 import { Disposable, MutableDisposable } from '../../../util/vs/base/common/lifecycle';
 import { isDefined, isNumber, isString, isStringArray } from '../../../util/vs/base/common/types';
+import { generateUuid } from '../../../util/vs/base/common/uuid';
 import { localize } from '../../../util/vs/nls';
 import { IInstantiationService } from '../../../util/vs/platform/instantiation/common/instantiation';
 import { ExtensionMode } from '../../../vscodeTypes';
@@ -51,7 +53,9 @@ export class LanguageModelAccess extends Disposable implements IExtensionContrib
 		@IEndpointProvider private readonly _endpointProvider: IEndpointProvider,
 		@IEmbeddingsComputer private readonly _embeddingsComputer: IEmbeddingsComputer,
 		@IVSCodeExtensionContext private readonly _vsCodeExtensionContext: IVSCodeExtensionContext,
-		@IExperimentationService private readonly _expService: IExperimentationService
+		@IExperimentationService private readonly _expService: IExperimentationService,
+		@IAutomodeService private readonly _automodeService: IAutomodeService,
+		@IEnvService private readonly _envService: IEnvService
 	) {
 		super();
 
@@ -96,11 +100,11 @@ export class LanguageModelAccess extends Disposable implements IExtensionContrib
 
 		const models: vscode.LanguageModelChatInformation[] = [];
 		const chatEndpoints = await this._endpointProvider.getAllChatEndpoints();
-		if (isAutoModeEnabled(this._expService)) {
-			chatEndpoints.push(this._instantiationService.createInstance(AutoChatEndpoint));
-		}
 
 		const defaultChatEndpoint = chatEndpoints.find(e => e.isDefault) ?? await this._endpointProvider.getChatEndpoint('gpt-4.1') ?? chatEndpoints[0];
+		if (isAutoModeEnabled(this._expService, this._envService)) {
+			chatEndpoints.push(await this._automodeService.resolveAutoModeEndpoint(generateUuid(), chatEndpoints));
+		}
 		const seenFamilies = new Set<string>();
 
 		for (const endpoint of chatEndpoints) {
@@ -140,7 +144,7 @@ export class LanguageModelAccess extends Disposable implements IExtensionContrib
 
 			const model: vscode.LanguageModelChatInformation = {
 				id: endpoint.model,
-				name: endpoint.name,
+				name: endpoint.model === AutoChatEndpoint.id ? 'Auto' : endpoint.name,
 				family: endpoint.family,
 				description: modelDescription,
 				cost: multiplierString,
diff --git a/src/extension/extension/vscode/services.ts b/src/extension/extension/vscode/services.ts
@@ -27,6 +27,7 @@ import { EditSurvivalTrackerService, IEditSurvivalTrackerService } from '../../.
 import { IEmbeddingsComputer } from '../../../platform/embeddings/common/embeddingsComputer';
 import { RemoteEmbeddingsComputer } from '../../../platform/embeddings/common/remoteEmbeddingsComputer';
 import { ICombinedEmbeddingIndex, VSCodeCombinedIndexImpl } from '../../../platform/embeddings/common/vscodeIndex';
+import { AutomodeService, IAutomodeService } from '../../../platform/endpoint/common/automodeService';
 import { IEnvService } from '../../../platform/env/common/envService';
 import { EnvServiceImpl } from '../../../platform/env/vscode/envServiceImpl';
 import { IVSCodeExtensionContext } from '../../../platform/extContext/common/extensionContext';
@@ -107,6 +108,7 @@ export function registerServices(builder: IInstantiationServiceBuilder, extensio
 	const isTestMode = extensionContext.extensionMode === ExtensionMode.Test;
 
 	builder.define(IInteractionService, new SyncDescriptor(InteractionService));
+	builder.define(IAutomodeService, new SyncDescriptor(AutomodeService));
 	builder.define(ICopilotTokenStore, new CopilotTokenStore());
 	builder.define(IDebugOutputService, new DebugOutputServiceImpl());
 	builder.define(IDialogService, new DialogServiceImpl());
diff --git a/src/extension/prompt/vscode-node/endpointProviderImpl.ts b/src/extension/prompt/vscode-node/endpointProviderImpl.ts
@@ -6,10 +6,11 @@
 import { LanguageModelChat, type ChatRequest } from 'vscode';
 import { IAuthenticationService } from '../../../platform/authentication/common/authentication';
 import { ConfigKey, EMBEDDING_MODEL, IConfigurationService } from '../../../platform/configuration/common/configurationService';
+import { AutoChatEndpoint } from '../../../platform/endpoint/common/autoChatEndpoint';
+import { IAutomodeService } from '../../../platform/endpoint/common/automodeService';
 import { ICAPIClientService } from '../../../platform/endpoint/common/capiClient';
 import { IDomainService } from '../../../platform/endpoint/common/domainService';
 import { ChatEndpointFamily, EmbeddingsEndpointFamily, IChatModelInformation, IEmbeddingModelInformation, IEndpointProvider } from '../../../platform/endpoint/common/endpointProvider';
-import { AutoChatEndpoint, resolveAutoChatEndpoint } from '../../../platform/endpoint/node/autoChatEndpoint';
 import { CopilotChatEndpoint } from '../../../platform/endpoint/node/copilotChatEndpoint';
 import { EmbeddingEndpoint } from '../../../platform/endpoint/node/embeddingsEndpoint';
 import { IModelMetadataFetcher, ModelMetadataFetcher } from '../../../platform/endpoint/node/modelMetadataFetcher';
@@ -38,6 +39,7 @@ export class ProductionEndpointProvider implements IEndpointProvider {
 		@IDomainService domainService: IDomainService,
 		@ICAPIClientService capiClientService: ICAPIClientService,
 		@IFetcherService fetcher: IFetcherService,
+		@IAutomodeService private readonly _autoModeService: IAutomodeService,
 		@IExperimentationService private readonly _expService: IExperimentationService,
 		@ITelemetryService private readonly _telemetryService: ITelemetryService,
 		@ILogService private readonly _logService: ILogService,
@@ -140,7 +142,9 @@ export class ProductionEndpointProvider implements IEndpointProvider {
 			if (experimentModelConfig && model && model.id === experimentModelConfig.id) {
 				endpoint = (await this.getAllChatEndpoints()).find(e => e.model === experimentModelConfig.selected) || await this.getChatEndpoint('gpt-4.1');
 			} else if (model && model.vendor === 'copilot' && model.id === AutoChatEndpoint.id) {
-				return resolveAutoChatEndpoint(this, this._expService, (requestOrFamilyOrModel as ChatRequest)?.prompt);
+				// TODO @lramos15 - This may be the ugliest cast I've ever seen but our types seem to be incorrect
+				const conversationdId = ((requestOrFamilyOrModel as ChatRequest).toolInvocationToken as { sessionId: string }).sessionId || 'unknown';
+				return this._autoModeService.getCachedAutoEndpoint(conversationdId) || this._autoModeService.resolveAutoModeEndpoint(conversationdId, await this.getAllChatEndpoints());
 			} else if (model && model.vendor === 'copilot') {
 				let modelMetadata = await this._modelFetcher.getChatModelFromApiModel(model);
 				if (modelMetadata) {
diff --git a/src/platform/endpoint/common/autoChatEndpoint.ts b/src/platform/endpoint/common/autoChatEndpoint.ts
@@ -0,0 +1,86 @@
+/*---------------------------------------------------------------------------------------------
+ *  Copyright (c) Microsoft Corporation. All rights reserved.
+ *  Licensed under the MIT License. See License.txt in the project root for license information.
+ *--------------------------------------------------------------------------------------------*/
+
+import type { RequestMetadata } from '@vscode/copilot-api';
+import { ChatMessage } from '@vscode/prompt-tsx/dist/base/output/rawTypes';
+import type { CancellationToken } from 'vscode';
+import { ITokenizer, TokenizerType } from '../../../util/common/tokenizer';
+import { AsyncIterableObject } from '../../../util/vs/base/common/async';
+import { IntentParams, Source } from '../../chat/common/chatMLFetcher';
+import { ChatLocation, ChatResponse } from '../../chat/common/commonTypes';
+import { IEnvService } from '../../env/common/envService';
+import { ILogService } from '../../log/common/logService';
+import { FinishedCallback, OptionalChatRequestParams } from '../../networking/common/fetch';
+import { Response } from '../../networking/common/fetcherService';
+import { IChatEndpoint } from '../../networking/common/networking';
+import { ChatCompletion } from '../../networking/common/openai';
+import { IExperimentationService } from '../../telemetry/common/nullExperimentationService';
+import { ITelemetryService, TelemetryProperties } from '../../telemetry/common/telemetry';
+import { TelemetryData } from '../../telemetry/common/telemetryData';
+
+/**
+ * This endpoint represents the "Auto" model in the model picker.
+ * It wraps the concrete endpoint selected for the session: the capability fields are copied from
+ * the wrapped endpoint when the wrapper is constructed, `model` is always reported as
+ * `AutoChatEndpoint.id`, and the session token is added to the extra request headers.
+ */
+export class AutoChatEndpoint implements IChatEndpoint {
+	/** Model id under which this endpoint is exposed, regardless of which model is wrapped. */
+	public static readonly id = 'auto';
+	// Every field below except `model` and `showInModelPicker` is a copy of the wrapped endpoint's value.
+	maxOutputTokens: number = this._wrappedEndpoint.maxOutputTokens;
+	model: string = AutoChatEndpoint.id;
+	supportsToolCalls: boolean = this._wrappedEndpoint.supportsToolCalls;
+	supportsVision: boolean = this._wrappedEndpoint.supportsVision;
+	supportsPrediction: boolean = this._wrappedEndpoint.supportsPrediction;
+	showInModelPicker: boolean = true;
+	isPremium?: boolean | undefined = this._wrappedEndpoint.isPremium;
+	multiplier?: number | undefined = this._wrappedEndpoint.multiplier;
+	restrictedToSkus?: string[] | undefined = this._wrappedEndpoint.restrictedToSkus;
+	isDefault: boolean = this._wrappedEndpoint.isDefault;
+	isFallback: boolean = this._wrappedEndpoint.isFallback;
+	policy: 'enabled' | { terms: string } = this._wrappedEndpoint.policy;
+	urlOrRequestMetadata: string | RequestMetadata = this._wrappedEndpoint.urlOrRequestMetadata;
+	modelMaxPromptTokens: number = this._wrappedEndpoint.modelMaxPromptTokens;
+	name: string = this._wrappedEndpoint.name;
+	version: string = this._wrappedEndpoint.version;
+	family: string = this._wrappedEndpoint.family;
+	tokenizer: TokenizerType = this._wrappedEndpoint.tokenizer;
+
+	/**
+	 * @param _wrappedEndpoint The concrete endpoint that all work is delegated to
+	 * @param _sessionToken The value sent in the `Copilot-Session-Token` header
+	 */
+	constructor(
+		private readonly _wrappedEndpoint: IChatEndpoint,
+		private readonly _sessionToken: string
+	) { }
+
+	/**
+	 * Returns the wrapped endpoint's extra headers (when it provides any) plus the
+	 * `Copilot-Session-Token` header. The session token is spread last, so it wins on a key collision.
+	 */
+	getExtraHeaders(): Record<string, string> {
+		return {
+			...(this._wrappedEndpoint.getExtraHeaders?.() || {}),
+			'Copilot-Session-Token': this._sessionToken
+		};
+	}
+
+	/** Delegates response processing to the wrapped endpoint unchanged. */
+	processResponseFromChatEndpoint(telemetryService: ITelemetryService, logService: ILogService, response: Response, expectedNumChoices: number, finishCallback: FinishedCallback, telemetryData: TelemetryData, cancellationToken?: CancellationToken): Promise<AsyncIterableObject<ChatCompletion>> {
+		return this._wrappedEndpoint.processResponseFromChatEndpoint(telemetryService, logService, response, expectedNumChoices, finishCallback, telemetryData, cancellationToken);
+	}
+
+	/** Delegates policy acceptance to the wrapped endpoint. */
+	acceptChatPolicy(): Promise<boolean> {
+		return this._wrappedEndpoint.acceptChatPolicy();
+	}
+
+	/**
+	 * Clones this endpoint with a different prompt token budget.
+	 * @param modelMaxPromptTokens The token limit forwarded to the wrapped endpoint's clone
+	 * @returns A new auto endpoint wrapping the clone of the wrapped endpoint
+	 */
+	cloneWithTokenOverride(modelMaxPromptTokens: number): IChatEndpoint {
+		// Re-wrap the clone so it still identifies as the auto model and keeps the session token
+		// header; handing back the wrapped endpoint's clone directly would silently drop both.
+		return new AutoChatEndpoint(this._wrappedEndpoint.cloneWithTokenOverride(modelMaxPromptTokens), this._sessionToken);
+	}
+
+	/** Delegates tokenizer acquisition to the wrapped endpoint. */
+	acquireTokenizer(): ITokenizer {
+		return this._wrappedEndpoint.acquireTokenizer();
+	}
+
+	/** Forwards the chat request, with every argument unchanged, to the wrapped endpoint. */
+	async makeChatRequest(debugName: string, messages: ChatMessage[], finishedCb: FinishedCallback | undefined, token: CancellationToken, location: ChatLocation, source?: Source, requestOptions?: Omit<OptionalChatRequestParams, 'n'>, userInitiatedRequest?: boolean, telemetryProperties?: TelemetryProperties, intentParams?: IntentParams): Promise<ChatResponse> {
+		return this._wrappedEndpoint.makeChatRequest(debugName, messages, finishedCb, token, location, source, requestOptions, userInitiatedRequest, telemetryProperties, intentParams);
+	}
+}
+
+/**
+ * Determines whether the "Auto" model should be offered.
+ * @param expService Experimentation service queried for the `copilotchatcapiautomode` treatment variable
+ * @param envService Environment service whose `isPreRelease()` result is used when the treatment variable is not set
+ * @returns True when the treatment variable is truthy, otherwise whatever `isPreRelease()` reports
+ */
+export function isAutoModeEnabled(expService: IExperimentationService, envService: IEnvService): boolean {
+	const enabledByExperiment = expService.getTreatmentVariable<boolean>('vscode', 'copilotchatcapiautomode');
+	if (enabledByExperiment) {
+		return true;
+	}
+	return envService.isPreRelease();
+}
diff --git a/src/platform/endpoint/common/automodeService.ts b/src/platform/endpoint/common/automodeService.ts
@@ -0,0 +1,65 @@
+/*---------------------------------------------------------------------------------------------
+ *  Copyright (c) Microsoft Corporation. All rights reserved.
+ *  Licensed under the MIT License. See License.txt in the project root for license information.
+ *--------------------------------------------------------------------------------------------*/
+
+import { RequestType } from '@vscode/copilot-api';
+import { createServiceIdentifier } from '../../../util/common/services';
+import { IAuthenticationService } from '../../authentication/common/authentication';
+import { IChatEndpoint } from '../../networking/common/networking';
+import { AutoChatEndpoint } from './autoChatEndpoint';
+import { ICAPIClientService } from './capiClient';
+
+/**
+ * Shape that the JSON body of the auto-models response is cast to in `resolveAutoModeEndpoint`.
+ * The cast is unchecked: nothing in this file validates these fields at runtime.
+ */
+interface AutoModeAPIResponse {
+	/** Not read anywhere in this file. Presumably the model ids auto mode may choose from — TODO confirm. */
+	available_models: string[];
+	/** Compared against `IChatEndpoint.model` to pick which known endpoint gets wrapped. */
+	selected_model: string;
+	/** Passed to `AutoChatEndpoint` as its session token. */
+	session_token: string;
+}
+
+/** Service identifier under which implementations of the `IAutomodeService` interface are registered. */
+export const IAutomodeService = createServiceIdentifier<IAutomodeService>('IAutomodeService');
+
+/**
+ * Resolves the endpoint that backs the "Auto" model and exposes previously resolved
+ * endpoints by conversation id.
+ */
+export interface IAutomodeService {
+	readonly _serviceBrand: undefined;
+
+	/**
+	 * Returns the endpoint already resolved for the conversation, or `undefined` when none is stored.
+	 * @param conversationId The conversation to look up
+	 */
+	getCachedAutoEndpoint(conversationId: string): IChatEndpoint | undefined;
+
+	/**
+	 * Resolves the auto endpoint for the conversation.
+	 * @param conversationId The conversation the endpoint is resolved for
+	 * @param knownEndpoints The endpoints the selected model is looked up in
+	 * @returns A promise for the resolved endpoint
+	 */
+	resolveAutoModeEndpoint(conversationId: string, knownEndpoints: IChatEndpoint[]): Promise<IChatEndpoint>;
+}
+
+/**
+ * Resolves which known endpoint backs the "Auto" model by posting an auto-mode request through
+ * the CAPI client service, and remembers the result per conversation id.
+ */
+export class AutomodeService implements IAutomodeService {
+	readonly _serviceBrand: undefined;
+	/** Resolved auto endpoints keyed by conversation id. Nothing in this class removes entries. */
+	private readonly _autoModelCache: Map<string, IChatEndpoint> = new Map();
+
+	constructor(
+		@ICAPIClientService private readonly _capiClientService: ICAPIClientService,
+		@IAuthenticationService private readonly _authService: IAuthenticationService
+	) {
+		this._serviceBrand = undefined;
+	}
+
+	/**
+	 * Returns the endpoint previously resolved for the conversation, if any. Only reads the cache.
+	 * @param conversationId The conversation to look up
+	 */
+	getCachedAutoEndpoint(conversationId: string): IChatEndpoint | undefined {
+		return this._autoModelCache.get(conversationId);
+	}
+
+	/**
+	 * Resolves the auto endpoint for a conversation, reusing the cached one when present.
+	 * Otherwise it requests a model selection, wraps the matching known endpoint in an
+	 * `AutoChatEndpoint` carrying the returned session token, and caches the wrapper.
+	 * @param conversationId Cache key for the resolved endpoint
+	 * @param knownEndpoints Candidates the selected model is matched against; the first entry is the fallback
+	 * @returns The cached or newly resolved auto endpoint
+	 * @throws If nothing is cached and `knownEndpoints` is empty, since there is no endpoint to wrap
+	 */
+	async resolveAutoModeEndpoint(conversationId: string, knownEndpoints: IChatEndpoint[]): Promise<IChatEndpoint> {
+		const cachedEndpoint = this._autoModelCache.get(conversationId);
+		if (cachedEndpoint) {
+			return cachedEndpoint;
+		}
+		if (knownEndpoints.length === 0) {
+			// Fail before the network round trip: with no candidates `undefined` would be handed to
+			// AutoChatEndpoint, which fails with an opaque TypeError while copying its fields.
+			throw new Error('Cannot resolve the auto mode endpoint: no known chat endpoints were provided.');
+		}
+		const authToken = (await this._authService.getCopilotToken()).token;
+		const response = await this._capiClientService.makeRequest<Response>({
+			json: {
+				"auto_mode": { "model_hints": ["auto"] },
+			},
+			headers: {
+				'Content-Type': 'application/json',
+				'Authorization': `Bearer ${authToken}`
+			},
+			method: 'POST'
+		}, { type: RequestType.AutoModels });
+		// NOTE(review): the response status is not checked and the body is cast without validation,
+		// so an error payload would be cached as the fallback endpoint — confirm how failures should surface.
+		const data = await response.json() as AutoModeAPIResponse;
+		// Fall back to the first known endpoint when the selected model is not among the candidates.
+		const selectedModel = knownEndpoints.find(e => e.model === data.selected_model) ?? knownEndpoints[0];
+		const autoEndpoint = new AutoChatEndpoint(selectedModel, data.session_token);
+		this._autoModelCache.set(conversationId, autoEndpoint);
+		return autoEndpoint;
+	}
+}
diff --git a/src/platform/endpoint/node/autoChatEndpoint.ts b/src/platform/endpoint/node/autoChatEndpoint.ts
diff --git a/src/platform/test/node/services.ts b/src/platform/test/node/services.ts