[Inference] openai client snippet for "auto" provider (#1630)

krampstudio · web-flow · commit 3ba8dc7381bd · 2025-07-16T14:48:10.000+02:00
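<img width="919" height="713" alt="image" src="https://github.com/user-attachments/assets/14b093a9-e246-4ea3-84cb-c25d016c3700" /> Adds the `openai` Python client to the snippets offered for the "auto" provider policy, and defaults `endpointUrl` to `${HF_ROUTER_URL}/v1` when the provider is "auto" and no endpoint URL is supplied. (Also needed for the internal issue huggingface-internal/moon-landing#14421.)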
diff --git a/packages/inference/src/config.ts b/packages/inference/src/config.ts
@@ -1,3 +1,4 @@
 export const HF_HUB_URL = "https://huggingface.co";
 export const HF_ROUTER_URL = "https://router.huggingface.co";
+export const HF_ROUTER_AUTO_ENDPOINT = `${HF_ROUTER_URL}/v1`;
 export const HF_HEADER_X_BILL_TO = "X-HF-Bill-To";
diff --git a/packages/inference/src/snippets/getInferenceSnippets.ts b/packages/inference/src/snippets/getInferenceSnippets.ts
@@ -13,6 +13,7 @@ import { makeRequestOptionsFromResolvedModel } from "../lib/makeRequestOptions.j
 import type { InferenceProviderMappingEntry, InferenceProviderOrPolicy, InferenceTask, RequestArgs } from "../types.js";
 import { templates } from "./templates.exported.js";
 import { getLogger } from "../lib/logger.js";
+import { HF_ROUTER_AUTO_ENDPOINT } from "../config.js";
 
 export type InferenceSnippetOptions = {
 	streaming?: boolean;
@@ -37,7 +38,7 @@ const CLIENTS: Record<InferenceSnippetLanguage, Client[]> = {
 
 const CLIENTS_AUTO_POLICY: Partial<Record<InferenceSnippetLanguage, Client[]>> = {
 	js: ["huggingface.js"],
-	python: ["huggingface_hub"],
+	python: ["huggingface_hub", "openai"],
 };
 
 type InputPreparationFn = (model: ModelDataMinimal, opts?: Record<string, unknown>) => object;
@@ -179,7 +180,7 @@ const snippetGenerator = (templateName: string, inputPreparationFn?: InputPrepar
 			{
 				accessToken: accessTokenOrPlaceholder,
 				provider,
-				endpointUrl: opts?.endpointUrl,
+				endpointUrl: opts?.endpointUrl ?? (provider === "auto" ? HF_ROUTER_AUTO_ENDPOINT : undefined),
 				...inputs,
 			} as RequestArgs,
 			inferenceProviderMapping,