
Commit f931db2

Wauplin and SBrandeis authored
[draft] Support providerModelId in inference snippets (#1210)
Goal of this PR is to correctly handle model id mapping when generating inference snippets for a given provider. For now it's a simple PR to showcase what I had in mind in huggingface-internal/moon-landing#12626 (comment) (private repo). I only implemented it for the chat-completion curl snippet, but the rest would follow the same pattern.

Note that we should use the mapping only for curl, pure Python, pure JS, and openai client snippets. For the `huggingface.js` and `huggingface_hub` ones, the model id from the Hub should be used.

---

**Note:** orthogonal to this PR, but I realized that some URLs are also incorrect depending on the provider.

Co-authored-by: SBrandeis <[email protected]>
1 parent b9c2bb8 · commit f931db2

25 files changed: +526 −56 lines
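
The routing rule in the commit message lends itself to a small helper. The sketch below is hypothetical, not code from this PR: the `SnippetClient` type and `modelIdForSnippet` function are invented here to illustrate which model id each kind of snippet should embed.

// Hypothetical sketch, not part of this PR: decide which model id a snippet embeds.
type SnippetClient =
    | "curl"
    | "python"          // pure Python (e.g. requests)
    | "js"              // pure JS (e.g. fetch)
    | "openai"          // openai client pointed at the provider route
    | "huggingface.js"
    | "huggingface_hub";

function modelIdForSnippet(client: SnippetClient, hubModelId: string, providerModelId: string): string {
    // huggingface.js / huggingface_hub snippets keep the Hub model id;
    // the other clients call the provider directly and need its alias.
    return client === "huggingface.js" || client === "huggingface_hub" ? hubModelId : providerModelId;
}

// Example: modelIdForSnippet("curl", "meta-llama/Llama-3.1-8B-Instruct",
//   "<together alias for meta-llama/Llama-3.1-8B-Instruct>")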

packages/tasks-gen/scripts/generate-snippets-fixtures.ts

Lines changed: 6 additions & 5 deletions

@@ -52,7 +52,7 @@ const TEST_CASES: {
 			inference: "",
 		},
 		languages: ["sh", "js", "py"],
-		providers: ["hf-inference"],
+		providers: ["hf-inference", "together"],
 		opts: { streaming: true },
 	},
 	{
@@ -64,7 +64,7 @@
 			inference: "",
 		},
 		languages: ["sh", "js", "py"],
-		providers: ["hf-inference"],
+		providers: ["hf-inference", "fireworks-ai"],
 		opts: { streaming: false },
 	},
 	{
@@ -76,7 +76,7 @@
 			inference: "",
 		},
 		languages: ["sh", "js", "py"],
-		providers: ["hf-inference"],
+		providers: ["hf-inference", "fireworks-ai"],
 		opts: { streaming: true },
 	},
 	{
@@ -87,7 +87,7 @@
 			tags: [],
 			inference: "",
 		},
-		providers: ["hf-inference"],
+		providers: ["hf-inference", "fal-ai"],
 		languages: ["sh", "js", "py"],
 	},
 	{
@@ -133,7 +133,8 @@ function generateInferenceSnippet(
 	provider: SnippetInferenceProvider,
 	opts?: Record<string, unknown>
 ): InferenceSnippet[] {
-	return GET_SNIPPET_FN[language](model, "api_token", provider, opts);
+	const providerModelId = provider === "hf-inference" ? model.id : `<${provider} alias for ${model.id}>`;
+	return GET_SNIPPET_FN[language](model, "api_token", provider, providerModelId, opts);
 }

 async function getExpectedInferenceSnippet(
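
For orientation, here is a hedged sketch of the pattern the generator above exercises: a chat-completion curl snippet builder that receives the new `providerModelId` argument and embeds it in place of the Hub id. The name `snippetCurlChatCompletion` and the exact signature are illustrative assumptions, not the PR's actual code; the URL scheme simply mirrors the fixtures below.

// Illustrative sketch; name and signature are assumptions, not this PR's code.
interface ModelDataMinimal {
    id: string; // Hub model id, e.g. "meta-llama/Llama-3.1-8B-Instruct"
}

function snippetCurlChatCompletion(
    model: ModelDataMinimal,
    accessToken: string,
    provider: string,
    providerModelId: string,
    opts?: { streaming?: boolean }
): string {
    const body = {
        // Provider alias, not model.id (for hf-inference the caller passes
        // providerModelId === model.id, so both cases collapse into one path).
        model: providerModelId,
        messages: [{ role: "user", content: "What is the capital of France?" }],
        max_tokens: 500,
        stream: opts?.streaming ?? false,
    };
    return [
        `curl 'https://router.huggingface.co/${provider}/v1/chat/completions' \\`,
        `    -H 'Authorization: Bearer ${accessToken}' \\`,
        `    -H 'Content-Type: application/json' \\`,
        `    --data '${JSON.stringify(body, null, 4)}'`,
    ].join("\n");
}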

packages/tasks-gen/snippets-fixtures/conversational-llm-non-stream/0.curl.together.sh

Lines changed: 1 addition & 1 deletion

@@ -2,7 +2,7 @@ curl 'https://router.huggingface.co/together/v1/chat/completions' \
     -H 'Authorization: Bearer api_token' \
     -H 'Content-Type: application/json' \
     --data '{
-        "model": "meta-llama/Llama-3.1-8B-Instruct",
+        "model": "<together alias for meta-llama/Llama-3.1-8B-Instruct>",
         "messages": [
             {
                 "role": "user",

packages/tasks-gen/snippets-fixtures/conversational-llm-non-stream/1.openai.together.js

Lines changed: 1 addition & 1 deletion

@@ -6,7 +6,7 @@ const client = new OpenAI({
 });

 const chatCompletion = await client.chat.completions.create({
-    model: "meta-llama/Llama-3.1-8B-Instruct",
+    model: "<together alias for meta-llama/Llama-3.1-8B-Instruct>",
     messages: [
         {
             role: "user",

packages/tasks-gen/snippets-fixtures/conversational-llm-non-stream/1.openai.together.py

Lines changed: 1 addition & 1 deletion

@@ -13,7 +13,7 @@
 ]

 completion = client.chat.completions.create(
-    model="meta-llama/Llama-3.1-8B-Instruct",
+    model="<together alias for meta-llama/Llama-3.1-8B-Instruct>",
     messages=messages,
     max_tokens=500,
 )

Lines changed: 14 additions & 0 deletions

@@ -0,0 +1,14 @@
+curl 'https://router.huggingface.co/together/v1/chat/completions' \
+    -H 'Authorization: Bearer api_token' \
+    -H 'Content-Type: application/json' \
+    --data '{
+        "model": "<together alias for meta-llama/Llama-3.1-8B-Instruct>",
+        "messages": [
+            {
+                "role": "user",
+                "content": "What is the capital of France?"
+            }
+        ],
+        "max_tokens": 500,
+        "stream": true
+    }'

Lines changed: 25 additions & 0 deletions

@@ -0,0 +1,25 @@
+import { HfInference } from "@huggingface/inference";
+
+const client = new HfInference("api_token");
+
+let out = "";
+
+const stream = client.chatCompletionStream({
+    model: "meta-llama/Llama-3.1-8B-Instruct",
+    messages: [
+        {
+            role: "user",
+            content: "What is the capital of France?"
+        }
+    ],
+    provider: "together",
+    max_tokens: 500,
+});
+
+for await (const chunk of stream) {
+    if (chunk.choices && chunk.choices.length > 0) {
+        const newContent = chunk.choices[0].delta.content;
+        out += newContent;
+        console.log(newContent);
+    }
+}

Lines changed: 23 additions & 0 deletions

@@ -0,0 +1,23 @@
+from huggingface_hub import InferenceClient
+
+client = InferenceClient(
+    provider="together",
+    api_key="api_token"
+)
+
+messages = [
+    {
+        "role": "user",
+        "content": "What is the capital of France?"
+    }
+]
+
+stream = client.chat.completions.create(
+    model="meta-llama/Llama-3.1-8B-Instruct",
+    messages=messages,
+    max_tokens=500,
+    stream=True
+)
+
+for chunk in stream:
+    print(chunk.choices[0].delta.content, end="")

Lines changed: 28 additions & 0 deletions

@@ -0,0 +1,28 @@
+import { OpenAI } from "openai";
+
+const client = new OpenAI({
+    baseURL: "https://router.huggingface.co/together",
+    apiKey: "api_token"
+});
+
+let out = "";
+
+const stream = await client.chat.completions.create({
+    model: "<together alias for meta-llama/Llama-3.1-8B-Instruct>",
+    messages: [
+        {
+            role: "user",
+            content: "What is the capital of France?"
+        }
+    ],
+    max_tokens: 500,
+    stream: true,
+});
+
+for await (const chunk of stream) {
+    if (chunk.choices && chunk.choices.length > 0) {
+        const newContent = chunk.choices[0].delta.content;
+        out += newContent;
+        console.log(newContent);
+    }
+}

Lines changed: 23 additions & 0 deletions

@@ -0,0 +1,23 @@
+from openai import OpenAI
+
+client = OpenAI(
+    base_url="https://router.huggingface.co/together",
+    api_key="api_token"
+)
+
+messages = [
+    {
+        "role": "user",
+        "content": "What is the capital of France?"
+    }
+]
+
+stream = client.chat.completions.create(
+    model="<together alias for meta-llama/Llama-3.1-8B-Instruct>",
+    messages=messages,
+    max_tokens=500,
+    stream=True
+)
+
+for chunk in stream:
+    print(chunk.choices[0].delta.content, end="")

Lines changed: 25 additions & 0 deletions

@@ -0,0 +1,25 @@
+curl 'https://router.huggingface.co/fireworks-ai/v1/chat/completions' \
+    -H 'Authorization: Bearer api_token' \
+    -H 'Content-Type: application/json' \
+    --data '{
+        "model": "<fireworks-ai alias for meta-llama/Llama-3.2-11B-Vision-Instruct>",
+        "messages": [
+            {
+                "role": "user",
+                "content": [
+                    {
+                        "type": "text",
+                        "text": "Describe this image in one sentence."
+                    },
+                    {
+                        "type": "image_url",
+                        "image_url": {
+                            "url": "https://cdn.britannica.com/61/93061-050-99147DCE/Statue-of-Liberty-Island-New-York-Bay.jpg"
+                        }
+                    }
+                ]
+            }
+        ],
+        "max_tokens": 500,
+        "stream": false
+    }'
