From 346734e96792f4bf1d284fe0ce1a118614aeb1e5 Mon Sep 17 00:00:00 2001 From: daisyfaithauma Date: Tue, 4 Feb 2025 15:24:55 +0000 Subject: [PATCH 1/4] Cerebras provider --- .../docs/ai-gateway/providers/cerebras.mdx | 61 +++++++++++++++++++ 1 file changed, 61 insertions(+) create mode 100644 src/content/docs/ai-gateway/providers/cerebras.mdx diff --git a/src/content/docs/ai-gateway/providers/cerebras.mdx b/src/content/docs/ai-gateway/providers/cerebras.mdx new file mode 100644 index 000000000000000..f897f50c6add5bf --- /dev/null +++ b/src/content/docs/ai-gateway/providers/cerebras.mdx @@ -0,0 +1,61 @@ +--- +title: Cerebras +pcx_content_type: get-started +--- + +[Cerebras](https://inference-docs.cerebras.ai/) offers developers a low-latency solution for AI model inference. + +## Endpoint + +```txt +https://gateway.ai.cloudflare.com/v1/{account_id}/{gateway_id}/cerebras-ai +``` + +## Prerequisites + +When making requests to Cerebras, ensure you have the following: + +- Your AI Gateway Account ID. +- Your AI Gateway gateway name. +- An active Cerebras API token. +- The name of the Cerebras model you want to use. + +## Examples + +### cURL + +```bash title="Example fetch request" +curl -X POST https://gateway.ai.cloudflare.com/v1/ACCOUNT_TAG/GATEWAY/cerebras/chat/completions \ + --header 'content-type: application/json' \ + --header 'Authorization: Bearer CEREBRAS_TOKEN' \ + --data '{ + "model": "llama3.1-8b", + "messages": [ + { + "role": "user", + "content": "What is Cloudflare?" + } + ] +}' +``` + +### Use Cerebras through Cerebras Cloud SDK with JavaScript + +```js title="JavaScript" +import Cerebras from "@cerebras/cerebras_cloud_sdk"; + +const client = new Cerebras({ + apiKey: process.env["CEREBRAS_API_KEY"], // This is the default and can be omitted +}); + +async function main() { + const completionCreateResponse = await client.chat.completions.create({ + messages: [{ role: "user", content: "Why is fast inference important?" }], + model: "llama3.1-8b", + }); + + console.log(completionCreateResponse); +} + +main(); +``` From 9f5abc06bbfba8547d9711b524de50400523f1d0 Mon Sep 17 00:00:00 2001 From: daisyfaithauma Date: Tue, 4 Feb 2025 17:00:51 +0000 Subject: [PATCH 2/4] removed example --- .../docs/ai-gateway/providers/cerebras.mdx | 21 ------------------- 1 file changed, 21 deletions(-) diff --git a/src/content/docs/ai-gateway/providers/cerebras.mdx b/src/content/docs/ai-gateway/providers/cerebras.mdx index f897f50c6add5bf..50a729bc21f0286 100644 --- a/src/content/docs/ai-gateway/providers/cerebras.mdx +++ b/src/content/docs/ai-gateway/providers/cerebras.mdx @@ -38,24 +38,3 @@ curl -X POST https://gateway.ai.cloudflare.com/v1/ACCOUNT_TAG/GATEWAY/cerebras/c ] }' ``` - -### Use Cerebras through Cerebras Cloud SDK with JavaScript - -```js title="JavaScript" -import Cerebras from "@cerebras/cerebras_cloud_sdk"; - -const client = new Cerebras({ - apiKey: process.env["CEREBRAS_API_KEY"], // This is the default and can be omitted -}); - -async function main() { - const completionCreateResponse = await client.chat.completions.create({ - messages: [{ role: "user", content: "Why is fast inference important?" }], - model: "llama3.1-8b", - }); - - console.log(completionCreateResponse); -} - -main(); -``` From f508f4a887263e242c8a91082b492885b21a2b18 Mon Sep 17 00:00:00 2001 From: daisyfaithauma Date: Wed, 5 Feb 2025 16:00:59 +0000 Subject: [PATCH 3/4] Update cerebras.mdx --- src/content/docs/ai-gateway/providers/cerebras.mdx | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/content/docs/ai-gateway/providers/cerebras.mdx b/src/content/docs/ai-gateway/providers/cerebras.mdx index 50a729bc21f0286..9fa4c492988ddc7 100644 --- a/src/content/docs/ai-gateway/providers/cerebras.mdx +++ b/src/content/docs/ai-gateway/providers/cerebras.mdx @@ -25,7 +25,7 @@ When making requests to Cerebras, ensure you have the following: ### cURL ```bash title="Example fetch request" -curl -X POST https://gateway.ai.cloudflare.com/v1/ACCOUNT_TAG/GATEWAY/cerebras/chat/completions \ +curl https://gateway.ai.cloudflare.com/v1/ACCOUNT_TAG/GATEWAY/cerebras/chat/completions \ --header 'content-type: application/json' \ --header 'Authorization: Bearer CEREBRAS_TOKEN' \ --data '{ From 9e6863690db8ac8c4f685f35d700201a820103df Mon Sep 17 00:00:00 2001 From: daisyfaithauma Date: Wed, 5 Feb 2025 16:49:42 +0000 Subject: [PATCH 4/4] Update cerebras.mdx Beta label --- src/content/docs/ai-gateway/providers/cerebras.mdx | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/content/docs/ai-gateway/providers/cerebras.mdx b/src/content/docs/ai-gateway/providers/cerebras.mdx index 9fa4c492988ddc7..6a6554cb34e8499 100644 --- a/src/content/docs/ai-gateway/providers/cerebras.mdx +++ b/src/content/docs/ai-gateway/providers/cerebras.mdx @@ -1,6 +1,9 @@ --- title: Cerebras pcx_content_type: get-started +sidebar: + badge: + text: Beta --- [Cerebras](https://inference-docs.cerebras.ai/) offers developers a low-latency solution for AI model inference.