cosmocode
diff --git a/‎Model/Anthropic/models.json‎
Lines changed: 38 additions & 10 deletions b/‎Model/Anthropic/models.json‎
Lines changed: 38 additions & 10 deletions
diff --git a/‎Model/Groq/models.json‎
Lines changed: 12 additions & 12 deletions b/‎Model/Groq/models.json‎
Lines changed: 12 additions & 12 deletions
diff --git a/‎Model/Mistral/models.json‎
Lines changed: 66 additions & 17 deletions b/‎Model/Mistral/models.json‎
Lines changed: 66 additions & 17 deletions
diff --git a/‎Model/OpenAI/models.json‎
Lines changed: 41 additions & 14 deletions b/‎Model/OpenAI/models.json‎
Lines changed: 41 additions & 14 deletions
diff --git a/‎Model/Reka/models.json‎
Lines changed: 5 additions & 5 deletions b/‎Model/Reka/models.json‎
Lines changed: 5 additions & 5 deletions
@@ -2,31 +2,59 @@
     "chat": {
         "claude-3-opus-20240229": {
             "description": "Most powerful model for highly complex tasks. Top-level performance, intelligence, fluency, and understanding.",
-            "inputTokens": 150000,
-            "inputTokenPrice": 15.00,
+            "inputTokens": 200000,
+            "inputTokenPrice": 15,
             "outputTokens": 4096,
-            "outputTokenPrice": 75.00
+            "outputTokenPrice": 75
         },
         "claude-3-5-sonnet-20240620": {
             "description": "Most intelligent model",
             "inputTokens": 200000,
-            "inputTokenPrice": 3.00,
+            "inputTokenPrice": 3,
             "outputTokens": 4096,
-            "outputTokenPrice": 15.00
+            "outputTokenPrice": 15
         },
         "claude-3-sonnet-20240229": {
             "description": "Ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.",
-            "inputTokens": 150000,
-            "inputTokenPrice": 3.00,
+            "inputTokens": 200000,
+            "inputTokenPrice": 3,
             "outputTokens": 4096,
-            "outputTokenPrice": 15.00
+            "outputTokenPrice": 15
         },
         "claude-3-haiku-20240307": {
             "description": "Fastest and most compact model for near-instant responsiveness. Quick and accurate targeted performance.",
-            "inputTokens": 150000,
+            "inputTokens": 200000,
             "inputTokenPrice": 0.25,
             "outputTokens": 4096,
             "outputTokenPrice": 1.25
+        },
+        "claude-instant-1": {
+            "description": "",
+            "inputTokens": 100000,
+            "inputTokenPrice": 1.63,
+            "outputTokens": 8191,
+            "outputTokenPrice": 5.51
+        },
+        "claude-instant-1.2": {
+            "description": "",
+            "inputTokens": 100000,
+            "inputTokenPrice": 0.16,
+            "outputTokens": 8191,
+            "outputTokenPrice": 0.55
+        },
+        "claude-2": {
+            "description": "",
+            "inputTokens": 100000,
+            "inputTokenPrice": 8,
+            "outputTokens": 8191,
+            "outputTokenPrice": 24
+        },
+        "claude-2.1": {
+            "description": "",
+            "inputTokens": 200000,
+            "inputTokenPrice": 8,
+            "outputTokens": 8191,
+            "outputTokenPrice": 24
         }
     }
-}
+}
@@ -3,37 +3,37 @@
         "llama3-8b-8192": {
             "description": "LLaMA3 8b",
             "inputTokens": 8192,
-            "inputTokenPrice": 0,
+            "inputTokenPrice": 0.05,
             "outputTokens": 8192,
-            "outputTokenPrice": 0
+            "outputTokenPrice": 0.08
         },
         "llama3-70b-8192": {
             "description": "LLaMA3 70b",
             "inputTokens": 8192,
-            "inputTokenPrice": 0,
+            "inputTokenPrice": 0.59,
             "outputTokens": 8192,
-            "outputTokenPrice": 0
+            "outputTokenPrice": 0.79
         },
         "llama2-70b-4096": {
             "description": "LLaMA2 70b",
             "inputTokens": 4096,
-            "inputTokenPrice": 0,
+            "inputTokenPrice": 0.7,
             "outputTokens": 4096,
-            "outputTokenPrice": 0
+            "outputTokenPrice": 0.8
         },
         "mixtral-8x7b-32768": {
             "description": "Mixtral 8x7b",
             "inputTokens": 32768,
-            "inputTokenPrice": 0,
+            "inputTokenPrice": 0.24,
             "outputTokens": 32768,
-            "outputTokenPrice": 0
+            "outputTokenPrice": 0.24
         },
         "gemma-7b-it": {
             "description": "Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models. They are text-to-text, decoder-only large language models, available in English, with open weights, pre-trained variants, and instruction-tuned variants. Gemma models are well-suited for a variety of text generation tasks, including question answering, summarization, and reasoning. Their relatively small size makes it possible to deploy them in environments with limited resources such as a laptop, desktop or your own cloud infrastructure, democratizing access to state of the art AI models and helping foster innovation for everyone.",
             "inputTokens": 8192,
-            "inputTokenPrice": 0,
-            "outputTokens": 8182,
-            "outputTokenPrice": 0
+            "inputTokenPrice": 0.07,
+            "outputTokens": 8192,
+            "outputTokenPrice": 0.07
         }
     }
-}
+}
@@ -4,51 +4,100 @@
             "description": "Our very first. A 7B transformer model, fast-deployed and easily customisable. Small, yet very powerful for a variety of use cases. English and code.",
             "inputTokens": 32000,
             "inputTokenPrice": 0.25,
-            "outputTokens": 4096,
+            "outputTokens": 8191,
             "outputTokenPrice": 0.25
         },
         "open-mixtral-8x7b": {
             "description": "A 7B sparse Mixture-of-Experts (SMoE). Uses 12B active parameters out of 45B total. Fluent in English, French, Italian, German, Spanish, and strong in code.",
             "inputTokens": 32000,
             "inputTokenPrice": 0.7,
-            "outputTokens": 4096,
+            "outputTokens": 8191,
             "outputTokenPrice": 0.7
         },
         "open-mixtral-8x22b": {
             "description": "A 22B sparse Mixture-of-Experts (SMoE). Uses only 39B active parameters out of 141B. Fluent in English, French, Italian, German, Spanish, and strong in code.",
             "inputTokens": 64000,
-            "inputTokenPrice": 2.0,
-            "outputTokens": 4096,
-            "outputTokenPrice": 6.0
+            "inputTokenPrice": 2,
+            "outputTokens": 8191,
+            "outputTokenPrice": 6
         },
         "mistral-small-latest": {
             "description": "Cost-efficient reasoning for low-latency workloads. Fluent in English, French, Italian, German, Spanish, and strong in code.",
             "inputTokens": 32000,
-            "inputTokenPrice": 2.00,
-            "outputTokens": 4096,
-            "outputTokenPrice": 6.00
+            "inputTokenPrice": 1,
+            "outputTokens": 8191,
+            "outputTokenPrice": 3
         },
         "mistral-medium-latest": {
             "description": "Balanced reasoning for a wide range of tasks. Fluent in English, French, Italian, German, Spanish, and strong in code.",
             "inputTokens": 32000,
-            "inputTokenPrice": 2.70,
-            "outputTokens": 4096,
-            "outputTokenPrice": 8.10
+            "inputTokenPrice": 2.7,
+            "outputTokens": 8191,
+            "outputTokenPrice": 8.1
         },
         "mistral-large-latest": {
             "description": "Top-tier reasoning for high-complexity tasks. Fluent in English, French, Italian, German, Spanish, and strong in code.",
             "inputTokens": 32000,
-            "inputTokenPrice": 8.00,
-            "outputTokens": 4096,
-            "outputTokenPrice": 24.00
+            "inputTokenPrice": 4,
+            "outputTokens": 8191,
+            "outputTokenPrice": 12
+        },
+        "mistral-tiny": {
+            "description": "",
+            "inputTokens": 32000,
+            "inputTokenPrice": 0.25,
+            "outputTokens": 8191,
+            "outputTokenPrice": 0.25
+        },
+        "mistral-small": {
+            "description": "",
+            "inputTokens": 32000,
+            "inputTokenPrice": 1,
+            "outputTokens": 8191,
+            "outputTokenPrice": 3
+        },
+        "mistral-medium": {
+            "description": "",
+            "inputTokens": 32000,
+            "inputTokenPrice": 2.7,
+            "outputTokens": 8191,
+            "outputTokenPrice": 8.1
+        },
+        "codestral-latest": {
+            "description": "",
+            "inputTokens": 32000,
+            "inputTokenPrice": 1,
+            "outputTokens": 8191,
+            "outputTokenPrice": 3
+        },
+        "open-mistral-nemo": {
+            "description": "https:\/\/mistral.ai\/technology\/",
+            "inputTokens": 128000,
+            "inputTokenPrice": 0.3,
+            "outputTokens": 128000,
+            "outputTokenPrice": 0.3
+        },
+        "open-codestral-mamba": {
+            "description": "https:\/\/mistral.ai\/technology\/",
+            "inputTokens": 256000,
+            "inputTokenPrice": 0.25,
+            "outputTokens": 256000,
+            "outputTokenPrice": 0.25
+        },
+        "codestral-mamba-latest": {
+            "description": "https:\/\/mistral.ai\/technology\/",
+            "inputTokens": 256000,
+            "inputTokenPrice": 0.25,
+            "outputTokens": 256000,
+            "outputTokenPrice": 0.25
         }
     },
     "embedding": {
         "mistral-embed": {
             "description": "State-of-the-art semantic for extracting representation of text extracts. English only for now.",
-            "inputTokenPrice": 0.10,
-            "inputTokens": 4096,
+            "inputTokens": 8192,
+            "inputTokenPrice": 0.1,
             "dimensions": 1024
         }
     }
-}
+}
@@ -3,50 +3,77 @@
         "gpt-3.5-turbo": {
             "description": "GPT-3.5 Turbo is a variant of GPT-3.5 that is optimized for speed and can generate responses in a fraction of the time.",
             "inputTokens": 16385,
-            "inputTokenPrice": 0.50,
+            "inputTokenPrice": 1.5,
             "outputTokens": 4096,
-            "outputTokenPrice": 1.50
+            "outputTokenPrice": 2
         },
         "gpt-4": {
             "description": "GPT-4 is the latest version of OpenAI's Generative Pre-trained Transformer (GPT) language model. It is capable of generating human-like text and can be used for a wide range of natural language processing tasks.",
-            "inputTokens": 81924,
-            "inputTokenPrice": 30.00,
+            "inputTokens": 8192,
+            "inputTokenPrice": 30,
             "outputTokens": 4096,
-            "outputTokenPrice": 60.00
+            "outputTokenPrice": 60
         },
         "gpt-4-turbo": {
             "description": "GPT-4 Turbo is a variant of GPT-4 that is optimized for speed and can generate responses in a fraction of the time.",
             "inputTokens": 128000,
-            "inputTokenPrice": 10.00,
+            "inputTokenPrice": 10,
             "outputTokens": 4096,
-            "outputTokenPrice": 30.00
+            "outputTokenPrice": 30
         },
         "gpt-4o": {
             "description": "GPT-4o has the same high intelligence as GPT-4 Turbo but is much more efficient",
             "inputTokens": 128000,
-            "inputTokenPrice": 5.00,
+            "inputTokenPrice": 5,
+            "outputTokens": 4096,
+            "outputTokenPrice": 15
+        },
+        "gpt-4o-mini": {
+            "description": "",
+            "inputTokens": 128000,
+            "inputTokenPrice": 0.15,
+            "outputTokens": 4096,
+            "outputTokenPrice": 0.6
+        },
+        "gpt-4-32k": {
+            "description": "",
+            "inputTokens": 32768,
+            "inputTokenPrice": 60,
+            "outputTokens": 4096,
+            "outputTokenPrice": 120
+        },
+        "gpt-3.5-turbo-16k": {
+            "description": "",
+            "inputTokens": 16385,
+            "inputTokenPrice": 3,
             "outputTokens": 4096,
-            "outputTokenPrice": 15.00
+            "outputTokenPrice": 4
         }
     },
     "embedding": {
         "text-embedding-ada-002": {
             "description": "Most capable 2nd generation embedding model",
-            "inputTokens": 8192,
-            "inputTokenPrice": 0.10,
+            "inputTokens": 8191,
+            "inputTokenPrice": 0.1,
             "dimensions": 1536
         },
         "text-embedding-3-small": {
             "description": "Increased performance over 2nd generation ada embedding model",
-            "inputTokens": 8192,
+            "inputTokens": 8191,
             "inputTokenPrice": 0.02,
             "dimensions": 1536
         },
         "text-embedding-3-large": {
             "description": "Most capable embedding model for both english and non-english tasks",
-            "inputTokens": 8192,
+            "inputTokens": 8191,
             "inputTokenPrice": 0.13,
             "dimensions": 3072
+        },
+        "text-embedding-ada-002-v2": {
+            "description": "",
+            "inputTokens": 8191,
+            "inputTokenPrice": 0.1,
+            "dimensions": 1536
         }
     }
-}
+}
@@ -5,21 +5,21 @@
             "inputTokens": 128000,
             "inputTokenPrice": 0.8,
             "outputTokens": 8192,
-            "outputTokenPrice": 2.0
+            "outputTokenPrice": 2
         },
         "reka-edge": {
             "description": "Lightweight model for local (i.e., on-hardware) or latency sensitive applications",
             "inputTokens": 64000,
             "inputTokenPrice": 0.4,
             "outputTokens": 8192,
-            "outputTokenPrice": 1.0
+            "outputTokenPrice": 1
         },
         "reka-core": {
             "description": "Superior capabilities for complex tasks",
             "inputTokens": 128000,
-            "inputTokenPrice": 10.0,
+            "inputTokenPrice": 10,
             "outputTokens": 8192,
-            "outputTokenPrice": 25.0
+            "outputTokenPrice": 25
         }
     }
-}
+}