|
22 | 22 | "\n",
|
23 | 23 | "| Encoding name | OpenAI models |\n",
|
24 | 24 | "|-------------------------|-----------------------------------------------------|\n",
|
| 25 | + "| `o200k_base` | `gpt-4o`, `gpt-4o-mini` |\n", |
25 | 26 | "| `cl100k_base` | `gpt-4`, `gpt-3.5-turbo`, `text-embedding-ada-002`, `text-embedding-3-small`, `text-embedding-3-large` |\n",
|
26 | 27 | "| `p50k_base` | Codex models, `text-davinci-002`, `text-davinci-003`|\n",
|
27 | 28 | "| `r50k_base` (or `gpt2`) | GPT-3 models like `davinci` |\n",
|
28 | 29 | "\n",
|
29 | 30 | "You can retrieve the encoding for a model using `tiktoken.encoding_for_model()` as follows:\n",
|
30 | 31 | "```python\n",
|
31 |
| - "encoding = tiktoken.encoding_for_model('gpt-3.5-turbo')\n", |
| 32 | + "encoding = tiktoken.encoding_for_model('gpt-4o-mini')\n", |
32 | 33 | "```\n",
|
33 | 34 | "\n",
|
34 | 35 | "Note that `p50k_base` overlaps substantially with `r50k_base`, and for non-code applications, they will usually give the same tokens.\n",
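| | + "\n", |
| | + "As a quick sanity check of that overlap (a minimal sketch; the sample string is arbitrary), you can compare the two encodings directly:\n", |
| | + "```python\n", |
| | + "import tiktoken\n", |
| | + "\n", |
| | + "# encode the same plain-English text with both encodings\n", |
| | + "r50k = tiktoken.get_encoding(\"r50k_base\")\n", |
| | + "p50k = tiktoken.get_encoding(\"p50k_base\")\n", |
| | + "text = \"How are you today?\"\n", |
| | + "print(r50k.encode(text) == p50k.encode(text))  # usually True for non-code text\n", |
| | + "```\n", |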
|
|
71 | 72 | },
|
72 | 73 | {
|
73 | 74 | "cell_type": "code",
|
74 |
| - "execution_count": null, |
| 75 | + "execution_count": 1, |
75 | 76 | "metadata": {},
|
76 |
| - "outputs": [], |
| 77 | + "outputs": [ |
| 78 | + { |
| 79 | + "name": "stdout", |
| 80 | + "output_type": "stream", |
| 81 | + "text": [ |
| 82 | + "\n", |
| 83 | + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.0\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.2\u001b[0m\n", |
| 84 | + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpython3 -m pip install --upgrade pip\u001b[0m\n", |
| 85 | + "Note: you may need to restart the kernel to use updated packages.\n", |
| 86 | + "\n", |
| 87 | + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.0\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.2\u001b[0m\n", |
| 88 | + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpython3 -m pip install --upgrade pip\u001b[0m\n", |
| 89 | + "Note: you may need to restart the kernel to use updated packages.\n" |
| 90 | + ] |
| 91 | + } |
| 92 | + ], |
77 | 93 | "source": [
|
78 |
| - "%pip install --upgrade tiktoken\n", |
79 |
| - "%pip install --upgrade openai" |
| 94 | + "%pip install --upgrade tiktoken -q\n", |
| 95 | + "%pip install --upgrade openai -q" |
80 | 96 | ]
|
81 | 97 | },
|
82 | 98 | {
|
|
89 | 105 | },
|
90 | 106 | {
|
91 | 107 | "cell_type": "code",
|
92 |
| - "execution_count": 1, |
| 108 | + "execution_count": 2, |
93 | 109 | "metadata": {},
|
94 | 110 | "outputs": [],
|
95 | 111 | "source": [
|
|
131 | 147 | "metadata": {},
|
132 | 148 | "outputs": [],
|
133 | 149 | "source": [
|
134 |
| - "encoding = tiktoken.encoding_for_model(\"gpt-3.5-turbo\")" |
| 150 | + "encoding = tiktoken.encoding_for_model(\"gpt-4o-mini\")" |
135 | 151 | ]
|
136 | 152 | },
|
137 | 153 | {
|
|
159 | 175 | {
|
160 | 176 | "data": {
|
161 | 177 | "text/plain": [
|
162 |
| - "[83, 1609, 5963, 374, 2294, 0]" |
| 178 | + "[83, 8251, 2488, 382, 2212, 0]" |
163 | 179 | ]
|
164 | 180 | },
|
165 | 181 | "execution_count": 5,
|
|
236 | 252 | {
|
237 | 253 | "data": {
|
238 | 254 | "text/plain": [
|
239 | 255 | "'tiktoken is great!'"
240 | 256 | ]
|
241 | 257 | },
|
242 | 258 | "execution_count": 8,
|
|
272 | 288 | {
|
273 | 289 | "data": {
|
274 | 290 | "text/plain": [
|
275 | 291 | "[b't', b'ik', b'token', b' is', b' great', b'!']"
276 | 292 | ]
|
277 | 293 | },
|
278 | 294 | "execution_count": 9,
|
|
313 | 329 | " # print the example string\n",
|
314 | 330 | " print(f'\\nExample string: \"{example_string}\"')\n",
|
315 | 331 | " # for each encoding, print the # of tokens, the token integers, and the token bytes\n",
|
316 |
| - " for encoding_name in [\"r50k_base\", \"p50k_base\", \"cl100k_base\"]:\n", |
| 332 | + " for encoding_name in [\"r50k_base\", \"p50k_base\", \"cl100k_base\", \"o200k_base\"]:\n", |
317 | 333 | " encoding = tiktoken.get_encoding(encoding_name)\n",
|
318 | 334 | " token_integers = encoding.encode(example_string)\n",
|
319 | 335 | " num_tokens = len(token_integers)\n",
|
|
347 | 363 | "\n",
|
348 | 364 | "cl100k_base: 6 tokens\n",
|
349 | 365 | "token integers: [519, 85342, 34500, 479, 8997, 2191]\n",
|
350 |
| - "token bytes: [b'ant', b'idis', b'establish', b'ment', b'arian', b'ism']\n" |
| 366 | + "token bytes: [b'ant', b'idis', b'establish', b'ment', b'arian', b'ism']\n", |
| 367 | + "\n", |
| 368 | + "o200k_base: 6 tokens\n", |
| 369 | + "token integers: [493, 129901, 376, 160388, 21203, 2367]\n", |
| 370 | + "token bytes: [b'ant', b'idis', b'est', b'ablishment', b'arian', b'ism']\n" |
351 | 371 | ]
|
352 | 372 | }
|
353 | 373 | ],
|
|
377 | 397 | "\n",
|
378 | 398 | "cl100k_base: 7 tokens\n",
|
379 | 399 | "token integers: [17, 489, 220, 17, 284, 220, 19]\n",
|
| 400 | + "token bytes: [b'2', b' +', b' ', b'2', b' =', b' ', b'4']\n", |
| 401 | + "\n", |
| 402 | + "o200k_base: 7 tokens\n", |
| 403 | + "token integers: [17, 659, 220, 17, 314, 220, 19]\n", |
380 | 404 | "token bytes: [b'2', b' +', b' ', b'2', b' =', b' ', b'4']\n"
|
381 | 405 | ]
|
382 | 406 | }
|
|
407 | 431 | "\n",
|
408 | 432 | "cl100k_base: 9 tokens\n",
|
409 | 433 | "token integers: [33334, 45918, 243, 21990, 9080, 33334, 62004, 16556, 78699]\n",
|
410 |
| - "token bytes: [b'\\xe3\\x81\\x8a', b'\\xe8\\xaa', b'\\x95', b'\\xe7\\x94\\x9f', b'\\xe6\\x97\\xa5', b'\\xe3\\x81\\x8a', b'\\xe3\\x82\\x81', b'\\xe3\\x81\\xa7', b'\\xe3\\x81\\xa8\\xe3\\x81\\x86']\n" |
| 434 | + "token bytes: [b'\\xe3\\x81\\x8a', b'\\xe8\\xaa', b'\\x95', b'\\xe7\\x94\\x9f', b'\\xe6\\x97\\xa5', b'\\xe3\\x81\\x8a', b'\\xe3\\x82\\x81', b'\\xe3\\x81\\xa7', b'\\xe3\\x81\\xa8\\xe3\\x81\\x86']\n", |
| 435 | + "\n", |
| 436 | + "o200k_base: 8 tokens\n", |
| 437 | + "token integers: [8930, 9697, 243, 128225, 8930, 17693, 4344, 48669]\n", |
| 438 | + "token bytes: [b'\\xe3\\x81\\x8a', b'\\xe8\\xaa', b'\\x95', b'\\xe7\\x94\\x9f\\xe6\\x97\\xa5', b'\\xe3\\x81\\x8a', b'\\xe3\\x82\\x81', b'\\xe3\\x81\\xa7', b'\\xe3\\x81\\xa8\\xe3\\x81\\x86']\n" |
411 | 439 | ]
|
412 | 440 | }
|
413 | 441 | ],
|
|
433 | 461 | },
|
434 | 462 | {
|
435 | 463 | "cell_type": "code",
|
436 |
| - "execution_count": 2, |
| 464 | + "execution_count": 14, |
437 | 465 | "metadata": {},
|
438 | 466 | "outputs": [],
|
439 | 467 | "source": [
|
440 |
| - "def num_tokens_from_messages(messages, model=\"gpt-3.5-turbo-0613\"):\n", |
| 468 | + "def num_tokens_from_messages(messages, model=\"gpt-4o-mini-2024-07-18\"):\n", |
441 | 469 | " \"\"\"Return the number of tokens used by a list of messages.\"\"\"\n",
|
442 | 470 | " try:\n",
|
443 | 471 | " encoding = tiktoken.encoding_for_model(model)\n",
|
444 | 472 | " except KeyError:\n",
|
445 |
| - " print(\"Warning: model not found. Using cl100k_base encoding.\")\n", |
| 473 | + " print(\"Warning: model not found. Using o200k_base encoding.\")\n", |
|
446 |
| - " encoding = tiktoken.get_encoding(\"cl100k_base\")\n", |
| 474 | + " encoding = tiktoken.get_encoding(\"o200k_base\")\n", |
|
447 | 475 | " if model in {\n",
|
448 |
| - " \"gpt-3.5-turbo-0613\",\n", |
449 |
| - " \"gpt-3.5-turbo-16k-0613\",\n", |
| 476 | + " \"gpt-3.5-turbo-0125\",\n", |
450 | 477 | " \"gpt-4-0314\",\n",
|
451 | 478 | " \"gpt-4-32k-0314\",\n",
|
452 | 479 | " \"gpt-4-0613\",\n",
|
453 | 480 | " \"gpt-4-32k-0613\",\n",
|
| 481 | + " \"gpt-4o-mini-2024-07-18\",\n", |
| 482 | + " \"gpt-4o-2024-08-06\"\n", |
454 | 483 | " }:\n",
|
455 | 484 | " tokens_per_message = 3\n",
|
456 | 485 | " tokens_per_name = 1\n",
|
457 |
| - " elif model == \"gpt-3.5-turbo-0301\":\n", |
458 |
| - " tokens_per_message = 4 # every message follows <|start|>{role/name}\\n{content}<|end|>\\n\n", |
459 |
| - " tokens_per_name = -1 # if there's a name, the role is omitted\n", |
460 | 486 | " elif \"gpt-3.5-turbo\" in model:\n",
|
461 |
| - " print(\"Warning: gpt-3.5-turbo may update over time. Returning num tokens assuming gpt-3.5-turbo-0613.\")\n", |
462 |
| - " return num_tokens_from_messages(messages, model=\"gpt-3.5-turbo-0613\")\n", |
| 487 | + " print(\"Warning: gpt-3.5-turbo may update over time. Returning num tokens assuming gpt-3.5-turbo-0125.\")\n", |
| 488 | + " return num_tokens_from_messages(messages, model=\"gpt-3.5-turbo-0125\")\n", |
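| | + " # match the most specific model names first: \"gpt-4o-mini\" contains \"gpt-4o\", which contains \"gpt-4\"\n", |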
463 |
| - " elif \"gpt-4\" in model:\n", |
464 |
| - " print(\"Warning: gpt-4 may update over time. Returning num tokens assuming gpt-4-0613.\")\n", |
465 |
| - " return num_tokens_from_messages(messages, model=\"gpt-4-0613\")\n", |
| 489 | + " elif \"gpt-4o-mini\" in model:\n", |
| 490 | + " print(\"Warning: gpt-4o-mini may update over time. Returning num tokens assuming gpt-4o-mini-2024-07-18.\")\n", |
| 491 | + " return num_tokens_from_messages(messages, model=\"gpt-4o-mini-2024-07-18\")\n", |
| 492 | + " elif \"gpt-4o\" in model:\n", |
| 493 | + " print(\"Warning: gpt-4o may update over time. Returning num tokens assuming gpt-4o-2024-08-06.\")\n", |
| 494 | + " return num_tokens_from_messages(messages, model=\"gpt-4o-2024-08-06\")\n", |
| 495 | + " elif \"gpt-4\" in model:\n", |
| 496 | + " print(\"Warning: gpt-4 may update over time. Returning num tokens assuming gpt-4-0613.\")\n", |
| 497 | + " return num_tokens_from_messages(messages, model=\"gpt-4-0613\")\n", |
466 | 498 | " else:\n",
|
467 | 499 | " raise NotImplementedError(\n",
|
468 | 500 | " f\"\"\"num_tokens_from_messages() is not implemented for model {model}.\"\"\"\n",
|
|
480 | 512 | },
|
481 | 513 | {
|
482 | 514 | "cell_type": "code",
|
483 |
| - "execution_count": 4, |
| 515 | + "execution_count": 15, |
484 | 516 | "metadata": {},
|
485 | 517 | "outputs": [
|
486 | 518 | {
|
487 | 519 | "name": "stdout",
|
488 | 520 | "output_type": "stream",
|
489 | 521 | "text": [
|
490 |
| - "gpt-3.5-turbo-0301\n", |
491 |
| - "127 prompt tokens counted by num_tokens_from_messages().\n", |
492 |
| - "127 prompt tokens counted by the OpenAI API.\n", |
493 |
| - "\n", |
494 |
| - "gpt-3.5-turbo-0613\n", |
| 522 | + "gpt-3.5-turbo\n", |
| 523 | + "Warning: gpt-3.5-turbo may update over time. Returning num tokens assuming gpt-3.5-turbo-0125.\n", |
495 | 524 | "129 prompt tokens counted by num_tokens_from_messages().\n",
|
496 | 525 | "129 prompt tokens counted by the OpenAI API.\n",
|
497 | 526 | "\n",
|
498 |
| - "gpt-3.5-turbo\n", |
499 |
| - "Warning: gpt-3.5-turbo may update over time. Returning num tokens assuming gpt-3.5-turbo-0613.\n", |
| 527 | + "gpt-4-0613\n", |
500 | 528 | "129 prompt tokens counted by num_tokens_from_messages().\n",
|
501 | 529 | "129 prompt tokens counted by the OpenAI API.\n",
|
502 | 530 | "\n",
|
503 |
| - "gpt-4-0314\n", |
| 531 | + "gpt-4\n", |
| 532 | + "Warning: gpt-4 may update over time. Returning num tokens assuming gpt-4-0613.\n", |
504 | 533 | "129 prompt tokens counted by num_tokens_from_messages().\n",
|
505 | 534 | "129 prompt tokens counted by the OpenAI API.\n",
|
506 | 535 | "\n",
|
507 |
| - "gpt-4-0613\n", |
| 536 | + "gpt-4o\n", |
| 537 | + "Warning: gpt-4o may update over time. Returning num tokens assuming gpt-4o-2024-08-06.\n", |
508 |
| - "129 prompt tokens counted by num_tokens_from_messages().\n", |
| 538 | + "124 prompt tokens counted by num_tokens_from_messages().\n", |
|
509 |
| - "129 prompt tokens counted by the OpenAI API.\n", |
| 539 | + "124 prompt tokens counted by the OpenAI API.\n", |
510 | 540 | "\n",
|
511 |
| - "gpt-4\n", |
| 541 | + "gpt-4o-mini\n", |
512 |
| - "Warning: gpt-4 may update over time. Returning num tokens assuming gpt-4-0613.\n", |
| 542 | + "Warning: gpt-4o-mini may update over time. Returning num tokens assuming gpt-4o-mini-2024-07-18.\n", |
|
513 |
| - "129 prompt tokens counted by num_tokens_from_messages().\n", |
| 543 | + "124 prompt tokens counted by num_tokens_from_messages().\n", |
|
514 |
| - "129 prompt tokens counted by the OpenAI API.\n", |
| 544 | + "124 prompt tokens counted by the OpenAI API.\n", |
515 | 545 | "\n"
|
516 | 546 | ]
|
517 | 547 | }
|
|
556 | 586 | "]\n",
|
557 | 587 | "\n",
|
558 | 588 | "for model in [\n",
|
559 |
| - " \"gpt-3.5-turbo-0301\",\n", |
560 |
| - " \"gpt-3.5-turbo-0613\",\n", |
561 | 589 | " \"gpt-3.5-turbo\",\n",
|
562 |
| - " \"gpt-4-0314\",\n", |
563 | 590 | " \"gpt-4-0613\",\n",
|
564 | 591 | " \"gpt-4\",\n",
|
| 592 | + " \"gpt-4o\",\n", |
| 593 | + " \"gpt-4o-mini\"\n", |
565 | 594 | " ]:\n",
|
566 | 595 | " print(model)\n",
|
567 | 596 | " # example token count from the function defined above\n",
|
|
574 | 603 | " print(f'{response.usage.prompt_tokens} prompt tokens counted by the OpenAI API.')\n",
|
575 | 604 | " print()\n"
|
576 | 605 | ]
|
577 |
| - }, |
578 |
| - { |
579 |
| - "cell_type": "code", |
580 |
| - "execution_count": null, |
581 |
| - "metadata": {}, |
582 |
| - "outputs": [], |
583 |
| - "source": [] |
584 | 606 | }
|
585 | 607 | ],
|
586 | 608 | "metadata": {
|
|
599 | 621 | "name": "python",
|
600 | 622 | "nbconvert_exporter": "python",
|
601 | 623 | "pygments_lexer": "ipython3",
|
602 |
| - "version": "3.11.5" |
| 624 | + "version": "3.12.1" |
603 | 625 | },
|
604 | 626 | "vscode": {
|
605 | 627 | "interpreter": {
|