Skip to content

Commit 9170221

Browse files
authored
Support o3/o4 models (#110)
1 parent af52be1 commit 9170221

File tree

7 files changed

+16
-5
lines changed

7 files changed

+16
-5
lines changed

tiktoken-rs/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -105,7 +105,7 @@ println!("max_tokens: {}", max_tokens);
105105

106106
| Encoding name | OpenAI models |
107107
| ----------------------- | ------------------------------------------------------------------------- |
108-
| `o200k_base` | GPT-4o models, o1 models |
108+
| `o200k_base` | GPT-4o models, GPT-4.1, o1, o3, and o4 models |
109109
| `cl100k_base` | ChatGPT models, `text-embedding-ada-002` |
110110
| `p50k_base` | Code models, `text-davinci-002`, `text-davinci-003` |
111111
| `p50k_edit` | Use for edit models like `text-davinci-edit-001`, `code-davinci-edit-001` |

tiktoken-rs/src/model.rs

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -36,8 +36,11 @@ pub fn get_context_size(model: &str) -> usize {
3636
let base = rest.split(':').next().unwrap_or(rest);
3737
return get_context_size(base);
3838
}
39-
if starts_with_any!(model, "o1-") {
40-
return 128_000;
39+
if starts_with_any!(model, "o1", "o3", "o4") {
40+
return 200_000;
41+
}
42+
if starts_with_any!(model, "gpt-4.1") {
43+
return 1_047_576;
4144
}
4245
if starts_with_any!(model, "gpt-4o") {
4346
return 128_000;

tiktoken-rs/src/singleton.rs

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -49,7 +49,7 @@ pub fn cl100k_base_singleton() -> &'static CoreBPE {
4949
}
5050

5151
/// Returns a singleton instance of the o200k_base tokenizer.
52-
/// Use for GPT-4o models.
52+
/// Use for GPT-4o models and other `o` series models like `o1`, `o3`, and `o4`.
5353
///
5454
/// This function will only initialize the tokenizer once, and then return a reference to the tokenizer
5555
pub fn o200k_base_singleton() -> &'static CoreBPE {

tiktoken-rs/src/tiktoken_ext/openai_public.rs

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -118,7 +118,7 @@ pub fn cl100k_base() -> Result<CoreBPE> {
118118
Ok(bpe)
119119
}
120120

121-
/// Use for GPT-4o models.
121+
/// Use for GPT-4o models and other `o` series models like `o1`, `o3`, and `o4`.
122122
/// Initializes and returns a new instance of the o200k_base tokenizer.
123123
pub fn o200k_base() -> Result<CoreBPE> {
124124
let o200k_base = include_str!("../../assets/o200k_base.tiktoken");

tiktoken-rs/src/tokenizer.rs

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,7 @@ const MODEL_TO_TOKENIZER: &[(&str, Tokenizer)] = &[
5555
// reasoning
5656
("o1", Tokenizer::O200kBase),
5757
("o3", Tokenizer::O200kBase),
58+
("o4", Tokenizer::O200kBase),
5859
// chat
5960
("gpt-4.1", Tokenizer::O200kBase),
6061
("chatgpt-4o-latest", Tokenizer::O200kBase),

tiktoken-rs/src/vendor_tiktoken.rs

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -164,6 +164,7 @@ impl std::fmt::Display for DecodeKeyError {
164164
impl std::error::Error for DecodeKeyError {}
165165

166166
#[derive(Debug, Clone)]
167+
#[allow(dead_code)]
167168
pub struct DecodeError {
168169
pub message: String,
169170
}

tiktoken-rs/tests/model.rs

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,3 +11,9 @@ fn test_finetuned_context_size() {
1111
get_context_size("gpt-4o")
1212
);
1313
}
14+
15+
#[test]
16+
fn test_o_series_context_size() {
17+
assert_eq!(get_context_size("o3-small"), 200_000);
18+
assert_eq!(get_context_size("o4"), 200_000);
19+
}

0 commit comments

Comments
 (0)