Skip to content

Commit cea5643

Browse files
authored
Register OpenAI GPT-OSS and GPT-OSS-SAFEGUARD Presets to kerashub. (#2473)
* Test GPT_OSS files through porter * generate API and moved files to respective folders * Fix format issues * Add gpt_oss to preset loader and Fix format issues * Add gpt_oss to preset loader * generated files through 2.5-pro model * Format fix * Add converter, RoPE update * Fix format * Fix BPE tests * Update converter * Fix converter, checkpoints conversion and attention * Fix the parameter count and debug code * Add dequantization logic to converter * Add YaRN support, Fix serialisation, Fix dequantization * Fixed several pytest tests * Address gpt_oss_causal_lm tests * Fix format issues * Address review comments * set start token id to None to match the HF output * Fix test cases * Fix test * Fix error * Fix * Address all comments * Register GPT-OSS Presets * Fix format
1 parent b238c7d commit cea5643

File tree

2 files changed

+53
-1
lines changed

2 files changed

+53
-1
lines changed
Lines changed: 51 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1,51 @@
1-
backbone_presets = {}
1+
backbone_presets = {
2+
"gpt_oss_20b_en": {
3+
"metadata": {
4+
"description": (
5+
"This preset has 21 billion total parameters, "
6+
"with 3.6 billion active parameters, a 128k context "
7+
"length, and is de-quantized from MXFP4."
8+
),
9+
"params": 20_914_757_184,
10+
"path": "gpt_oss",
11+
},
12+
"kaggle_handle": "kaggle://keras/gpt-oss/keras/gpt_oss_20b_en/1",
13+
},
14+
"gpt_oss_120b_en": {
15+
"metadata": {
16+
"description": (
17+
"This preset has 117 billion total parameters, "
18+
"with 5.1 billion active parameters, a 128k context "
19+
"length, and is de-quantized from MXFP4."
20+
),
21+
"params": 116_829_156_672,
22+
"path": "gpt_oss",
23+
},
24+
"kaggle_handle": "kaggle://keras/gpt-oss/keras/gpt_oss_120b_en/1",
25+
},
26+
"gpt_oss_safeguard_20b_en": {
27+
"metadata": {
28+
"description": (
29+
"Open-weight safety reasoning model with 21 billion "
30+
"total parameters,with 3.6 billion active "
31+
"parameters, a context length of over 128k, "
32+
"and is de-quantized from MXFP4."
33+
),
34+
"params": 20_914_757_184,
35+
"path": "gpt_oss",
36+
},
37+
"kaggle_handle": "kaggle://keras/gpt-oss-safeguard/keras/gpt_oss_safeguard_20b_en/1",
38+
},
39+
"gpt_oss_safeguard_120b_en": {
40+
"metadata": {
41+
"description": (
42+
"Open-weight safety reasoning model with 117 billion "
43+
"total parameters,with 5.1 billion active parameters, "
44+
"a 128k context length, and is de-quantized from MXFP4."
45+
),
46+
"params": 116_829_156_672,
47+
"path": "gpt_oss",
48+
},
49+
"kaggle_handle": "kaggle://keras/gpt-oss-safeguard/keras/gpt_oss_safeguard_120b_en/1",
50+
},
51+
}

tools/checkpoint_conversion/convert_gpt_oss_checkpoints.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,8 @@
3030
# Maps each KerasHub preset name to the Hugging Face repository the
# checkpoint conversion script downloads source weights from.
PRESET_MAP = {
    "gpt_oss_20b_en": "openai/gpt-oss-20b",
    "gpt_oss_120b_en": "openai/gpt-oss-120b",
    "gpt_oss_safeguard_20b_en": "openai/gpt-oss-safeguard-20b",
    "gpt_oss_safeguard_120b_en": "openai/gpt-oss-safeguard-120b",
}
# Parsed command-line flags for the conversion script
# (`flags` is imported earlier in the file — presumably absl; not visible here).
FLAGS = flags.FLAGS

0 commit comments

Comments
 (0)