Skip to content
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
17 commits
Select commit Hold shift + click to select a range
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions fast_llm/models/gpt/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@
AutoGPTHuggingfaceCheckpointFormat,
DiffusionDreamCheckpointFormat,
DiffusionLlamaCheckpointFormat,
GptOssCheckpointFormat,
LlamaCheckpointFormat,
MistralCheckpointFormat,
MixtralCheckpointFormat,
Expand Down Expand Up @@ -117,6 +118,7 @@ class GPTModelConfig(FastLLMModelConfig):
DiffusionDreamCheckpointFormat,
DiffusionLlamaCheckpointFormat,
AprielHybridSSMCheckpointFormat,
GptOssCheckpointFormat,
)

@classmethod
Expand Down
3 changes: 3 additions & 0 deletions fast_llm/models/gpt/conversion/auto.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@
AprielHybridSSMCheckpointFormat,
DiffusionDreamCheckpointFormat,
DiffusionLlamaCheckpointFormat,
GptOssCheckpointFormat,
LlamaCheckpointFormat,
MistralCheckpointFormat,
MixtralCheckpointFormat,
Expand All @@ -15,6 +16,7 @@
)
from fast_llm.models.gpt.conversion.diffusion_dream import DiffusionDreamHuggingfaceCheckpointHandler
from fast_llm.models.gpt.conversion.diffusion_llama import DiffusionLlamaHuggingfaceCheckpointHandler
from fast_llm.models.gpt.conversion.gpt_oss import GptOssHuggingfaceCheckpointHandler
from fast_llm.models.gpt.conversion.llama import LlamaHuggingfaceCheckpointHandler
from fast_llm.models.gpt.conversion.mistral import MistralHuggingfaceCheckpointHandler
from fast_llm.models.gpt.conversion.mixtral import MixtralHuggingfaceCheckpointHandler
Expand All @@ -35,4 +37,5 @@ class AutoGPTHuggingfaceCheckpointHandler(
DiffusionDreamCheckpointFormat.name: DiffusionDreamHuggingfaceCheckpointHandler,
DiffusionLlamaCheckpointFormat.name: DiffusionLlamaHuggingfaceCheckpointHandler,
AprielHybridSSMCheckpointFormat.name: AprielHuggingfaceCheckpointHandler,
GptOssCheckpointFormat.name: GptOssHuggingfaceCheckpointHandler,
}
4 changes: 4 additions & 0 deletions fast_llm/models/gpt/conversion/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,3 +47,7 @@ class DiffusionLlamaCheckpointFormat(GPTHuggingfaceCheckpointFormat):

class AprielHybridSSMCheckpointFormat(GPTHuggingfaceCheckpointFormat):
    """Checkpoint format tag for Apriel hybrid SSM Hugging Face checkpoints."""

    # String identifier for this format; used as the lookup key when a
    # checkpoint handler is selected by format name.
    name: typing.ClassVar[str] = "apriel_hybrid_ssm"


class GptOssCheckpointFormat(GPTHuggingfaceCheckpointFormat):
    """Checkpoint format tag for GPT-OSS Hugging Face checkpoints."""

    # String identifier for this format; used as the lookup key when a
    # checkpoint handler is selected by format name.
    name: typing.ClassVar[str] = "gpt_oss"
Loading