Skip to content

Commit 106def4

Browse files
committed
Fix llama4 (#5105)
1 parent 05bba0a commit 106def4

File tree

2 files changed

+10
-1
lines changed

2 files changed

+10
-1
lines changed

swift/llm/model/model/llama.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -232,7 +232,7 @@ def get_model_tokenizer_llama4(*args, **kwargs):
232232
get_model_tokenizer_llama4,
233233
requires=['transformers>=4.51'],
234234
architectures=['Llama4ForConditionalGeneration'],
235-
model_arch=ModelArch.llama3_2_vision,
235+
model_arch=ModelArch.llama4,
236236
tags=['vision'],
237237
))
238238

swift/llm/model/model_arch.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -39,6 +39,7 @@ class MLLMModelArch:
3939

4040
llama3_1_omni = 'llama3_1_omni'
4141
llama3_2_vision = 'llama3_2_vision'
42+
llama4 = 'llama4'
4243

4344
llava_hf = 'llava_hf'
4445
llava_hf_legacy = 'llava_hf_legacy' # transformers<4.52
@@ -573,6 +574,14 @@ def register_model_arch(model_arch: ModelKeys, *, exist_ok: bool = False) -> Non
573574
vision_tower='vision_model',
574575
))
575576

577+
register_model_arch(
578+
MultiModelKeys(
579+
MLLMModelArch.llama4,
580+
language_model='language_model',
581+
aligner='multi_modal_projector',
582+
vision_tower='vision_model',
583+
))
584+
576585
register_model_arch(MultiModelKeys(
577586
MLLMModelArch.ovis1_6,
578587
language_model='llm',

0 commit comments

Comments
 (0)