@@ -4572,6 +4572,22 @@ export class Qwen2Model extends Qwen2PreTrainedModel { }
45724572export class Qwen2ForCausalLM extends Qwen2PreTrainedModel { }
45734573//////////////////////////////////////////////////
45744574
4575+
4576+ //////////////////////////////////////////////////
4577+ // Qwen3 models
4578+
4579+ /**
4580+ * Common base class for the Qwen3 model classes in this section (Qwen3Model and Qwen3ForCausalLM both extend it). It declares no members of its own; everything is inherited from PreTrainedModel.
4581+ */
4582+ export class Qwen3PreTrainedModel extends PreTrainedModel { }
4583+ /**
4584+ * The bare Qwen3 Model outputting raw hidden-states without any specific head on top. The class body is empty: all members come from Qwen3PreTrainedModel.
4585+ */
4586+ export class Qwen3Model extends Qwen3PreTrainedModel { }
4587+ /** Qwen3 class registered under the 'qwen3' key of MODEL_FOR_CAUSAL_LM_MAPPING_NAMES. The class body is empty: all members come from Qwen3PreTrainedModel. */
4588+ export class Qwen3ForCausalLM extends Qwen3PreTrainedModel { }
4589+ //////////////////////////////////////////////////
4590+
45754591export class Qwen2VLPreTrainedModel extends PreTrainedModel {
45764592 forward_params = [
45774593 // Text inputs
@@ -7621,6 +7637,7 @@ const MODEL_MAPPING_NAMES_DECODER_ONLY = new Map([
76217637 [ 'glm' , [ 'GlmModel' , GlmModel ] ] ,
76227638 [ 'openelm' , [ 'OpenELMModel' , OpenELMModel ] ] ,
76237639 [ 'qwen2' , [ 'Qwen2Model' , Qwen2Model ] ] ,
7640+ [ 'qwen3' , [ 'Qwen3Model' , Qwen3Model ] ] ,
76247641 [ 'phi' , [ 'PhiModel' , PhiModel ] ] ,
76257642 [ 'phi3' , [ 'Phi3Model' , Phi3Model ] ] ,
76267643 [ 'mpt' , [ 'MptModel' , MptModel ] ] ,
@@ -7721,6 +7738,7 @@ const MODEL_FOR_CAUSAL_LM_MAPPING_NAMES = new Map([
77217738 [ 'glm' , [ 'GlmForCausalLM' , GlmForCausalLM ] ] ,
77227739 [ 'openelm' , [ 'OpenELMForCausalLM' , OpenELMForCausalLM ] ] ,
77237740 [ 'qwen2' , [ 'Qwen2ForCausalLM' , Qwen2ForCausalLM ] ] ,
7741+ [ 'qwen3' , [ 'Qwen3ForCausalLM' , Qwen3ForCausalLM ] ] ,
77247742 [ 'phi' , [ 'PhiForCausalLM' , PhiForCausalLM ] ] ,
77257743 [ 'phi3' , [ 'Phi3ForCausalLM' , Phi3ForCausalLM ] ] ,
77267744 [ 'mpt' , [ 'MptForCausalLM' , MptForCausalLM ] ] ,
0 commit comments