@@ -4562,7 +4562,7 @@ def _ccached_diffusers_tiny_torch_full_checker_unet():
45624562 }
45634563
45644564
4565- def _ccached_riny_random_gemma_3 ():
4565+ def _ccached_tiny_random_gemma_3 ():
45664566 "tiny-random/gemma-3"
45674567 return transformers .Gemma3Config (
45684568 ** {
@@ -4618,3 +4618,72 @@ def _ccached_riny_random_gemma_3():
46184618 },
46194619 }
46204620 )
4621+
4622+
def _ccached_zai_glm_45():
    "zai-org/GLM-4.5V"
    # Returns a ``transformers.Glm4vMoeConfig`` built from the hard-coded
    # values below; nothing is read from disk or network by this function.
    #
    # NOTE(review): the one-line docstring above is deliberately left exactly
    # as it was. It is reachable at runtime through ``__doc__`` and presumably
    # serves as the model identifier for this cached configuration -- confirm
    # against the code that collects the ``_ccached_*`` functions before
    # rewording it.
    #
    # Booleans are spelled with the Python built-ins ``True`` / ``False``
    # rather than the JSON literals ``true`` / ``false`` so that the function
    # does not depend on module-level aliases being defined.
    return transformers.Glm4vMoeConfig(
        **{
            "architectures": ["Glm4vMoeForConditionalGeneration"],
            "model_type": "glm4v_moe",
            # Settings nested under "text_config".
            "text_config": {
                "pad_token_id": 151329,
                "vocab_size": 151552,
                "eos_token_id": [151329, 151336, 151338],
                "image_end_token_id": 151340,
                "image_start_token_id": 151339,
                "image_token_id": 151363,
                "head_dim": 128,
                "attention_bias": True,
                "attention_dropout": 0.0,
                "first_k_dense_replace": 1,
                "hidden_act": "silu",
                "hidden_size": 4096,
                "initializer_range": 0.02,
                "intermediate_size": 10944,
                "max_position_embeddings": 65536,
                "model_type": "glm4v_moe_text",
                "moe_intermediate_size": 1408,
                "n_group": 1,
                "n_routed_experts": 128,
                "n_shared_experts": 1,
                "norm_topk_prob": True,
                "num_attention_heads": 96,
                "num_experts_per_tok": 8,
                "num_hidden_layers": 46,
                "num_key_value_heads": 8,
                "partial_rotary_factor": 0.5,
                "rms_norm_eps": 1e-05,
                "torch_dtype": "bfloat16",
                "rope_scaling": {"rope_type": "default", "mrope_section": [8, 12, 12]},
                "rope_theta": 10000.0,
                "routed_scaling_factor": 1.0,
                "topk_group": 1,
                "use_cache": True,
                "use_qk_norm": False,
            },
            "torch_dtype": "bfloat16",
            "transformers_version": "4.55.0.dev0",
            "video_end_token_id": 151342,
            "video_start_token_id": 151341,
            "video_token_id": 151364,
            # Settings nested under "vision_config".
            "vision_config": {
                "attention_bias": False,
                "attention_dropout": 0.0,
                "depth": 24,
                "hidden_act": "silu",
                "hidden_size": 1536,
                "image_size": 336,
                "in_channels": 3,
                "initializer_range": 0.02,
                "intermediate_size": 10944,
                "model_type": "glm4v_moe",
                "num_heads": 12,
                "out_hidden_size": 4096,
                "patch_size": 14,
                "rms_norm_eps": 1e-05,
                "spatial_merge_size": 2,
                "temporal_patch_size": 2,
            },
        }
    )
0 commit comments