@@ -2463,23 +2463,43 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
24632463 'test_vit4.r160_in1k' : _cfg (
24642464 input_size = (3 , 160 , 160 ), crop_pct = 0.95 ),
24652465
2466- # BEiT3 models (remapped to VisionTransformer with scale_norm =True)
2466+ # BEiT3 models (remapped to VisionTransformer with scale_attn_norm=True, scale_mlp_norm =True)
24672467 'beit3_base_patch16_224.in22k_ft_in1k' : _cfg (
2468- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_base_patch16_224_in1k.pth ' ,
2468+ hf_hub_id = 'timm/ ' ,
24692469 mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2470- 'beit3_base_patch16_224.in22k_indomain_ft_in1k ' : _cfg (
2471- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_base_indomain_patch16_224_in1k.pth ' ,
2470+ 'beit3_base_patch16_224.indomain_in22k_ft_in1k ' : _cfg (
2471+ hf_hub_id = 'timm/ ' ,
24722472 mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
24732473 'beit3_large_patch16_224.in22k_ft_in1k' : _cfg (
2474- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_large_patch16_224_in1k.pth ' ,
2474+ hf_hub_id = 'timm/ ' ,
24752475 mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2476- 'beit3_large_patch16_224.in22k_indomain_ft_in1k ' : _cfg (
2477- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_large_indomain_patch16_224_in1k.pth ' ,
2476+ 'beit3_large_patch16_224.indomain_in22k_ft_in1k ' : _cfg (
2477+ hf_hub_id = 'timm/ ' ,
24782478 mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
24792479 'beit3_giant_patch14_224.untrained' : _cfg (
24802480 url = '' , mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
24812481 'beit3_giant_patch14_336.untrained' : _cfg (
24822482 url = '' , input_size = (3 , 336 , 336 ), mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2483+ 'beit3_base_patch16_224.pt' : _cfg (
2484+ hf_hub_id = 'timm/' ,
2485+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2486+ num_classes = 0 ,
2487+ ),
2488+ 'beit3_base_patch16_224.indomain_pt' : _cfg (
2489+ hf_hub_id = 'timm/' ,
2490+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2491+ num_classes = 0 ,
2492+ ),
2493+ 'beit3_large_patch16_224.pt' : _cfg (
2494+ hf_hub_id = 'timm/' ,
2495+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2496+ num_classes = 0 ,
2497+ ),
2498+ 'beit3_large_patch16_224.indomain_pt' : _cfg (
2499+ hf_hub_id = 'timm/' ,
2500+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2501+ num_classes = 0 ,
2502+ ),
24832503}
24842504
24852505_quick_gelu_cfgs = [n for n , c in default_cfgs .items () if c .get ('notes' , ()) and 'quickgelu' in c ['notes' ][0 ]]
@@ -3728,7 +3748,6 @@ def vit_giantopt_patch16_siglip_gap_384(pretrained: bool = False, **kwargs) -> V
37283748 return model
37293749
37303750
3731-
37323751@register_model
37333752def vit_wee_patch16_reg1_gap_256 (pretrained : bool = False , ** kwargs ) -> VisionTransformer :
37343753 model_args = dict (
0 commit comments