@@ -2463,23 +2463,43 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
2463
2463
'test_vit4.r160_in1k' : _cfg (
2464
2464
input_size = (3 , 160 , 160 ), crop_pct = 0.95 ),
2465
2465
2466
- # BEiT3 models (remapped to VisionTransformer with scale_norm =True)
2466
+ # BEiT3 models (remapped to VisionTransformer with scale_attn_norm=True, scale_mlp_norm=True)
2467
2467
'beit3_base_patch16_224.in22k_ft_in1k' : _cfg (
2468
- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_base_patch16_224_in1k.pth ' ,
2468
+ hf_hub_id = 'timm/ ' ,
2469
2469
mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2470
- 'beit3_base_patch16_224.in22k_indomain_ft_in1k ' : _cfg (
2471
- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_base_indomain_patch16_224_in1k.pth ' ,
2470
+ 'beit3_base_patch16_224.indomain_in22k_ft_in1k ' : _cfg (
2471
+ hf_hub_id = 'timm/ ' ,
2472
2472
mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2473
2473
'beit3_large_patch16_224.in22k_ft_in1k' : _cfg (
2474
- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_large_patch16_224_in1k.pth ' ,
2474
+ hf_hub_id = 'timm/ ' ,
2475
2475
mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2476
- 'beit3_large_patch16_224.in22k_indomain_ft_in1k ' : _cfg (
2477
- url = 'https://github.com/addf400/files/releases/download/beit3/beit3_large_indomain_patch16_224_in1k.pth ' ,
2476
+ 'beit3_large_patch16_224.indomain_in22k_ft_in1k ' : _cfg (
2477
+ hf_hub_id = 'timm/ ' ,
2478
2478
mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2479
2479
'beit3_giant_patch14_224.untrained' : _cfg (
2480
2480
url = '' , mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2481
2481
'beit3_giant_patch14_336.untrained' : _cfg (
2482
2482
url = '' , input_size = (3 , 336 , 336 ), mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ),
2483
+ 'beit3_base_patch16_224.pt' : _cfg (
2484
+ hf_hub_id = 'timm/' ,
2485
+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2486
+ num_classes = 0 ,
2487
+ ),
2488
+ 'beit3_base_patch16_224.indomain_pt' : _cfg (
2489
+ hf_hub_id = 'timm/' ,
2490
+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2491
+ num_classes = 0 ,
2492
+ ),
2493
+ 'beit3_large_patch16_224.pt' : _cfg (
2494
+ hf_hub_id = 'timm/' ,
2495
+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2496
+ num_classes = 0 ,
2497
+ ),
2498
+ 'beit3_large_patch16_224.indomain_pt' : _cfg (
2499
+ hf_hub_id = 'timm/' ,
2500
+ mean = IMAGENET_DEFAULT_MEAN , std = IMAGENET_DEFAULT_STD , crop_pct = 1.0 ,
2501
+ num_classes = 0 ,
2502
+ ),
2483
2503
}
2484
2504
2485
2505
# Keys of `default_cfgs` whose entry has a non-empty 'notes' value and whose
# first note contains 'quickgelu'. The truthiness check on 'notes' runs first
# so that indexing [0] is never attempted on a missing or empty value.
_quick_gelu_cfgs = [
    cfg_name
    for cfg_name, cfg in default_cfgs.items()
    if cfg.get('notes', ()) and 'quickgelu' in cfg['notes'][0]
]
@@ -3728,7 +3748,6 @@ def vit_giantopt_patch16_siglip_gap_384(pretrained: bool = False, **kwargs) -> V
3728
3748
return model
3729
3749
3730
3750
3731
-
3732
3751
@register_model
3733
3752
def vit_wee_patch16_reg1_gap_256 (pretrained : bool = False , ** kwargs ) -> VisionTransformer :
3734
3753
model_args = dict (
0 commit comments