Skip to content

Commit 1be7999

Browse files
committed
Upload beit3 weights to hub, add pretrain weights
1 parent 3a3d98b commit 1be7999

File tree

1 file changed

+27
-8
lines changed

1 file changed

+27
-8
lines changed

timm/models/vision_transformer.py

Lines changed: 27 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -2463,23 +2463,43 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
2463 2463
'test_vit4.r160_in1k': _cfg(
2464 2464
input_size=(3, 160, 160), crop_pct=0.95),
2465 2465

2466-
# BEiT3 models (remapped to VisionTransformer with scale_norm=True)
2466+
# BEiT3 models (remapped to VisionTransformer with scale_attn_norm=True, scale_mlp_norm=True)
2467 2467
'beit3_base_patch16_224.in22k_ft_in1k': _cfg(
2468-
url='https://github.com/addf400/files/releases/download/beit3/beit3_base_patch16_224_in1k.pth',
2468+
hf_hub_id='timm/',
2469 2469
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2470-
'beit3_base_patch16_224.in22k_indomain_ft_in1k': _cfg(
2471-
url='https://github.com/addf400/files/releases/download/beit3/beit3_base_indomain_patch16_224_in1k.pth',
2470+
'beit3_base_patch16_224.indomain_in22k_ft_in1k': _cfg(
2471+
hf_hub_id='timm/',
2472 2472
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2473 2473
'beit3_large_patch16_224.in22k_ft_in1k': _cfg(
2474-
url='https://github.com/addf400/files/releases/download/beit3/beit3_large_patch16_224_in1k.pth',
2474+
hf_hub_id='timm/',
2475 2475
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2476-
'beit3_large_patch16_224.in22k_indomain_ft_in1k': _cfg(
2477-
url='https://github.com/addf400/files/releases/download/beit3/beit3_large_indomain_patch16_224_in1k.pth',
2476+
'beit3_large_patch16_224.indomain_in22k_ft_in1k': _cfg(
2477+
hf_hub_id='timm/',
2478 2478
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2479 2479
'beit3_giant_patch14_224.untrained': _cfg(
2480 2480
url='', mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2481 2481
'beit3_giant_patch14_336.untrained': _cfg(
2482 2482
url='', input_size=(3, 336, 336), mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0),
2483+
'beit3_base_patch16_224.pt': _cfg(
2484+
hf_hub_id='timm/',
2485+
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0,
2486+
num_classes=0,
2487+
),
2488+
'beit3_base_patch16_224.indomain_pt': _cfg(
2489+
hf_hub_id='timm/',
2490+
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0,
2491+
num_classes=0,
2492+
),
2493+
'beit3_large_patch16_224.pt': _cfg(
2494+
hf_hub_id='timm/',
2495+
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0,
2496+
num_classes=0,
2497+
),
2498+
'beit3_large_patch16_224.indomain_pt': _cfg(
2499+
hf_hub_id='timm/',
2500+
mean=IMAGENET_DEFAULT_MEAN, std=IMAGENET_DEFAULT_STD, crop_pct=1.0,
2501+
num_classes=0,
2502+
),
2483 2503
}
2484 2504

2485 2505
_quick_gelu_cfgs = [n for n, c in default_cfgs.items() if c.get('notes', ()) and 'quickgelu' in c['notes'][0]]
@@ -3728,7 +3748,6 @@ def vit_giantopt_patch16_siglip_gap_384(pretrained: bool = False, **kwargs) -> V
3728 3748
return model
3729 3749

3730 3750

3731-
3732 3751
@register_model
3733 3752
def vit_wee_patch16_reg1_gap_256(pretrained: bool = False, **kwargs) -> VisionTransformer:
3734 3753
model_args = dict(

0 commit comments

Comments
 (0)