@@ -1964,6 +1964,9 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
19641964 hf_hub_id = 'timm/' ,
19651965 num_classes = 11821 ,
19661966 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
1967+ 'vit_mediumd_patch16_reg4_gap_256.sbb2_e200_in12k_ft_in1k' : _cfg (
1968+ hf_hub_id = 'timm/' ,
1969+ input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
19671970 'vit_mediumd_patch16_reg4_gap_256.sbb_in12k_ft_in1k' : _cfg (
19681971 hf_hub_id = 'timm/' ,
19691972 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
@@ -1975,9 +1978,15 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
19751978 hf_hub_id = 'timm/' ,
19761979 num_classes = 11821 ,
19771980 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
1981+ 'vit_mediumd_patch16_reg4_gap_384.sbb2_e200_in12k_ft_in1k' : _cfg (
1982+ hf_hub_id = 'timm/' ,
1983+ input_size = (3 , 384 , 384 ), crop_pct = 1.0 ),
19781984 'vit_betwixt_patch16_reg1_gap_256.sbb_in1k' : _cfg (
19791985 hf_hub_id = 'timm/' ,
19801986 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
1987+ 'vit_betwixt_patch16_reg4_gap_256.sbb2_e200_in12k_ft_in1k' : _cfg (
1988+ hf_hub_id = 'timm/' ,
1989+ input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
19811990 'vit_betwixt_patch16_reg4_gap_256.sbb_in12k_ft_in1k' : _cfg (
19821991 hf_hub_id = 'timm/' ,
19831992 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
@@ -1992,6 +2001,9 @@ def _cfg(url: str = '', **kwargs) -> Dict[str, Any]:
19922001 hf_hub_id = 'timm/' ,
19932002 num_classes = 11821 ,
19942003 input_size = (3 , 256 , 256 ), crop_pct = 0.95 ),
2004+ 'vit_betwixt_patch16_reg4_gap_384.sbb2_e200_in12k_ft_in1k' : _cfg (
2005+ hf_hub_id = 'timm/' ,
2006+ input_size = (3 , 384 , 384 ), crop_pct = 1.0 ),
19952007 'vit_base_patch16_reg4_gap_256.untrained' : _cfg (
19962008 input_size = (3 , 256 , 256 )),
19972009
@@ -3118,6 +3130,17 @@ def vit_mediumd_patch16_reg4_gap_256(pretrained: bool = False, **kwargs) -> Visi
31183130 return model
31193131
31203132
@register_model
def vit_mediumd_patch16_reg4_gap_384(pretrained: bool = False, **kwargs) -> VisionTransformer:
    """Build the `vit_mediumd_patch16_reg4_gap_384` Vision Transformer variant.

    The architecture defaults below (patch size 16, width 512, 20 blocks,
    8 heads, 4 register tokens, no class token, average pooling) are merged
    with ``kwargs`` and handed to ``_create_vision_transformer``.

    Args:
        pretrained: Forwarded unchanged to ``_create_vision_transformer``.
        **kwargs: Extra model arguments; any key that also appears in the
            defaults replaces the default value.

    Returns:
        The model object produced by ``_create_vision_transformer``.
    """
    arch_defaults = {
        'patch_size': 16,
        'embed_dim': 512,
        'depth': 20,
        'num_heads': 8,
        'init_values': 1e-5,
        'class_token': False,
        'no_embed_class': True,
        'reg_tokens': 4,
        'global_pool': 'avg',
    }
    # Later unpacking wins, so caller-supplied kwargs override the defaults.
    merged_args = {**arch_defaults, **kwargs}
    return _create_vision_transformer(
        'vit_mediumd_patch16_reg4_gap_384',
        pretrained=pretrained,
        **merged_args,
    )
3142+
3143+
31213144@register_model
31223145def vit_betwixt_patch16_reg1_gap_256 (pretrained : bool = False , ** kwargs ) -> VisionTransformer :
31233146 model_args = dict (
@@ -3140,6 +3163,17 @@ def vit_betwixt_patch16_reg4_gap_256(pretrained: bool = False, **kwargs) -> Visi
31403163 return model
31413164
31423165
@register_model
def vit_betwixt_patch16_reg4_gap_384(pretrained: bool = False, **kwargs) -> VisionTransformer:
    """Build the `vit_betwixt_patch16_reg4_gap_384` Vision Transformer variant.

    The architecture defaults below (patch size 16, width 640, 12 blocks,
    10 heads, 4 register tokens, no class token, average pooling) are merged
    with ``kwargs`` and handed to ``_create_vision_transformer``.

    Args:
        pretrained: Forwarded unchanged to ``_create_vision_transformer``.
        **kwargs: Extra model arguments; any key that also appears in the
            defaults replaces the default value.

    Returns:
        The model object produced by ``_create_vision_transformer``.
    """
    arch_defaults = {
        'patch_size': 16,
        'embed_dim': 640,
        'depth': 12,
        'num_heads': 10,
        'init_values': 1e-5,
        'class_token': False,
        'no_embed_class': True,
        'reg_tokens': 4,
        'global_pool': 'avg',
    }
    # Later unpacking wins, so caller-supplied kwargs override the defaults.
    merged_args = {**arch_defaults, **kwargs}
    return _create_vision_transformer(
        'vit_betwixt_patch16_reg4_gap_384',
        pretrained=pretrained,
        **merged_args,
    )
3175+
3176+
31433177@register_model
31443178def vit_base_patch16_reg4_gap_256 (pretrained : bool = False , ** kwargs ) -> VisionTransformer :
31453179 model_args = dict (
0 commit comments