Commit 94e13b7

Merge pull request #2529 from huggingface/rope_vit
Adding Naver rope-vit compatibility to EVA ViT

2 parents 8d41071 + cec7290, commit 94e13b7

16 files changed: +873, -167 lines changed

‎README.md

Lines changed: 1 addition & 0 deletions

@@ -508,6 +508,7 @@ All model architecture families include variants with pretrained weights. There
 * Res2Net - https://arxiv.org/abs/1904.01169
 * ResNeSt - https://arxiv.org/abs/2004.08955
 * ReXNet - https://arxiv.org/abs/2007.00992
+* ROPE-ViT - https://arxiv.org/abs/2403.13298
 * SelecSLS - https://arxiv.org/abs/1907.00837
 * Selective Kernel Networks - https://arxiv.org/abs/1903.06586
 * Sequencer2D - https://arxiv.org/abs/2205.01972

‎timm/layers/__init__.py

Lines changed: 86 additions & 16 deletions

@@ -1,16 +1,40 @@
+from ._fx import (
+    create_feature_extractor,
+    get_graph_node_names,
+    register_notrace_function,
+    register_notrace_module,
+    is_notrace_module,
+    is_notrace_function,
+    get_notrace_modules,
+    get_notrace_functions,
+)
 from .activations import *
-from .adaptive_avgmax_pool import \
-    adaptive_avgmax_pool2d, select_adaptive_pool2d, AdaptiveAvgMaxPool2d, SelectAdaptivePool2d
+from .adaptive_avgmax_pool import (
+    adaptive_avgmax_pool2d,
+    select_adaptive_pool2d,
+    AdaptiveAvgMaxPool2d,
+    SelectAdaptivePool2d,
+)
 from .attention import Attention, AttentionRope, maybe_add_mask
 from .attention2d import MultiQueryAttention2d, Attention2d, MultiQueryAttentionV2
 from .attention_pool import AttentionPoolLatent
 from .attention_pool2d import AttentionPool2d, RotAttentionPool2d, RotaryEmbedding
 from .blur_pool import BlurPool2d, create_aa
 from .classifier import create_classifier, ClassifierHead, NormMlpClassifierHead, ClNormMlpClassifierHead
 from .cond_conv2d import CondConv2d, get_condconv_initializer
-from .config import is_exportable, is_scriptable, is_no_jit, use_fused_attn, \
-    set_exportable, set_scriptable, set_no_jit, set_layer_config, set_fused_attn, \
-    set_reentrant_ckpt, use_reentrant_ckpt
+from .config import (
+    is_exportable,
+    is_scriptable,
+    is_no_jit,
+    use_fused_attn,
+    set_exportable,
+    set_scriptable,
+    set_no_jit,
+    set_layer_config,
+    set_fused_attn,
+    set_reentrant_ckpt,
+    use_reentrant_ckpt,
+)
 from .conv2d_same import Conv2dSame, conv2d_same
 from .conv_bn_act import ConvNormAct, ConvNormActAa, ConvBnAct
 from .create_act import create_act_layer, get_act_layer, get_act_fn
@@ -20,8 +44,17 @@
 from .create_norm_act import get_norm_act_layer, create_norm_act_layer, get_norm_act_layer
 from .drop import DropBlock2d, DropPath, drop_block_2d, drop_path
 from .eca import EcaModule, CecaModule, EfficientChannelAttn, CircularEfficientChannelAttn
-from .evo_norm import EvoNorm2dB0, EvoNorm2dB1, EvoNorm2dB2, \
-    EvoNorm2dS0, EvoNorm2dS0a, EvoNorm2dS1, EvoNorm2dS1a, EvoNorm2dS2, EvoNorm2dS2a
+from .evo_norm import (
+    EvoNorm2dB0,
+    EvoNorm2dB1,
+    EvoNorm2dB2,
+    EvoNorm2dS0,
+    EvoNorm2dS0a,
+    EvoNorm2dS1,
+    EvoNorm2dS1a,
+    EvoNorm2dS2,
+    EvoNorm2dS2a,
+)
 from .fast_norm import is_fast_norm, set_fast_norm, fast_group_norm, fast_layer_norm
 from .filter_response_norm import FilterResponseNormTlu2d, FilterResponseNormAct2d
 from .format import Format, get_channel_dim, get_spatial_dim, nchw_to, nhwc_to
@@ -37,19 +70,50 @@
 from .mlp import Mlp, GluMlp, GatedMlp, SwiGLU, SwiGLUPacked, ConvMlp, GlobalResponseNormMlp
 from .non_local_attn import NonLocalAttn, BatNonLocalAttn
 from .norm import GroupNorm, GroupNorm1, LayerNorm, LayerNorm2d, RmsNorm, RmsNorm2d, SimpleNorm, SimpleNorm2d
-from .norm_act import BatchNormAct2d, GroupNormAct, GroupNorm1Act, LayerNormAct, LayerNormAct2d, \
-    SyncBatchNormAct, convert_sync_batchnorm, FrozenBatchNormAct2d, freeze_batch_norm_2d, unfreeze_batch_norm_2d
+from .norm_act import (
+    BatchNormAct2d,
+    GroupNormAct,
+    GroupNorm1Act,
+    LayerNormAct,
+    LayerNormAct2d,
+    SyncBatchNormAct,
+    convert_sync_batchnorm,
+    FrozenBatchNormAct2d,
+    freeze_batch_norm_2d,
+    unfreeze_batch_norm_2d,
+)
 from .padding import get_padding, get_same_padding, pad_same
 from .patch_dropout import PatchDropout
 from .patch_embed import PatchEmbed, PatchEmbedWithSize, PatchEmbedInterpolator, resample_patch_embed
 from .pool1d import global_pool_nlc
 from .pool2d_same import AvgPool2dSame, create_pool2d
 from .pos_embed import resample_abs_pos_embed, resample_abs_pos_embed_nhwc
-from .pos_embed_rel import RelPosMlp, RelPosBias, RelPosBiasTf, gen_relative_position_index, gen_relative_log_coords, \
-    resize_rel_pos_bias_table, resize_rel_pos_bias_table_simple, resize_rel_pos_bias_table_levit
-from .pos_embed_sincos import pixel_freq_bands, freq_bands, build_sincos2d_pos_embed, build_fourier_pos_embed, \
-    build_rotary_pos_embed, apply_rot_embed, apply_rot_embed_cat, apply_rot_embed_list, apply_keep_indices_nlc, \
-    FourierEmbed, RotaryEmbedding, RotaryEmbeddingCat
+from .pos_embed_rel import (
+    RelPosMlp,
+    RelPosBias,
+    RelPosBiasTf,
+    gen_relative_position_index,
+    gen_relative_log_coords,
+    resize_rel_pos_bias_table,
+    resize_rel_pos_bias_table_simple,
+    resize_rel_pos_bias_table_levit,
+)
+from .pos_embed_sincos import (
+    pixel_freq_bands,
+    freq_bands,
+    build_sincos2d_pos_embed,
+    build_fourier_pos_embed,
+    build_rotary_pos_embed,
+    apply_rot_embed,
+    apply_rot_embed_cat,
+    apply_rot_embed_list,
+    apply_keep_indices_nlc,
+    FourierEmbed,
+    RotaryEmbedding,
+    RotaryEmbeddingCat,
+    RotaryEmbeddingMixed,
+    get_mixed_freqs,
+)
 from .squeeze_excite import SEModule, SqueezeExcite, EffectiveSEModule, EffectiveSqueezeExcite
 from .selective_kernel import SelectiveKernel
 from .separable_conv import SeparableConv2d, SeparableConvNormAct
@@ -60,5 +124,11 @@
 from .test_time_pool import TestTimePoolHead, apply_test_time_pool
 from .trace_utils import _assert, _float_to_int
 from .typing import LayerType, PadType
-from .weight_init import trunc_normal_, trunc_normal_tf_, variance_scaling_, lecun_normal_, \
-    init_weight_jax, init_weight_vit
+from .weight_init import (
+    trunc_normal_,
+    trunc_normal_tf_,
+    variance_scaling_,
+    lecun_normal_,
+    init_weight_jax,
+    init_weight_vit,
+)
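With the import block reorganized, the FX tracing helpers defined in the new timm/layers/_fx.py are re-exported from the package root, so they can be imported straight from timm.layers. A minimal sketch, using only names that appear in the diff above:

from timm.layers import (
    register_notrace_module,
    register_notrace_function,
    get_notrace_modules,
    get_notrace_functions,
)

# The registries are populated as timm.layers is imported (the decorators added
# elsewhere in this commit register CondConv2d, Conv2dSame, InplaceAbn, BatchNormAct2d, ...).
print(len(get_notrace_modules()), 'leaf modules registered')
print(len(get_notrace_functions()), 'autowrap functions registered')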

‎timm/layers/_fx.py

Lines changed: 81 additions & 0 deletions

@@ -0,0 +1,81 @@
+from typing import Callable, Dict, List, Optional, Union, Tuple, Type
+
+import torch
+from torch import nn
+
+try:
+    # NOTE we wrap torchvision fns to use timm leaf / no trace definitions
+    from torchvision.models.feature_extraction import create_feature_extractor as _create_feature_extractor
+    from torchvision.models.feature_extraction import get_graph_node_names as _get_graph_node_names
+    has_fx_feature_extraction = True
+except ImportError:
+    has_fx_feature_extraction = False
+
+
+__all__ = [
+    'register_notrace_module',
+    'is_notrace_module',
+    'get_notrace_modules',
+    'register_notrace_function',
+    'is_notrace_function',
+    'get_notrace_functions',
+    'create_feature_extractor',
+    'get_graph_node_names',
+]
+
+# modules to treat as leafs when tracing
+_leaf_modules = set()
+
+
+def register_notrace_module(module: Type[nn.Module]):
+    """
+    Any module not under timm.models.layers should get this decorator if we don't want to trace through it.
+    """
+    _leaf_modules.add(module)
+    return module
+
+
+def is_notrace_module(module: Type[nn.Module]):
+    return module in _leaf_modules
+
+
+def get_notrace_modules():
+    return list(_leaf_modules)
+
+
+# Functions we want to autowrap (treat them as leaves)
+_autowrap_functions = set()
+
+
+def register_notrace_function(name_or_fn):
+    _autowrap_functions.add(name_or_fn)
+    return name_or_fn
+
+
+def is_notrace_function(func: Callable):
+    return func in _autowrap_functions
+
+
+def get_notrace_functions():
+    return list(_autowrap_functions)
+
+
+def get_graph_node_names(model: nn.Module) -> Tuple[List[str], List[str]]:
+    return _get_graph_node_names(
+        model,
+        tracer_kwargs={
+            'leaf_modules': list(_leaf_modules),
+            'autowrap_functions': list(_autowrap_functions)
+        }
+    )
+
+
+def create_feature_extractor(model: nn.Module, return_nodes: Union[Dict[str, str], List[str]]):
+    assert has_fx_feature_extraction, 'Please update to PyTorch 1.10+, torchvision 0.11+ for FX feature extraction'
+    return _create_feature_extractor(
+        model, return_nodes,
+        tracer_kwargs={
+            'leaf_modules': list(_leaf_modules),
+            'autowrap_functions': list(_autowrap_functions)
+        }
+    )
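The file above only defines the registries and thin wrappers around torchvision's FX feature-extraction entry points; the leaf/autowrap sets are filled in by the decorators applied throughout timm/layers. A hedged usage sketch follows; MyCustomBlock and Net are hypothetical modules invented for illustration, not part of timm:

import torch
from torch import nn
from timm.layers import register_notrace_module, create_feature_extractor, get_graph_node_names


@register_notrace_module  # trace as a single leaf node instead of tracing through it
class MyCustomBlock(nn.Module):
    def forward(self, x):
        # data-dependent control flow that plain torch.fx symbolic tracing cannot handle
        return x.flip(-1) if x.shape[-1] % 2 == 0 else x


class Net(nn.Module):
    def __init__(self):
        super().__init__()
        self.stem = nn.Conv2d(3, 8, 3, padding=1)
        self.block = MyCustomBlock()

    def forward(self, x):
        return self.block(self.stem(x))


model = Net()
train_nodes, eval_nodes = get_graph_node_names(model)        # 'block' shows up as a single node
extractor = create_feature_extractor(model, return_nodes=['block'])
features = extractor(torch.randn(1, 3, 32, 32))              # dict: {'block': tensor}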

‎timm/layers/attention.py

Lines changed: 3 additions & 0 deletions

@@ -4,10 +4,13 @@
 from torch import nn as nn
 from torch.nn import functional as F
 
+from ._fx import register_notrace_function
 from .config import use_fused_attn
 from .pos_embed_sincos import apply_rot_embed_cat
 
 
+@torch.fx.wrap
+@register_notrace_function
 def maybe_add_mask(scores: torch.Tensor, attn_mask: Optional[torch.Tensor] = None):
     return scores if attn_mask is None else scores + attn_mask
 
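maybe_add_mask is a one-line helper, but wrapping it with torch.fx.wrap and register_notrace_function keeps the None-check out of traced graphs, so a single trace of an attention block works whether or not an attention mask is supplied. A small behavioural sketch (maybe_add_mask is exported from timm.layers per the __init__.py diff above):

import torch
from timm.layers import maybe_add_mask

scores = torch.randn(1, 4, 4)
mask = torch.zeros(4, 4).masked_fill(torch.eye(4, dtype=torch.bool), float('-inf'))

print(torch.equal(maybe_add_mask(scores, None), scores))  # True: no mask, scores pass through unchanged
print(maybe_add_mask(scores, mask)[0, 0, 0])              # -inf: mask added element-wise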

‎timm/layers/attention_pool2d.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@
1212
importtorch
1313
importtorch.nnasnn
1414

15-
from.configimportuse_fused_attn
15+
from .configimportuse_fused_attn
1616
from .helpersimportto_2tuple
1717
from .pos_embedimportresample_abs_pos_embed
1818
from .pos_embed_sincosimportapply_rot_embed,RotaryEmbedding

‎timm/layers/cond_conv2d.py

Lines changed: 2 additions & 0 deletions

@@ -12,6 +12,7 @@
 from torch import nn as nn
 from torch.nn import functional as F
 
+from ._fx import register_notrace_module
 from .helpers import to_2tuple
 from .conv2d_same import conv2d_same
 from .padding import get_padding_value
@@ -30,6 +31,7 @@ def condconv_initializer(weight):
     return condconv_initializer
 
 
+@register_notrace_module
 class CondConv2d(nn.Module):
     """ Conditionally Parameterized Convolution
     Inspired by: https://github.com/tensorflow/tpu/blob/master/models/official/efficientnet/condconv/condconv_layers.py

‎timm/layers/conv2d_same.py

Lines changed: 2 additions & 0 deletions

@@ -7,6 +7,7 @@
 import torch.nn.functional as F
 from typing import Tuple, Optional
 
+from ._fx import register_notrace_module
 from .config import is_exportable, is_scriptable
 from .padding import pad_same, pad_same_arg, get_padding_value
 
@@ -27,6 +28,7 @@ def conv2d_same(
     return F.conv2d(x, weight, bias, stride, (0, 0), dilation, groups)
 
 
+@register_notrace_module
 class Conv2dSame(nn.Conv2d):
     """ Tensorflow like 'SAME' convolution wrapper for 2D convolutions
     """

‎timm/layers/inplace_abn.py

Lines changed: 3 additions & 0 deletions

@@ -15,7 +15,10 @@ def inplace_abn(x, weight, bias, running_mean, running_var,
 def inplace_abn_sync(**kwargs):
     inplace_abn(**kwargs)
 
+from ._fx import register_notrace_module
 
+
+@register_notrace_module
 class InplaceAbn(nn.Module):
     """Activated Batch Normalization

‎timm/layers/non_local_attn.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@
88
fromtorchimportnn
99
fromtorch.nnimportfunctionalasF
1010

11+
from ._fximportregister_notrace_module
1112
from .conv_bn_actimportConvNormAct
1213
from .helpersimportmake_divisible
1314
from .trace_utilsimport_assert
@@ -69,6 +70,7 @@ def reset_parameters(self):
6970
nn.init.constant_(m.bias,0)
7071

7172

73+
@register_notrace_module
7274
classBilinearAttnTransform(nn.Module):
7375

7476
def__init__(self,in_channels,block_size,groups,act_layer=nn.ReLU,norm_layer=nn.BatchNorm2d):

‎timm/layers/norm_act.py

Lines changed: 4 additions & 0 deletions

@@ -19,6 +19,7 @@
 from torch.nn import functional as F
 from torchvision.ops.misc import FrozenBatchNorm2d
 
+from ._fx import register_notrace_module
 from .create_act import create_act_layer
 from .fast_norm import is_fast_norm, fast_group_norm, fast_layer_norm, fast_rms_norm, rms_norm2d, fast_rms_norm2d
 from .norm import RmsNorm, RmsNorm2d
@@ -39,6 +40,7 @@ def _create_act(act_layer, act_kwargs=None, inplace=False, apply_act=True):
     return nn.Identity() if act is None else act
 
 
+@register_notrace_module
 class BatchNormAct2d(nn.BatchNorm2d):
     """BatchNorm + Activation
 
@@ -134,6 +136,7 @@ def forward(self, x):
         return x
 
 
+@register_notrace_module
 class SyncBatchNormAct(nn.SyncBatchNorm):
     # Thanks to Selim Seferbekov (https://github.com/rwightman/pytorch-image-models/issues/1254)
     # This is a quick workaround to support SyncBatchNorm for timm BatchNormAct2d layers
@@ -191,6 +194,7 @@ def convert_sync_batchnorm(module, process_group=None):
     return module_output
 
 
+@register_notrace_module
 class FrozenBatchNormAct2d(torch.nn.Module):
     """
     BatchNormAct2d where the batch statistics and the affine parameters are fixed
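Registering the fused norm+act classes as leaf modules means FX-based feature extraction sees each BatchNormAct2d (and its Sync/Frozen variants) as a single call_module node rather than tracing through the normalization and activation internals. A hedged end-to-end sketch; the model name and the choice of return node are illustrative assumptions, not taken from this diff:

import torch
import timm
from timm.layers import get_graph_node_names, create_feature_extractor

# 'efficientnet_b0' is assumed here as a model built with BatchNormAct2d layers
model = timm.create_model('efficientnet_b0', pretrained=False)
train_nodes, eval_nodes = get_graph_node_names(model)
extractor = create_feature_extractor(model, return_nodes=[eval_nodes[-2]])  # a node near the head, chosen arbitrarily
out = extractor(torch.randn(1, 3, 224, 224))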

