diff --git a/config.py b/config.py index 60971e420..0b4028afe 100644 --- a/config.py +++ b/config.py @@ -182,8 +182,14 @@ def create_parser(): help='Weight decay (default=1e-6)') group.add_argument('--use_nesterov', type=str2bool, nargs='?', const=True, default=False, help='Enables the Nesterov momentum (default=False)') - group.add_argument('--filter_bias_and_bn', type=str2bool, nargs='?', const=True, default=True, - help='Filter Bias and BatchNorm (default=True)') + group.add_argument('--weight_decay_filter', type=str, default="disable", + choices=['disable', 'auto', 'norm_and_bias'], + help='filter parameters from weight_decay. ' + 'choice: "disable" - No parameters to filter from weight_decay; "auto" - In this case, ' + 'we do not apply weight decay filtering to any parameters. However, MindSpore currently ' + 'automatically filters norm parameters from weight decay. It is unclear whether there ' + 'will be any changes in future versions of MindSpore, so it is recommended to stay updated;' + '"norm_and_bias" - Filter the paramtersof Norm layer and Bias from weight decay') group.add_argument('--eps', type=float, default=1e-10, help='Term Added to the Denominator to Improve Numerical Stability (default=1e-10)') diff --git a/configs/bit/bit_resnet101_ascend.yaml b/configs/bit/bit_resnet101_ascend.yaml index 314113366..a0911c818 100644 --- a/configs/bit/bit_resnet101_ascend.yaml +++ b/configs/bit/bit_resnet101_ascend.yaml @@ -41,7 +41,7 @@ multi_step_decay_milestones: [30, 40, 50, 60, 70, 80, 85] # optimizer opt: 'sgd' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/bit/bit_resnet50_ascend.yaml b/configs/bit/bit_resnet50_ascend.yaml index 148c08e55..956ef6b45 100644 --- a/configs/bit/bit_resnet50_ascend.yaml +++ b/configs/bit/bit_resnet50_ascend.yaml @@ -40,7 +40,7 @@ multi_step_decay_milestones: [30, 40, 50, 60, 70, 80, 85] # optimizer opt: 'sgd' -filter_bias_and_bn: False 
+weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/bit/bit_resnet50x3_ascend.yaml b/configs/bit/bit_resnet50x3_ascend.yaml index baf959281..22c96aebb 100644 --- a/configs/bit/bit_resnet50x3_ascend.yaml +++ b/configs/bit/bit_resnet50x3_ascend.yaml @@ -43,7 +43,7 @@ multi_step_decay_milestones: [30, 40, 50, 60, 70, 80, 85] # optimizer opt: 'sgd' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/cmt/cmt_small_ascend.yaml b/configs/cmt/cmt_small_ascend.yaml index 94d6965d2..16bb34b05 100644 --- a/configs/cmt/cmt_small_ascend.yaml +++ b/configs/cmt/cmt_small_ascend.yaml @@ -52,7 +52,6 @@ warmup_epochs: 5 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: 'dynamic' diff --git a/configs/coat/coat_lite_mini_ascend.yaml b/configs/coat/coat_lite_mini_ascend.yaml index d3eda21e2..3849d8a64 100644 --- a/configs/coat/coat_lite_mini_ascend.yaml +++ b/configs/coat/coat_lite_mini_ascend.yaml @@ -54,6 +54,5 @@ cycle_decay: 1.0 # optimizer opt: 'adamw' weight_decay: 0.025 -filter_bias_and_bn: True loss_scale: 1024 use_nesterov: False diff --git a/configs/coat/coat_lite_tiny_ascend.yaml b/configs/coat/coat_lite_tiny_ascend.yaml index 0ea55dbc4..8d4252677 100644 --- a/configs/coat/coat_lite_tiny_ascend.yaml +++ b/configs/coat/coat_lite_tiny_ascend.yaml @@ -54,6 +54,5 @@ cycle_decay: 1.0 # optimizer opt: 'adamw' weight_decay: 0.025 -filter_bias_and_bn: True loss_scale: 1024 use_nesterov: False diff --git a/configs/coat/coat_mini_ascend.yaml b/configs/coat/coat_mini_ascend.yaml index e209778ba..c3db85de7 100644 --- a/configs/coat/coat_mini_ascend.yaml +++ b/configs/coat/coat_mini_ascend.yaml @@ -55,7 +55,6 @@ epoch_size: 300 # optimizer opt: 'lion' weight_decay: 0.15 -filter_bias_and_bn: True loss_scale: 4096 use_nesterov: False loss_scale_type: dynamic diff --git a/configs/coat/coat_tiny_ascend.yaml 
b/configs/coat/coat_tiny_ascend.yaml index 927eaa0dd..6a2711c95 100644 --- a/configs/coat/coat_tiny_ascend.yaml +++ b/configs/coat/coat_tiny_ascend.yaml @@ -57,7 +57,6 @@ epoch_size: 300 # optimizer opt: 'lion' weight_decay: 0.15 -filter_bias_and_bn: True loss_scale: 4096 use_nesterov: False loss_scale_type: dynamic diff --git a/configs/convit/convit_base_ascend.yaml b/configs/convit/convit_base_ascend.yaml index 818903210..996c8b8a3 100644 --- a/configs/convit/convit_base_ascend.yaml +++ b/configs/convit/convit_base_ascend.yaml @@ -51,5 +51,4 @@ decay_epochs: 260 opt: 'adamw' weight_decay: 0.1 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_base_plus_ascend.yaml b/configs/convit/convit_base_plus_ascend.yaml index 58f8a38b5..4130852a5 100644 --- a/configs/convit/convit_base_plus_ascend.yaml +++ b/configs/convit/convit_base_plus_ascend.yaml @@ -51,5 +51,4 @@ decay_epochs: 260 opt: 'adamw' weight_decay: 0.1 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_small_ascend.yaml b/configs/convit/convit_small_ascend.yaml index f644f4a78..e940dcae8 100644 --- a/configs/convit/convit_small_ascend.yaml +++ b/configs/convit/convit_small_ascend.yaml @@ -51,5 +51,4 @@ decay_epochs: 260 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_small_plus_ascend.yaml b/configs/convit/convit_small_plus_ascend.yaml index 2725711cd..4a935dd63 100644 --- a/configs/convit/convit_small_plus_ascend.yaml +++ b/configs/convit/convit_small_plus_ascend.yaml @@ -51,5 +51,4 @@ decay_epochs: 260 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_tiny_ascend.yaml b/configs/convit/convit_tiny_ascend.yaml index 4777777e9..9fe422ddc 100644 --- a/configs/convit/convit_tiny_ascend.yaml +++ b/configs/convit/convit_tiny_ascend.yaml @@ -50,5 +50,4 @@ 
decay_epochs: 295 opt: 'adamw' weight_decay: 0.0001 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_tiny_gpu.yaml b/configs/convit/convit_tiny_gpu.yaml index 8393f32a9..8e2690adb 100644 --- a/configs/convit/convit_tiny_gpu.yaml +++ b/configs/convit/convit_tiny_gpu.yaml @@ -47,5 +47,4 @@ decay_epochs: 200 # optimizer opt: 'adamw' weight_decay: 0.025 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convit/convit_tiny_plus_ascend.yaml b/configs/convit/convit_tiny_plus_ascend.yaml index d21330d3d..ef2295d20 100644 --- a/configs/convit/convit_tiny_plus_ascend.yaml +++ b/configs/convit/convit_tiny_plus_ascend.yaml @@ -50,5 +50,4 @@ decay_epochs: 260 opt: 'adamw' weight_decay: 0.0001 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/convnext/convnext_base_ascend.yaml b/configs/convnext/convnext_base_ascend.yaml index b643ea174..1f083f08d 100644 --- a/configs/convnext/convnext_base_ascend.yaml +++ b/configs/convnext/convnext_base_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 20 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: 'auto' diff --git a/configs/convnext/convnext_small_ascend.yaml b/configs/convnext/convnext_small_ascend.yaml index fb5abc131..5972bb0d7 100644 --- a/configs/convnext/convnext_small_ascend.yaml +++ b/configs/convnext/convnext_small_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 20 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: 'auto' diff --git a/configs/convnext/convnext_tiny_ascend.yaml b/configs/convnext/convnext_tiny_ascend.yaml index b786b2c42..ffec32c8a 100644 --- a/configs/convnext/convnext_tiny_ascend.yaml +++ b/configs/convnext/convnext_tiny_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 20 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: 'dynamic' diff --git 
a/configs/convnextv2/convnextv2_tiny_ascend.yaml b/configs/convnextv2/convnextv2_tiny_ascend.yaml index 605a0acb3..697790e53 100644 --- a/configs/convnextv2/convnextv2_tiny_ascend.yaml +++ b/configs/convnextv2/convnextv2_tiny_ascend.yaml @@ -52,7 +52,6 @@ warmup_epochs: 20 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.049 loss_scale_type: 'auto' diff --git a/configs/crossvit/crossvit_15_ascend.yaml b/configs/crossvit/crossvit_15_ascend.yaml index 74c403e73..7d6d24b21 100644 --- a/configs/crossvit/crossvit_15_ascend.yaml +++ b/configs/crossvit/crossvit_15_ascend.yaml @@ -57,7 +57,6 @@ cycle_decay: 1 # optimizer opt: 'adamw' weight_decay: 0.05 -filter_bias_and_bn: True loss_scale: 512 use_nesterov: False eps: 1e-8 diff --git a/configs/crossvit/crossvit_18_ascend.yaml b/configs/crossvit/crossvit_18_ascend.yaml index a9564a2fb..07bf783a7 100644 --- a/configs/crossvit/crossvit_18_ascend.yaml +++ b/configs/crossvit/crossvit_18_ascend.yaml @@ -55,7 +55,6 @@ decay_rate: 0.1 # optimizer opt: 'adamw' weight_decay: 0.05 -filter_bias_and_bn: True loss_scale: 1024 drop_overflow_update: True loss_scale_type: 'dynamic' diff --git a/configs/crossvit/crossvit_9_ascend.yaml b/configs/crossvit/crossvit_9_ascend.yaml index f6abb6a57..e6a03e7d8 100644 --- a/configs/crossvit/crossvit_9_ascend.yaml +++ b/configs/crossvit/crossvit_9_ascend.yaml @@ -54,7 +54,6 @@ decay_rate: 0.1 # optimizer opt: 'adamw' weight_decay: 0.05 -filter_bias_and_bn: True loss_scale_type: 'dynamic' drop_overflow_update: True use_nesterov: False diff --git a/configs/densenet/densenet_121_ascend.yaml b/configs/densenet/densenet_121_ascend.yaml index 70bf38878..fdcf44e9f 100644 --- a/configs/densenet/densenet_121_ascend.yaml +++ b/configs/densenet/densenet_121_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_121_gpu.yaml 
b/configs/densenet/densenet_121_gpu.yaml index 82e5e2688..d571ac970 100644 --- a/configs/densenet/densenet_121_gpu.yaml +++ b/configs/densenet/densenet_121_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_161_ascend.yaml b/configs/densenet/densenet_161_ascend.yaml index 9447dd0c4..6e3442fa0 100644 --- a/configs/densenet/densenet_161_ascend.yaml +++ b/configs/densenet/densenet_161_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_161_gpu.yaml b/configs/densenet/densenet_161_gpu.yaml index 9447dd0c4..6e3442fa0 100644 --- a/configs/densenet/densenet_161_gpu.yaml +++ b/configs/densenet/densenet_161_gpu.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_169_ascend.yaml b/configs/densenet/densenet_169_ascend.yaml index 53c27502d..0068fcd75 100644 --- a/configs/densenet/densenet_169_ascend.yaml +++ b/configs/densenet/densenet_169_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_169_gpu.yaml b/configs/densenet/densenet_169_gpu.yaml index 53c27502d..0068fcd75 100644 --- a/configs/densenet/densenet_169_gpu.yaml +++ b/configs/densenet/densenet_169_gpu.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_201_ascend.yaml b/configs/densenet/densenet_201_ascend.yaml index 4de9c1c34..124fd0620 100644 --- a/configs/densenet/densenet_201_ascend.yaml +++ b/configs/densenet/densenet_201_ascend.yaml @@ 
-44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/densenet/densenet_201_gpu.yaml b/configs/densenet/densenet_201_gpu.yaml index 4de9c1c34..124fd0620 100644 --- a/configs/densenet/densenet_201_gpu.yaml +++ b/configs/densenet/densenet_201_gpu.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/dpn/dpn107_ascend.yaml b/configs/dpn/dpn107_ascend.yaml index 9b7366ec6..c9228e1c4 100644 --- a/configs/dpn/dpn107_ascend.yaml +++ b/configs/dpn/dpn107_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'SGD' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/dpn/dpn131_ascend.yaml b/configs/dpn/dpn131_ascend.yaml index d9a737a6b..4d2e5ea03 100644 --- a/configs/dpn/dpn131_ascend.yaml +++ b/configs/dpn/dpn131_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'SGD' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/dpn/dpn92_ascend.yaml b/configs/dpn/dpn92_ascend.yaml index 9da4fc83f..0dd2b6246 100644 --- a/configs/dpn/dpn92_ascend.yaml +++ b/configs/dpn/dpn92_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'SGD' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/dpn/dpn98_ascend.yaml b/configs/dpn/dpn98_ascend.yaml index f9d9439de..4aa855c80 100644 --- a/configs/dpn/dpn98_ascend.yaml +++ b/configs/dpn/dpn98_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'SGD' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/edgenext/edgenext_base_ascend.yaml b/configs/edgenext/edgenext_base_ascend.yaml index 9c7511121..35a02c599 100644 --- a/configs/edgenext/edgenext_base_ascend.yaml +++ 
b/configs/edgenext/edgenext_base_ascend.yaml @@ -58,7 +58,6 @@ decay_epochs: 330 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/edgenext/edgenext_small_ascend.yaml b/configs/edgenext/edgenext_small_ascend.yaml index 1f4ad74f2..a9fb549ef 100644 --- a/configs/edgenext/edgenext_small_ascend.yaml +++ b/configs/edgenext/edgenext_small_ascend.yaml @@ -57,7 +57,6 @@ decay_epochs: 330 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/edgenext/edgenext_x_small_ascend.yaml b/configs/edgenext/edgenext_x_small_ascend.yaml index 71345491f..13e06d051 100644 --- a/configs/edgenext/edgenext_x_small_ascend.yaml +++ b/configs/edgenext/edgenext_x_small_ascend.yaml @@ -57,7 +57,6 @@ decay_epochs: 330 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/edgenext/edgenext_xx_small_ascend.yaml b/configs/edgenext/edgenext_xx_small_ascend.yaml index f3075d643..fc521837e 100644 --- a/configs/edgenext/edgenext_xx_small_ascend.yaml +++ b/configs/edgenext/edgenext_xx_small_ascend.yaml @@ -56,7 +56,6 @@ decay_epochs: 330 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/efficientnet/efficientnet_b0_ascend.yaml b/configs/efficientnet/efficientnet_b0_ascend.yaml index 38a538a49..01bae8652 100644 --- a/configs/efficientnet/efficientnet_b0_ascend.yaml +++ b/configs/efficientnet/efficientnet_b0_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 445 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale_type: 'dynamic' diff --git a/configs/efficientnet/efficientnet_b1_ascend.yaml b/configs/efficientnet/efficientnet_b1_ascend.yaml index 7d34b1d04..c11dc0027 100644 --- a/configs/efficientnet/efficientnet_b1_ascend.yaml +++ b/configs/efficientnet/efficientnet_b1_ascend.yaml @@ -46,7 
+46,6 @@ decay_epochs: 430 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale_type: 'dynamic' diff --git a/configs/ghostnet/ghostnet_050_ascend.yaml b/configs/ghostnet/ghostnet_050_ascend.yaml index 0629c74c1..5947a29cb 100644 --- a/configs/ghostnet/ghostnet_050_ascend.yaml +++ b/configs/ghostnet/ghostnet_050_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 580 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale_type: "dynamic" diff --git a/configs/ghostnet/ghostnet_100_ascend.yaml b/configs/ghostnet/ghostnet_100_ascend.yaml index d307e5342..2428ce128 100644 --- a/configs/ghostnet/ghostnet_100_ascend.yaml +++ b/configs/ghostnet/ghostnet_100_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 580 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale_type: "dynamic" diff --git a/configs/ghostnet/ghostnet_130_ascend.yaml b/configs/ghostnet/ghostnet_130_ascend.yaml index 904bf98d0..395dbd566 100644 --- a/configs/ghostnet/ghostnet_130_ascend.yaml +++ b/configs/ghostnet/ghostnet_130_ascend.yaml @@ -47,7 +47,6 @@ decay_epochs: 580 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale_type: "dynamic" diff --git a/configs/googlenet/googlenet_ascend.yaml b/configs/googlenet/googlenet_ascend.yaml index c0268aeaa..c08d83924 100644 --- a/configs/googlenet/googlenet_ascend.yaml +++ b/configs/googlenet/googlenet_ascend.yaml @@ -44,7 +44,6 @@ warmup_epochs: 5 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/halonet/halonet_50t_ascend.yaml b/configs/halonet/halonet_50t_ascend.yaml index 50693bdf8..603dcffa9 100644 --- a/configs/halonet/halonet_50t_ascend.yaml +++ b/configs/halonet/halonet_50t_ascend.yaml @@ -43,7 +43,6 @@ val_amp_level: 'O2' # optimizer opt: 'adamw' -filter_bias_and_bn: True weight_decay: 0.04 loss_scale: 1024 
use_nesterov: False diff --git a/configs/hrnet/hrnet_w32_ascend.yaml b/configs/hrnet/hrnet_w32_ascend.yaml index 43375be8b..d1e78af89 100644 --- a/configs/hrnet/hrnet_w32_ascend.yaml +++ b/configs/hrnet/hrnet_w32_ascend.yaml @@ -52,4 +52,3 @@ decay_epochs: 280 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True diff --git a/configs/hrnet/hrnet_w48_ascend.yaml b/configs/hrnet/hrnet_w48_ascend.yaml index 8d1c06032..6e2818f0b 100644 --- a/configs/hrnet/hrnet_w48_ascend.yaml +++ b/configs/hrnet/hrnet_w48_ascend.yaml @@ -52,4 +52,3 @@ decay_epochs: 280 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True diff --git a/configs/inceptionv3/inception_v3_ascend.yaml b/configs/inceptionv3/inception_v3_ascend.yaml index 4bdfbe246..56313ae8d 100644 --- a/configs/inceptionv3/inception_v3_ascend.yaml +++ b/configs/inceptionv3/inception_v3_ascend.yaml @@ -47,7 +47,6 @@ warmup_epochs: 5 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/inceptionv4/inception_v4_ascend.yaml b/configs/inceptionv4/inception_v4_ascend.yaml index 22ad03d40..7c1cf6342 100644 --- a/configs/inceptionv4/inception_v4_ascend.yaml +++ b/configs/inceptionv4/inception_v4_ascend.yaml @@ -46,7 +46,6 @@ warmup_epochs: 5 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/mixnet/mixnet_l_ascend.yaml b/configs/mixnet/mixnet_l_ascend.yaml index c72755f12..7b6ec097a 100644 --- a/configs/mixnet/mixnet_l_ascend.yaml +++ b/configs/mixnet/mixnet_l_ascend.yaml @@ -48,7 +48,6 @@ warmup_epochs: 20 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale_type: "dynamic" diff --git a/configs/mixnet/mixnet_m_ascend.yaml b/configs/mixnet/mixnet_m_ascend.yaml index a655a2c7e..50f430c7f 100644 --- a/configs/mixnet/mixnet_m_ascend.yaml +++ b/configs/mixnet/mixnet_m_ascend.yaml @@ -50,7 +50,6 @@ 
warmup_epochs: 15 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale: 1024 diff --git a/configs/mixnet/mixnet_s_ascend.yaml b/configs/mixnet/mixnet_s_ascend.yaml index eaad3961f..e362e8a2d 100644 --- a/configs/mixnet/mixnet_s_ascend.yaml +++ b/configs/mixnet/mixnet_s_ascend.yaml @@ -49,7 +49,6 @@ warmup_epochs: 15 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00002 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_0.5_ascend.yaml b/configs/mnasnet/mnasnet_0.5_ascend.yaml index bbce1a8bf..791a70ccc 100644 --- a/configs/mnasnet/mnasnet_0.5_ascend.yaml +++ b/configs/mnasnet/mnasnet_0.5_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 395 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_0.75_ascend.yaml b/configs/mnasnet/mnasnet_0.75_ascend.yaml index 814c35807..f527eb810 100644 --- a/configs/mnasnet/mnasnet_0.75_ascend.yaml +++ b/configs/mnasnet/mnasnet_0.75_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 345 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_0.75_gpu.yaml b/configs/mnasnet/mnasnet_0.75_gpu.yaml index 7bbbadd9a..a19d44a01 100644 --- a/configs/mnasnet/mnasnet_0.75_gpu.yaml +++ b/configs/mnasnet/mnasnet_0.75_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 345 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_1.0_ascend.yaml b/configs/mnasnet/mnasnet_1.0_ascend.yaml index 771fdda34..3fb5e2017 100644 --- a/configs/mnasnet/mnasnet_1.0_ascend.yaml +++ b/configs/mnasnet/mnasnet_1.0_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 445 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_1.0_gpu.yaml b/configs/mnasnet/mnasnet_1.0_gpu.yaml index 
4efd8240b..aedb770c7 100644 --- a/configs/mnasnet/mnasnet_1.0_gpu.yaml +++ b/configs/mnasnet/mnasnet_1.0_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 445 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_1.3_ascend.yaml b/configs/mnasnet/mnasnet_1.3_ascend.yaml index 5dcc2624f..95e0c7710 100644 --- a/configs/mnasnet/mnasnet_1.3_ascend.yaml +++ b/configs/mnasnet/mnasnet_1.3_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 395 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_1.4_ascend.yaml b/configs/mnasnet/mnasnet_1.4_ascend.yaml index dc84463ab..71f26a5d0 100644 --- a/configs/mnasnet/mnasnet_1.4_ascend.yaml +++ b/configs/mnasnet/mnasnet_1.4_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 395 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mnasnet/mnasnet_1.4_gpu.yaml b/configs/mnasnet/mnasnet_1.4_gpu.yaml index 7d30e3568..92790cfb3 100644 --- a/configs/mnasnet/mnasnet_1.4_gpu.yaml +++ b/configs/mnasnet/mnasnet_1.4_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 395 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale: 256 diff --git a/configs/mobilenetv1/mobilenet_v1_0.25_ascend.yaml b/configs/mobilenetv1/mobilenet_v1_0.25_ascend.yaml index a089bb6b3..28058873c 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.25_ascend.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.25_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_0.25_gpu.yaml b/configs/mobilenetv1/mobilenet_v1_0.25_gpu.yaml index a089bb6b3..28058873c 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.25_gpu.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.25_gpu.yaml @@ -43,7 +43,6 @@ 
decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_0.5_ascend.yaml b/configs/mobilenetv1/mobilenet_v1_0.5_ascend.yaml index e9c0445cb..58beff2c9 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.5_ascend.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.5_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_0.5_gpu.yaml b/configs/mobilenetv1/mobilenet_v1_0.5_gpu.yaml index e9c0445cb..58beff2c9 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.5_gpu.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.5_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_0.75_ascend.yaml b/configs/mobilenetv1/mobilenet_v1_0.75_ascend.yaml index 8a37f2394..c9b8f35e3 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.75_ascend.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.75_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_0.75_gpu.yaml b/configs/mobilenetv1/mobilenet_v1_0.75_gpu.yaml index 8a37f2394..c9b8f35e3 100644 --- a/configs/mobilenetv1/mobilenet_v1_0.75_gpu.yaml +++ b/configs/mobilenetv1/mobilenet_v1_0.75_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_1.0_ascend.yaml b/configs/mobilenetv1/mobilenet_v1_1.0_ascend.yaml index 543e65832..2c6ad6f35 100644 --- a/configs/mobilenetv1/mobilenet_v1_1.0_ascend.yaml +++ b/configs/mobilenetv1/mobilenet_v1_1.0_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 
198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv1/mobilenet_v1_1.0_gpu.yaml b/configs/mobilenetv1/mobilenet_v1_1.0_gpu.yaml index 4ef48e61c..05967c6ec 100644 --- a/configs/mobilenetv1/mobilenet_v1_1.0_gpu.yaml +++ b/configs/mobilenetv1/mobilenet_v1_1.0_gpu.yaml @@ -44,7 +44,6 @@ decay_epochs: 198 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv2/mobilenet_v2_0.75_ascend.yaml b/configs/mobilenetv2/mobilenet_v2_0.75_ascend.yaml index 82fb12395..bc9ad4f33 100644 --- a/configs/mobilenetv2/mobilenet_v2_0.75_ascend.yaml +++ b/configs/mobilenetv2/mobilenet_v2_0.75_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 396 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00003 loss_scale: 1024 diff --git a/configs/mobilenetv2/mobilenet_v2_1.0_ascend.yaml b/configs/mobilenetv2/mobilenet_v2_1.0_ascend.yaml index 5d271c1f7..0192d7804 100644 --- a/configs/mobilenetv2/mobilenet_v2_1.0_ascend.yaml +++ b/configs/mobilenetv2/mobilenet_v2_1.0_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 316 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/mobilenetv2/mobilenet_v2_1.4_ascend.yaml b/configs/mobilenetv2/mobilenet_v2_1.4_ascend.yaml index 56397195a..7201f01cc 100644 --- a/configs/mobilenetv2/mobilenet_v2_1.4_ascend.yaml +++ b/configs/mobilenetv2/mobilenet_v2_1.4_ascend.yaml @@ -45,7 +45,7 @@ decay_epochs: 296 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/mobilenetv3/mobilenet_v3_large_ascend.yaml b/configs/mobilenetv3/mobilenet_v3_large_ascend.yaml index 19eb0120f..8abe7c2c6 100644 --- a/configs/mobilenetv3/mobilenet_v3_large_ascend.yaml +++ b/configs/mobilenetv3/mobilenet_v3_large_ascend.yaml 
@@ -45,7 +45,7 @@ decay_epochs: 416 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00002 loss_scale: 1024 diff --git a/configs/mobilenetv3/mobilenet_v3_small_ascend.yaml b/configs/mobilenetv3/mobilenet_v3_small_ascend.yaml index 5c75d4e0e..fe19448e4 100644 --- a/configs/mobilenetv3/mobilenet_v3_small_ascend.yaml +++ b/configs/mobilenetv3/mobilenet_v3_small_ascend.yaml @@ -46,7 +46,7 @@ decay_epochs: 466 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00002 loss_scale: 1024 diff --git a/configs/mobilevit/mobilevit_small_ascend.yaml b/configs/mobilevit/mobilevit_small_ascend.yaml index 4650cadbe..5be05d8d7 100644 --- a/configs/mobilevit/mobilevit_small_ascend.yaml +++ b/configs/mobilevit/mobilevit_small_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 430 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.01 use_nesterov: False diff --git a/configs/mobilevit/mobilevit_x_small_ascend.yaml b/configs/mobilevit/mobilevit_x_small_ascend.yaml index 994a7c60b..a8f2fa92b 100644 --- a/configs/mobilevit/mobilevit_x_small_ascend.yaml +++ b/configs/mobilevit/mobilevit_x_small_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 430 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.01 use_nesterov: False diff --git a/configs/mobilevit/mobilevit_xx_small_ascend.yaml b/configs/mobilevit/mobilevit_xx_small_ascend.yaml index 127c5a9f7..583cbda27 100644 --- a/configs/mobilevit/mobilevit_xx_small_ascend.yaml +++ b/configs/mobilevit/mobilevit_xx_small_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 410 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.01 use_nesterov: False diff --git a/configs/nasnet/nasnet_a_4x1056_ascend.yaml b/configs/nasnet/nasnet_a_4x1056_ascend.yaml index 07ea9b141..f996d16e2 100644 --- a/configs/nasnet/nasnet_a_4x1056_ascend.yaml +++ 
b/configs/nasnet/nasnet_a_4x1056_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 445 # optimizer opt: 'rmsprop' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1e-5 loss_scale_type: 'dynamic' diff --git a/configs/pit/pit_b_ascend.yaml b/configs/pit/pit_b_ascend.yaml index 5ca3c629a..47dc116e5 100644 --- a/configs/pit/pit_b_ascend.yaml +++ b/configs/pit/pit_b_ascend.yaml @@ -53,7 +53,6 @@ warmup_factor: 0.002 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "auto" diff --git a/configs/pit/pit_s_ascend.yaml b/configs/pit/pit_s_ascend.yaml index ef13fb3d8..0f2b79beb 100644 --- a/configs/pit/pit_s_ascend.yaml +++ b/configs/pit/pit_s_ascend.yaml @@ -53,7 +53,6 @@ warmup_factor: 0.002 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "dynamic" diff --git a/configs/pit/pit_ti_ascend.yaml b/configs/pit/pit_ti_ascend.yaml index 0c8a47b51..7a8f73d03 100644 --- a/configs/pit/pit_ti_ascend.yaml +++ b/configs/pit/pit_ti_ascend.yaml @@ -50,7 +50,6 @@ warmup_epochs: 10 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "auto" diff --git a/configs/pit/pit_xs_ascend.yaml b/configs/pit/pit_xs_ascend.yaml index 9b8fc5fdf..c789d6658 100644 --- a/configs/pit/pit_xs_ascend.yaml +++ b/configs/pit/pit_xs_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 10 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "dynamic" diff --git a/configs/poolformer/poolformer_s12_ascend.yaml b/configs/poolformer/poolformer_s12_ascend.yaml index 535a5fe64..0e42aa94f 100644 --- a/configs/poolformer/poolformer_s12_ascend.yaml +++ b/configs/poolformer/poolformer_s12_ascend.yaml @@ -54,7 +54,6 @@ decay_rate: 0.1 # optimizer opt: 'AdamW' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/pvt/pvt_large_ascend.yaml b/configs/pvt/pvt_large_ascend.yaml index 
76a12370f..2078a499e 100644 --- a/configs/pvt/pvt_large_ascend.yaml +++ b/configs/pvt/pvt_large_ascend.yaml @@ -52,5 +52,4 @@ decay_epochs: 390 opt: 'adamw' weight_decay: 0.05 loss_scale: 300 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/pvt/pvt_medium_ascend.yaml b/configs/pvt/pvt_medium_ascend.yaml index 21560b614..d663f2c0f 100644 --- a/configs/pvt/pvt_medium_ascend.yaml +++ b/configs/pvt/pvt_medium_ascend.yaml @@ -52,5 +52,4 @@ decay_epochs: 390 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/pvt/pvt_small_ascend.yaml b/configs/pvt/pvt_small_ascend.yaml index 55f0ca9be..4b773e791 100644 --- a/configs/pvt/pvt_small_ascend.yaml +++ b/configs/pvt/pvt_small_ascend.yaml @@ -52,5 +52,4 @@ decay_epochs: 390 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/pvt/pvt_tiny_ascend.yaml b/configs/pvt/pvt_tiny_ascend.yaml index 5610ea5ed..368922728 100644 --- a/configs/pvt/pvt_tiny_ascend.yaml +++ b/configs/pvt/pvt_tiny_ascend.yaml @@ -52,5 +52,4 @@ decay_epochs: 440 opt: 'adamw' weight_decay: 0.05 loss_scale: 1024 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/pvtv2/pvt_v2_b0_ascend.yaml b/configs/pvtv2/pvt_v2_b0_ascend.yaml index 8cd627636..518d4b23f 100644 --- a/configs/pvtv2/pvt_v2_b0_ascend.yaml +++ b/configs/pvtv2/pvt_v2_b0_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 10 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "dynamic" diff --git a/configs/pvtv2/pvt_v2_b1_ascend.yaml b/configs/pvtv2/pvt_v2_b1_ascend.yaml index 0e556eb70..9639adfe8 100644 --- a/configs/pvtv2/pvt_v2_b1_ascend.yaml +++ b/configs/pvtv2/pvt_v2_b1_ascend.yaml @@ -51,7 +51,6 @@ warmup_epochs: 10 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "dynamic" diff --git a/configs/pvtv2/pvt_v2_b2_ascend.yaml 
b/configs/pvtv2/pvt_v2_b2_ascend.yaml index 1f2ff2a44..a35addd9c 100644 --- a/configs/pvtv2/pvt_v2_b2_ascend.yaml +++ b/configs/pvtv2/pvt_v2_b2_ascend.yaml @@ -50,7 +50,6 @@ warmup_epochs: 20 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "dynamic" diff --git a/configs/pvtv2/pvt_v2_b3_ascend.yaml b/configs/pvtv2/pvt_v2_b3_ascend.yaml index e8037caf4..c2f51da6f 100644 --- a/configs/pvtv2/pvt_v2_b3_ascend.yaml +++ b/configs/pvtv2/pvt_v2_b3_ascend.yaml @@ -50,7 +50,6 @@ warmup_epochs: 20 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "auto" diff --git a/configs/pvtv2/pvt_v2_b4_ascend.yaml b/configs/pvtv2/pvt_v2_b4_ascend.yaml index 91bffc05b..1a247e124 100644 --- a/configs/pvtv2/pvt_v2_b4_ascend.yaml +++ b/configs/pvtv2/pvt_v2_b4_ascend.yaml @@ -50,7 +50,6 @@ warmup_epochs: 20 # optimizer opt: "adamw" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale_type: "auto" diff --git a/configs/regnet/regnet_x_200mf_ascend.yaml b/configs/regnet/regnet_x_200mf_ascend.yaml index 1293f7431..272b45526 100644 --- a/configs/regnet/regnet_x_200mf_ascend.yaml +++ b/configs/regnet/regnet_x_200mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_x_400mf_ascend.yaml b/configs/regnet/regnet_x_400mf_ascend.yaml index 3073cfc3e..b93c62dea 100644 --- a/configs/regnet/regnet_x_400mf_ascend.yaml +++ b/configs/regnet/regnet_x_400mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_x_600mf_ascend.yaml b/configs/regnet/regnet_x_600mf_ascend.yaml index b45d7484e..6d7e9cb7f 100644 --- a/configs/regnet/regnet_x_600mf_ascend.yaml +++ b/configs/regnet/regnet_x_600mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' 
momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_x_800mf_ascend.yaml b/configs/regnet/regnet_x_800mf_ascend.yaml index 9902be17b..ee2892371 100644 --- a/configs/regnet/regnet_x_800mf_ascend.yaml +++ b/configs/regnet/regnet_x_800mf_ascend.yaml @@ -52,4 +52,3 @@ momentum: 0.9 weight_decay: 0.0001 loss_scale: 128 use_nesterov: False -filter_bias_and_bn: True diff --git a/configs/regnet/regnet_y_16gf_ascend.yaml b/configs/regnet/regnet_y_16gf_ascend.yaml index c5588c231..29cd15886 100644 --- a/configs/regnet/regnet_y_16gf_ascend.yaml +++ b/configs/regnet/regnet_y_16gf_ascend.yaml @@ -55,7 +55,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 4e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_y_200mf_ascend.yaml b/configs/regnet/regnet_y_200mf_ascend.yaml index 2fecef323..aea21aaeb 100644 --- a/configs/regnet/regnet_y_200mf_ascend.yaml +++ b/configs/regnet/regnet_y_200mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_y_400mf_ascend.yaml b/configs/regnet/regnet_y_400mf_ascend.yaml index b8b90be87..e88aa1211 100644 --- a/configs/regnet/regnet_y_400mf_ascend.yaml +++ b/configs/regnet/regnet_y_400mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_y_600mf_ascend.yaml b/configs/regnet/regnet_y_600mf_ascend.yaml index b2687b424..b233e7e31 100644 --- a/configs/regnet/regnet_y_600mf_ascend.yaml +++ b/configs/regnet/regnet_y_600mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/regnet/regnet_y_800mf_ascend.yaml b/configs/regnet/regnet_y_800mf_ascend.yaml 
index 9471a0a49..ec72f0612 100644 --- a/configs/regnet/regnet_y_800mf_ascend.yaml +++ b/configs/regnet/regnet_y_800mf_ascend.yaml @@ -49,7 +49,6 @@ opt: 'momentum' momentum: 0.9 weight_decay: 5e-5 use_nesterov: False -filter_bias_and_bn: True # amp amp_level: 'O2' diff --git a/configs/repmlp/repmlp_t224_ascend.yaml b/configs/repmlp/repmlp_t224_ascend.yaml index c47e2777f..4c4fb4d2b 100644 --- a/configs/repmlp/repmlp_t224_ascend.yaml +++ b/configs/repmlp/repmlp_t224_ascend.yaml @@ -55,7 +55,6 @@ decay_rate: 0.01 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 2e-05 loss_scale: 1024 diff --git a/configs/repvgg/repvgg_a0_ascend.yaml b/configs/repvgg/repvgg_a0_ascend.yaml index 05919cb33..534d9d1a7 100644 --- a/configs/repvgg/repvgg_a0_ascend.yaml +++ b/configs/repvgg/repvgg_a0_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 390 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_a1_ascend.yaml b/configs/repvgg/repvgg_a1_ascend.yaml index 8b09349f5..3144967f0 100644 --- a/configs/repvgg/repvgg_a1_ascend.yaml +++ b/configs/repvgg/repvgg_a1_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_a2_ascend.yaml b/configs/repvgg/repvgg_a2_ascend.yaml index 36ee7269a..554f43acf 100644 --- a/configs/repvgg/repvgg_a2_ascend.yaml +++ b/configs/repvgg/repvgg_a2_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b0_ascend.yaml b/configs/repvgg/repvgg_b0_ascend.yaml index e5ab6bbb1..92c38c723 100644 --- a/configs/repvgg/repvgg_b0_ascend.yaml +++ b/configs/repvgg/repvgg_b0_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: 
True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b1_ascend.yaml b/configs/repvgg/repvgg_b1_ascend.yaml index b33462022..8329ac589 100644 --- a/configs/repvgg/repvgg_b1_ascend.yaml +++ b/configs/repvgg/repvgg_b1_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b1g2_ascend.yaml b/configs/repvgg/repvgg_b1g2_ascend.yaml index 28b5bd8c5..c44cbc0ed 100644 --- a/configs/repvgg/repvgg_b1g2_ascend.yaml +++ b/configs/repvgg/repvgg_b1g2_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b1g4_ascend.yaml b/configs/repvgg/repvgg_b1g4_ascend.yaml index 05e336b03..0c6af8863 100644 --- a/configs/repvgg/repvgg_b1g4_ascend.yaml +++ b/configs/repvgg/repvgg_b1g4_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b2_ascend.yaml b/configs/repvgg/repvgg_b2_ascend.yaml index e98e3df1d..c0d72b6fa 100644 --- a/configs/repvgg/repvgg_b2_ascend.yaml +++ b/configs/repvgg/repvgg_b2_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b2g4_ascend.yaml b/configs/repvgg/repvgg_b2g4_ascend.yaml index 324a45fa7..819ba81e6 100644 --- a/configs/repvgg/repvgg_b2g4_ascend.yaml +++ b/configs/repvgg/repvgg_b2g4_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/repvgg/repvgg_b3_ascend.yaml b/configs/repvgg/repvgg_b3_ascend.yaml index 
d870f9c1b..e6dc995fe 100644 --- a/configs/repvgg/repvgg_b3_ascend.yaml +++ b/configs/repvgg/repvgg_b3_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 235 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/res2net/res2net_101_ascend.yaml b/configs/res2net/res2net_101_ascend.yaml index a645151a0..ab9487df2 100644 --- a/configs/res2net/res2net_101_ascend.yaml +++ b/configs/res2net/res2net_101_ascend.yaml @@ -49,7 +49,6 @@ decay_epochs: 30 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_101_gpu.yaml b/configs/res2net/res2net_101_gpu.yaml index 632d7c29e..d1336cb3f 100644 --- a/configs/res2net/res2net_101_gpu.yaml +++ b/configs/res2net/res2net_101_gpu.yaml @@ -49,7 +49,6 @@ decay_epochs: 295 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_101_v1b_ascend.yaml b/configs/res2net/res2net_101_v1b_ascend.yaml index 5fdbe6fab..65f97ce98 100644 --- a/configs/res2net/res2net_101_v1b_ascend.yaml +++ b/configs/res2net/res2net_101_v1b_ascend.yaml @@ -48,7 +48,6 @@ decay_epochs: 196 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_101_v1b_gpu.yaml b/configs/res2net/res2net_101_v1b_gpu.yaml index 929678bd6..2282b5fb0 100644 --- a/configs/res2net/res2net_101_v1b_gpu.yaml +++ b/configs/res2net/res2net_101_v1b_gpu.yaml @@ -49,7 +49,6 @@ decay_epochs: 295 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_50_ascend.yaml b/configs/res2net/res2net_50_ascend.yaml index a9339b79d..8891f61b1 100644 --- a/configs/res2net/res2net_50_ascend.yaml +++ b/configs/res2net/res2net_50_ascend.yaml @@ -48,7 +48,6 @@ decay_epochs: 196 # optimizer opt: 
"momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_50_gpu.yaml b/configs/res2net/res2net_50_gpu.yaml index e283e00d6..74637a924 100644 --- a/configs/res2net/res2net_50_gpu.yaml +++ b/configs/res2net/res2net_50_gpu.yaml @@ -49,7 +49,6 @@ decay_epochs: 295 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_50_v1b_ascend.yaml b/configs/res2net/res2net_50_v1b_ascend.yaml index e75ce6b81..4f14e7035 100644 --- a/configs/res2net/res2net_50_v1b_ascend.yaml +++ b/configs/res2net/res2net_50_v1b_ascend.yaml @@ -49,7 +49,6 @@ decay_epochs: 295 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/res2net/res2net_50_v1b_gpu.yaml b/configs/res2net/res2net_50_v1b_gpu.yaml index f404a027c..acd7ff522 100644 --- a/configs/res2net/res2net_50_v1b_gpu.yaml +++ b/configs/res2net/res2net_50_v1b_gpu.yaml @@ -49,7 +49,6 @@ decay_epochs: 295 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnest/resnest101_ascend.yaml b/configs/resnest/resnest101_ascend.yaml index a26319f3a..393536781 100644 --- a/configs/resnest/resnest101_ascend.yaml +++ b/configs/resnest/resnest101_ascend.yaml @@ -50,7 +50,6 @@ decay_epochs: 345 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00009 loss_scale_type: "auto" diff --git a/configs/resnest/resnest50_ascend.yaml b/configs/resnest/resnest50_ascend.yaml index c558f5c82..3d37a2267 100644 --- a/configs/resnest/resnest50_ascend.yaml +++ b/configs/resnest/resnest50_ascend.yaml @@ -49,7 +49,6 @@ decay_epochs: 345 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale_type: "dynamic" diff --git a/configs/resnet/resnet_101_ascend.yaml b/configs/resnet/resnet_101_ascend.yaml 
index 9022c0246..cdcffef17 100644 --- a/configs/resnet/resnet_101_ascend.yaml +++ b/configs/resnet/resnet_101_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_101_gpu.yaml b/configs/resnet/resnet_101_gpu.yaml index 9022c0246..cdcffef17 100644 --- a/configs/resnet/resnet_101_gpu.yaml +++ b/configs/resnet/resnet_101_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_152_ascend.yaml b/configs/resnet/resnet_152_ascend.yaml index ee01e33ad..7eb2b7b82 100644 --- a/configs/resnet/resnet_152_ascend.yaml +++ b/configs/resnet/resnet_152_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_152_gpu.yaml b/configs/resnet/resnet_152_gpu.yaml index ee01e33ad..7eb2b7b82 100644 --- a/configs/resnet/resnet_152_gpu.yaml +++ b/configs/resnet/resnet_152_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_18_ascend.yaml b/configs/resnet/resnet_18_ascend.yaml index 33b014631..33e08ac32 100644 --- a/configs/resnet/resnet_18_ascend.yaml +++ b/configs/resnet/resnet_18_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_18_gpu.yaml b/configs/resnet/resnet_18_gpu.yaml index 33b014631..33e08ac32 100644 --- a/configs/resnet/resnet_18_gpu.yaml +++ b/configs/resnet/resnet_18_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff 
--git a/configs/resnet/resnet_34_ascend.yaml b/configs/resnet/resnet_34_ascend.yaml index 8e130cd3f..a9ecc5bae 100644 --- a/configs/resnet/resnet_34_ascend.yaml +++ b/configs/resnet/resnet_34_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_34_gpu.yaml b/configs/resnet/resnet_34_gpu.yaml index 8e130cd3f..a9ecc5bae 100644 --- a/configs/resnet/resnet_34_gpu.yaml +++ b/configs/resnet/resnet_34_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_50_ascend.yaml b/configs/resnet/resnet_50_ascend.yaml index 76f0be6de..2a2d7bbde 100644 --- a/configs/resnet/resnet_50_ascend.yaml +++ b/configs/resnet/resnet_50_ascend.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnet/resnet_50_gpu.yaml b/configs/resnet/resnet_50_gpu.yaml index 76f0be6de..2a2d7bbde 100644 --- a/configs/resnet/resnet_50_gpu.yaml +++ b/configs/resnet/resnet_50_gpu.yaml @@ -43,7 +43,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnetv2/resnetv2_101_ascend.yaml b/configs/resnetv2/resnetv2_101_ascend.yaml index 3f72b2e1b..35044d3fd 100644 --- a/configs/resnetv2/resnetv2_101_ascend.yaml +++ b/configs/resnetv2/resnetv2_101_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnetv2/resnetv2_50_ascend.yaml b/configs/resnetv2/resnetv2_50_ascend.yaml index d299e424e..4ecbf9f4a 100644 --- a/configs/resnetv2/resnetv2_50_ascend.yaml +++ b/configs/resnetv2/resnetv2_50_ascend.yaml @@ -44,7 +44,6 @@ 
decay_epochs: 120 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnext/resnext101_32x4d_ascend.yaml b/configs/resnext/resnext101_32x4d_ascend.yaml index 247af9042..276d3fa7c 100644 --- a/configs/resnext/resnext101_32x4d_ascend.yaml +++ b/configs/resnext/resnext101_32x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnext/resnext101_64x4d_ascend.yaml b/configs/resnext/resnext101_64x4d_ascend.yaml index 25c9b5cb7..651e62ef1 100644 --- a/configs/resnext/resnext101_64x4d_ascend.yaml +++ b/configs/resnext/resnext101_64x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnext/resnext152_64x4d_ascend.yaml b/configs/resnext/resnext152_64x4d_ascend.yaml index 9864bc906..12defbff0 100644 --- a/configs/resnext/resnext152_64x4d_ascend.yaml +++ b/configs/resnext/resnext152_64x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/resnext/resnext50_32x4d_ascend.yaml b/configs/resnext/resnext50_32x4d_ascend.yaml index 80d461d87..d3eee9284 100644 --- a/configs/resnext/resnext50_32x4d_ascend.yaml +++ b/configs/resnext/resnext50_32x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/rexnet/rexnet_x09_ascend.yaml b/configs/rexnet/rexnet_x09_ascend.yaml index 615b41a41..d3ed9a0c0 100644 --- a/configs/rexnet/rexnet_x09_ascend.yaml +++ b/configs/rexnet/rexnet_x09_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 395 # optimizer opt: "sgd" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1.0e-5 loss_scale: 
1024 diff --git a/configs/rexnet/rexnet_x10_ascend.yaml b/configs/rexnet/rexnet_x10_ascend.yaml index 1439df063..f2637fc38 100644 --- a/configs/rexnet/rexnet_x10_ascend.yaml +++ b/configs/rexnet/rexnet_x10_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 395 # optimizer opt: "sgd" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1.0e-5 loss_scale: 1024 diff --git a/configs/rexnet/rexnet_x13_ascend.yaml b/configs/rexnet/rexnet_x13_ascend.yaml index 38d07d352..ec57a82ff 100644 --- a/configs/rexnet/rexnet_x13_ascend.yaml +++ b/configs/rexnet/rexnet_x13_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 395 # optimizer opt: "sgd" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1.0e-5 loss_scale: 1024 diff --git a/configs/rexnet/rexnet_x15_ascend.yaml b/configs/rexnet/rexnet_x15_ascend.yaml index 2165d8c3f..d5845ad26 100644 --- a/configs/rexnet/rexnet_x15_ascend.yaml +++ b/configs/rexnet/rexnet_x15_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 370 # optimizer opt: "sgd" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1.0e-5 loss_scale: 1024 diff --git a/configs/rexnet/rexnet_x20_ascend.yaml b/configs/rexnet/rexnet_x20_ascend.yaml index b1729e176..023646973 100644 --- a/configs/rexnet/rexnet_x20_ascend.yaml +++ b/configs/rexnet/rexnet_x20_ascend.yaml @@ -46,7 +46,6 @@ decay_epochs: 370 # optimizer opt: "sgd" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 1.0e-5 loss_scale: 1024 diff --git a/configs/senet/seresnet18_ascend.yaml b/configs/senet/seresnet18_ascend.yaml index b437edba6..111f51a9d 100644 --- a/configs/senet/seresnet18_ascend.yaml +++ b/configs/senet/seresnet18_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/senet/seresnet34_ascend.yaml b/configs/senet/seresnet34_ascend.yaml index 34420bc62..ac49133c6 100644 --- a/configs/senet/seresnet34_ascend.yaml +++ b/configs/senet/seresnet34_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 
150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/senet/seresnet50_ascend.yaml b/configs/senet/seresnet50_ascend.yaml index f1a1849c6..f9b5aa21d 100644 --- a/configs/senet/seresnet50_ascend.yaml +++ b/configs/senet/seresnet50_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/senet/seresnext26_32x4d_ascend.yaml b/configs/senet/seresnext26_32x4d_ascend.yaml index 18b519c8d..c424f9c46 100644 --- a/configs/senet/seresnext26_32x4d_ascend.yaml +++ b/configs/senet/seresnext26_32x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/senet/seresnext50_32x4d_ascend.yaml b/configs/senet/seresnext50_32x4d_ascend.yaml index 8c1ec6e89..88d3781ab 100644 --- a/configs/senet/seresnext50_32x4d_ascend.yaml +++ b/configs/senet/seresnext50_32x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 150 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/shufflenetv1/shufflenet_v1_0.5_ascend.yaml b/configs/shufflenetv1/shufflenet_v1_0.5_ascend.yaml index adccfdb9f..56b2dead3 100644 --- a/configs/shufflenetv1/shufflenet_v1_0.5_ascend.yaml +++ b/configs/shufflenetv1/shufflenet_v1_0.5_ascend.yaml @@ -42,7 +42,7 @@ decay_epochs: 246 # optimizer opt: "momentum" -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/shufflenetv1/shufflenet_v1_1.0_ascend.yaml b/configs/shufflenetv1/shufflenet_v1_1.0_ascend.yaml index a48a0d28b..85cff636d 100644 --- a/configs/shufflenetv1/shufflenet_v1_1.0_ascend.yaml +++ b/configs/shufflenetv1/shufflenet_v1_1.0_ascend.yaml @@ -42,7 +42,7 @@ decay_epochs: 246 # optimizer opt: "momentum" 
-filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/shufflenetv2/shufflenet_v2_0.5_ascend.yaml b/configs/shufflenetv2/shufflenet_v2_0.5_ascend.yaml index 23f6e42fd..29d2752da 100644 --- a/configs/shufflenetv2/shufflenet_v2_0.5_ascend.yaml +++ b/configs/shufflenetv2/shufflenet_v2_0.5_ascend.yaml @@ -44,7 +44,7 @@ decay_epochs: 246 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/shufflenetv2/shufflenet_v2_1.0_ascend.yaml b/configs/shufflenetv2/shufflenet_v2_1.0_ascend.yaml index d21403653..76f557221 100644 --- a/configs/shufflenetv2/shufflenet_v2_1.0_ascend.yaml +++ b/configs/shufflenetv2/shufflenet_v2_1.0_ascend.yaml @@ -44,7 +44,7 @@ decay_epochs: 295 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/shufflenetv2/shufflenet_v2_1.5_ascend.yaml b/configs/shufflenetv2/shufflenet_v2_1.5_ascend.yaml index a6871768a..4801974e8 100644 --- a/configs/shufflenetv2/shufflenet_v2_1.5_ascend.yaml +++ b/configs/shufflenetv2/shufflenet_v2_1.5_ascend.yaml @@ -44,7 +44,7 @@ decay_epochs: 295 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/shufflenetv2/shufflenet_v2_2.0_ascend.yaml b/configs/shufflenetv2/shufflenet_v2_2.0_ascend.yaml index 974149fbe..a8531236b 100644 --- a/configs/shufflenetv2/shufflenet_v2_2.0_ascend.yaml +++ b/configs/shufflenetv2/shufflenet_v2_2.0_ascend.yaml @@ -44,7 +44,7 @@ decay_epochs: 295 # optimizer opt: 'momentum' -filter_bias_and_bn: False +weight_decay_filter: 'auto' momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/sknet/skresnet18_ascend.yaml b/configs/sknet/skresnet18_ascend.yaml index c8f9fa2a2..97ebfca39 100644 --- 
a/configs/sknet/skresnet18_ascend.yaml +++ b/configs/sknet/skresnet18_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 195 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/sknet/skresnet34_ascend.yaml b/configs/sknet/skresnet34_ascend.yaml index 22275fc5b..87e62b8a9 100644 --- a/configs/sknet/skresnet34_ascend.yaml +++ b/configs/sknet/skresnet34_ascend.yaml @@ -47,7 +47,6 @@ warmup_factor: 0.01 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 128 diff --git a/configs/sknet/skresnext50_32x4d_ascend.yaml b/configs/sknet/skresnext50_32x4d_ascend.yaml index 7da59b34a..9e557e558 100644 --- a/configs/sknet/skresnext50_32x4d_ascend.yaml +++ b/configs/sknet/skresnext50_32x4d_ascend.yaml @@ -44,7 +44,6 @@ decay_epochs: 195 # optimizer opt: "momentum" -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/squeezenet/squeezenet_1.0_ascend.yaml b/configs/squeezenet/squeezenet_1.0_ascend.yaml index 0179d00cb..cb2df5061 100644 --- a/configs/squeezenet/squeezenet_1.0_ascend.yaml +++ b/configs/squeezenet/squeezenet_1.0_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0001 loss_scale: 1024 diff --git a/configs/squeezenet/squeezenet_1.0_gpu.yaml b/configs/squeezenet/squeezenet_1.0_gpu.yaml index 73eab2961..932ec107b 100644 --- a/configs/squeezenet/squeezenet_1.0_gpu.yaml +++ b/configs/squeezenet/squeezenet_1.0_gpu.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00007 loss_scale: 1024 diff --git a/configs/squeezenet/squeezenet_1.1_ascend.yaml b/configs/squeezenet/squeezenet_1.1_ascend.yaml index d5a6ee90d..790dded67 100644 --- a/configs/squeezenet/squeezenet_1.1_ascend.yaml +++ b/configs/squeezenet/squeezenet_1.1_ascend.yaml @@ -45,7 +45,6 @@ decay_epochs: 
200 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.0002 loss_scale: 1024 diff --git a/configs/squeezenet/squeezenet_1.1_gpu.yaml b/configs/squeezenet/squeezenet_1.1_gpu.yaml index 806783fd8..ee9ffa1a3 100644 --- a/configs/squeezenet/squeezenet_1.1_gpu.yaml +++ b/configs/squeezenet/squeezenet_1.1_gpu.yaml @@ -45,7 +45,6 @@ decay_epochs: 200 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00007 loss_scale: 1024 diff --git a/configs/swintransformer/swin_tiny_ascend.yaml b/configs/swintransformer/swin_tiny_ascend.yaml index 86ad0d396..1717a0dac 100644 --- a/configs/swintransformer/swin_tiny_ascend.yaml +++ b/configs/swintransformer/swin_tiny_ascend.yaml @@ -55,5 +55,4 @@ lr_epoch_stair: False # optimizer opt: "adamw" weight_decay: 0.025 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/swintransformerv2/swinv2_tiny_window8_ascend.yaml b/configs/swintransformerv2/swinv2_tiny_window8_ascend.yaml index bca9c0c00..b381f6679 100644 --- a/configs/swintransformerv2/swinv2_tiny_window8_ascend.yaml +++ b/configs/swintransformerv2/swinv2_tiny_window8_ascend.yaml @@ -49,7 +49,6 @@ warmup_epochs: 20 # optimizer opt: 'adamw' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.05 loss_scale: 1024 diff --git a/configs/vgg/vgg11_ascend.yaml b/configs/vgg/vgg11_ascend.yaml index 26c2744a1..effa5a6d2 100644 --- a/configs/vgg/vgg11_ascend.yaml +++ b/configs/vgg/vgg11_ascend.yaml @@ -44,7 +44,6 @@ warmup_epochs: 2 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/vgg/vgg13_ascend.yaml b/configs/vgg/vgg13_ascend.yaml index 2f04aed11..419e49b57 100644 --- a/configs/vgg/vgg13_ascend.yaml +++ b/configs/vgg/vgg13_ascend.yaml @@ -44,7 +44,6 @@ warmup_epochs: 2 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/vgg/vgg16_ascend.yaml 
b/configs/vgg/vgg16_ascend.yaml index 07f12f31d..5ddfd2826 100644 --- a/configs/vgg/vgg16_ascend.yaml +++ b/configs/vgg/vgg16_ascend.yaml @@ -44,7 +44,6 @@ warmup_epochs: 2 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/vgg/vgg19_ascend.yaml b/configs/vgg/vgg19_ascend.yaml index 0a6aa2a97..c01d97e40 100644 --- a/configs/vgg/vgg19_ascend.yaml +++ b/configs/vgg/vgg19_ascend.yaml @@ -44,7 +44,6 @@ warmup_epochs: 2 # optimizer opt: 'momentum' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00004 loss_scale: 1024 diff --git a/configs/vit/vit_b32_224_ascend.yaml b/configs/vit/vit_b32_224_ascend.yaml index 06d03914b..e7b17e53f 100644 --- a/configs/vit/vit_b32_224_ascend.yaml +++ b/configs/vit/vit_b32_224_ascend.yaml @@ -57,5 +57,4 @@ lr_epoch_stair: False # optimizer opt: "adamw" weight_decay: 0.025 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/vit/vit_l16_224_ascend.yaml b/configs/vit/vit_l16_224_ascend.yaml index d336788a4..fd1c66ccc 100644 --- a/configs/vit/vit_l16_224_ascend.yaml +++ b/configs/vit/vit_l16_224_ascend.yaml @@ -57,5 +57,4 @@ lr_epoch_stair: False # optimizer opt: "adamw" weight_decay: 0.05 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/vit/vit_l32_224_ascend.yaml b/configs/vit/vit_l32_224_ascend.yaml index 82084c4c3..511e7f4e7 100644 --- a/configs/vit/vit_l32_224_ascend.yaml +++ b/configs/vit/vit_l32_224_ascend.yaml @@ -57,5 +57,4 @@ lr_epoch_stair: False # optimizer opt: "adamw" weight_decay: 0.025 -filter_bias_and_bn: True use_nesterov: False diff --git a/configs/volo/volo_d1_ascend.yaml b/configs/volo/volo_d1_ascend.yaml index 247817aa6..d7fffd19b 100644 --- a/configs/volo/volo_d1_ascend.yaml +++ b/configs/volo/volo_d1_ascend.yaml @@ -60,7 +60,6 @@ decay_rate: 0.1 opt: 'adamw' weight_decay: 0.05 momentum: 0.9 -filter_bias_and_bn: True loss_scale_type: 'dynamic' loss_scale: 1024 use_nesterov: False diff --git 
a/configs/volo/volo_d2_ascend.yaml b/configs/volo/volo_d2_ascend.yaml index a62083ffe..5a92ef8bd 100644 --- a/configs/volo/volo_d2_ascend.yaml +++ b/configs/volo/volo_d2_ascend.yaml @@ -60,7 +60,6 @@ decay_rate: 0.1 opt: 'adamw' weight_decay: 0.05 momentum: 0.9 -filter_bias_and_bn: True loss_scale_type: 'dynamic' loss_scale: 2048 use_nesterov: False diff --git a/configs/volo/volo_d3_ascend.yaml b/configs/volo/volo_d3_ascend.yaml index 60e67e68d..ce15f75b1 100644 --- a/configs/volo/volo_d3_ascend.yaml +++ b/configs/volo/volo_d3_ascend.yaml @@ -61,7 +61,6 @@ decay_rate: 0.1 opt: 'adamw' weight_decay: 0.05 momentum: 0.9 -filter_bias_and_bn: True loss_scale_type: 'dynamic' loss_scale: 1024 use_nesterov: False diff --git a/configs/volo/volo_d4_ascend.yaml b/configs/volo/volo_d4_ascend.yaml index 72e70023b..a2c300da3 100644 --- a/configs/volo/volo_d4_ascend.yaml +++ b/configs/volo/volo_d4_ascend.yaml @@ -60,7 +60,6 @@ decay_rate: 0.1 opt: 'adamw' weight_decay: 0.05 momentum: 0.9 -filter_bias_and_bn: True loss_scale_type: 'dynamic' loss_scale: 1024 use_nesterov: False diff --git a/configs/xception/xception_ascend.yaml b/configs/xception/xception_ascend.yaml index 03db59d47..907d5809e 100644 --- a/configs/xception/xception_ascend.yaml +++ b/configs/xception/xception_ascend.yaml @@ -46,7 +46,6 @@ warmup_epochs: 5 # optimizer opt: 'sgd' -filter_bias_and_bn: True momentum: 0.9 weight_decay: 0.00001 loss_scale: 1024 diff --git a/configs/xcit/xcit_tiny_12_p16_ascend.yaml b/configs/xcit/xcit_tiny_12_p16_ascend.yaml index 4307ef3ea..898f86573 100644 --- a/configs/xcit/xcit_tiny_12_p16_ascend.yaml +++ b/configs/xcit/xcit_tiny_12_p16_ascend.yaml @@ -52,7 +52,6 @@ decay_rate: 0.1 # optimizer opt: 'adamw' -filter_bias_and_bn: True weight_decay: 0.05 loss_scale: 1024 use_nesterov: False diff --git a/docs/en/tutorials/configuration.md b/docs/en/tutorials/configuration.md index d91325a41..661eb059b 100644 --- a/docs/en/tutorials/configuration.md +++ b/docs/en/tutorials/configuration.md 
@@ -354,7 +354,7 @@ Let's use squeezenet_1.0 model as an example to explain how to configure the cor - opt: name of optimizer. - - filter_bias_and_bn: filter Bias and BatchNorm. + - weight_decay_filter: weight decay filter (filter parameters from weight decay). - momentum: Hyperparameter of type float, means momentum for the moving average. @@ -368,7 +368,7 @@ Let's use squeezenet_1.0 model as an example to explain how to configure the cor ```yaml opt: 'momentum' - filter_bias_and_bn: True + weight_decay_filter: 'norm_and_bias' momentum: 0.9 weight_decay: 0.00007 loss_scale: 1024 @@ -379,7 +379,7 @@ Let's use squeezenet_1.0 model as an example to explain how to configure the cor 3. Parse parameter setting ```shell - python train.py ... --opt momentum --filter_bias_and_bn True --weight_decay 0.00007 \ + python train.py ... --opt momentum --weight_decay_filter 'norm_and_bias' --weight_decay 0.00007 \ --loss_scale 1024 --use_nesterov False ... ``` @@ -395,7 +395,7 @@ Let's use squeezenet_1.0 model as an example to explain how to configure the cor weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, loss_scale=args.loss_scale, checkpoint_path=opt_ckpt_path, eps=args.eps @@ -407,7 +407,7 @@ Let's use squeezenet_1.0 model as an example to explain how to configure the cor weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, checkpoint_path=opt_ckpt_path, eps=args.eps ) diff --git a/docs/zh/tutorials/configuration.md b/docs/zh/tutorials/configuration.md index c8f2ea28a..e24242f44 100644 --- a/docs/zh/tutorials/configuration.md +++ b/docs/zh/tutorials/configuration.md @@ -354,7 +354,7 @@ - opt:优化器名称。 - - filter_bias_and_bn:参数中是否包含bias,gamma或者beta。 + - weight_decay_filter:权重衰减过滤器 (过滤一些参数, 使其在更新时不做权重衰减)。 - momentum:移动平均的动量。 @@ 
-368,7 +368,7 @@ ```yaml opt: 'momentum' - filter_bias_and_bn: True + weight_decay_filter: 'norm_and_bias' momentum: 0.9 weight_decay: 0.00007 loss_scale: 1024 @@ -379,7 +379,7 @@ 3. parse参数设置 ```shell - python train.py ... --opt momentum --filter_bias_and_bn True --weight_decay 0.00007 \ + python train.py ... --opt momentum --weight_decay_filter 'norm_and_bias' --weight_decay 0.00007 \ --loss_scale 1024 --use_nesterov False ... ``` @@ -395,7 +395,7 @@ weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, loss_scale=args.loss_scale, checkpoint_path=opt_ckpt_path, eps=args.eps @@ -407,7 +407,7 @@ weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, checkpoint_path=opt_ckpt_path, eps=args.eps ) diff --git a/examples/finetune/finetune.py b/examples/finetune/finetune.py index d3af1d87a..966651108 100644 --- a/examples/finetune/finetune.py +++ b/examples/finetune/finetune.py @@ -283,7 +283,7 @@ def finetune_train(args): weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, loss_scale=optimizer_loss_scale, checkpoint_path=opt_ckpt_path, eps=args.eps, diff --git a/examples/seg/deeplabv3/config/deeplabv3_s16_dilated_resnet101.yaml b/examples/seg/deeplabv3/config/deeplabv3_s16_dilated_resnet101.yaml index 8ddd0b13b..186175c48 100644 --- a/examples/seg/deeplabv3/config/deeplabv3_s16_dilated_resnet101.yaml +++ b/examples/seg/deeplabv3/config/deeplabv3_s16_dilated_resnet101.yaml @@ -51,7 +51,7 @@ drop_overflow_update: False loss_scale: 3072.0 momentum: 0.9 weight_decay: 0.0001 -filter_bias_and_bn: False +weight_decay_filter: 'auto' gradient_accumulation_steps: 1 # callbacks diff --git 
a/examples/seg/deeplabv3/config/deeplabv3_s8_dilated_resnet101.yaml b/examples/seg/deeplabv3/config/deeplabv3_s8_dilated_resnet101.yaml index 626774f79..be44da9cf 100644 --- a/examples/seg/deeplabv3/config/deeplabv3_s8_dilated_resnet101.yaml +++ b/examples/seg/deeplabv3/config/deeplabv3_s8_dilated_resnet101.yaml @@ -51,7 +51,7 @@ drop_overflow_update: False loss_scale: 2048.0 momentum: 0.9 weight_decay: 0.0001 -filter_bias_and_bn: False +weight_decay_filter: 'auto' gradient_accumulation_steps: 1 # callbacks diff --git a/examples/seg/deeplabv3/config/deeplabv3plus_s16_dilated_resnet101.yaml b/examples/seg/deeplabv3/config/deeplabv3plus_s16_dilated_resnet101.yaml index 9fec9af09..3dfcf277c 100644 --- a/examples/seg/deeplabv3/config/deeplabv3plus_s16_dilated_resnet101.yaml +++ b/examples/seg/deeplabv3/config/deeplabv3plus_s16_dilated_resnet101.yaml @@ -51,7 +51,7 @@ drop_overflow_update: False loss_scale: 3072.0 momentum: 0.9 weight_decay: 0.0001 -filter_bias_and_bn: False +weight_decay_filter: 'auto' gradient_accumulation_steps: 1 # callbacks diff --git a/examples/seg/deeplabv3/config/deeplabv3plus_s8_dilated_resnet101.yaml b/examples/seg/deeplabv3/config/deeplabv3plus_s8_dilated_resnet101.yaml index 7e97d7910..73f0e8881 100644 --- a/examples/seg/deeplabv3/config/deeplabv3plus_s8_dilated_resnet101.yaml +++ b/examples/seg/deeplabv3/config/deeplabv3plus_s8_dilated_resnet101.yaml @@ -51,7 +51,7 @@ drop_overflow_update: False loss_scale: 2048.0 momentum: 0.9 weight_decay: 0.0001 -filter_bias_and_bn: False +weight_decay_filter: 'auto' gradient_accumulation_steps: 1 # callbacks diff --git a/examples/seg/deeplabv3/train.py b/examples/seg/deeplabv3/train.py index 9b5ff1179..d0c021c01 100644 --- a/examples/seg/deeplabv3/train.py +++ b/examples/seg/deeplabv3/train.py @@ -118,7 +118,7 @@ def train(args): lr=lr_scheduler, weight_decay=args.weight_decay, momentum=args.momentum, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, 
loss_scale=optimizer_loss_scale, ) diff --git a/mindcv/optim/optim_factory.py b/mindcv/optim/optim_factory.py index 7fe6bf282..9d5e54ccc 100644 --- a/mindcv/optim/optim_factory.py +++ b/mindcv/optim/optim_factory.py @@ -1,4 +1,5 @@ """ optim factory """ +import logging import os from typing import Optional @@ -11,11 +12,18 @@ __all__ = ["create_optimizer"] +_logger = logging.getLogger(__name__) + + +def init_group_params(params, weight_decay, weight_decay_filter): + if weight_decay_filter == "disable": + return [ + {"params": params, "weight_decay": weight_decay}, + {"order_params": params}, + ] -def init_group_params(params, weight_decay): decay_params = [] no_decay_params = [] - for param in params: if "beta" not in param.name and "gamma" not in param.name and "bias" not in param.name: decay_params.append(param) @@ -23,7 +31,7 @@ def init_group_params(params, weight_decay): no_decay_params.append(param) return [ {"params": decay_params, "weight_decay": weight_decay}, - {"params": no_decay_params}, + {"params": no_decay_params, "weight_decay": 0.0}, {"order_params": params}, ] @@ -35,7 +43,7 @@ def create_optimizer( weight_decay: float = 0, momentum: float = 0.9, nesterov: bool = False, - filter_bias_and_bn: bool = True, + weight_decay_filter: str = "disable", loss_scale: float = 1.0, schedule_decay: float = 4e-3, checkpoint_path: str = "", @@ -59,8 +67,11 @@ def create_optimizer( of current step. Default: 0. momentum: momentum if the optimizer supports. Default: 0.9. nesterov: Whether to use Nesterov Accelerated Gradient (NAG) algorithm to update the gradients. Default: False. - filter_bias_and_bn: whether to filter batch norm parameters and bias from weight decay. - If True, weight decay will not apply on BN parameters and bias in Conv or Dense layers. Default: True. + weight_decay_filter: filters to filter parameters from weight_decay. + - "disable": No parameters to filter. + - "auto": We do not apply weight decay filtering to any parameters. 
However, MindSpore currently + automatically filters the parameters of Norm layer from weight decay. + - "norm_and_bias": Filter the parameters of Norm layer and Bias from weight decay. loss_scale: A floating point value for the loss scale, which must be larger than 0.0. Default: 1.0. Returns: @@ -68,9 +79,19 @@ def create_optimizer( """ opt = opt.lower() - - if weight_decay and filter_bias_and_bn: - params = init_group_params(params, weight_decay) + if weight_decay_filter == "auto": + _logger.warning( + "You are using AUTO weight decay filter, which means the weight decay filter isn't explicitly passed in " + "when creating a mindspore.nn.Optimizer instance. " + "NOTE: mindspore.nn.Optimizer will filter Norm params from weight decay. " + ) + elif weight_decay_filter in ("disable", "norm_and_bias"): + params = init_group_params(params, weight_decay, weight_decay_filter) + weight_decay = 0.0 + else: + raise ValueError( + f"weight decay filter only supports ['disable', 'auto', 'norm_and_bias'], but got {weight_decay_filter}." 
+ ) opt_args = dict(**kwargs) # if lr is not None: diff --git a/tests/modules/parallel/test_parallel_optim.py b/tests/modules/parallel/test_parallel_optim.py index 651f36c4d..9a2bf6616 100644 --- a/tests/modules/parallel/test_parallel_optim.py +++ b/tests/modules/parallel/test_parallel_optim.py @@ -44,8 +44,8 @@ def construct(self, x): @pytest.mark.parametrize("opt", ["sgd", "momentum"]) @pytest.mark.parametrize("nesterov", [True, False]) -@pytest.mark.parametrize("filter_bias_and_bn", [True, False]) -def test_sgd_optimizer(opt, nesterov, filter_bias_and_bn): +@pytest.mark.parametrize("weight_decay_filter", ["auto", "disable", "norm_and_bias"]) +def test_sgd_optimizer(opt, nesterov, weight_decay_filter): init("nccl") device_num = get_group_size() rank_id = get_rank() # noqa: F841 @@ -64,7 +64,7 @@ def test_sgd_optimizer(opt, nesterov, filter_bias_and_bn): weight_decay=1e-5, momentum=0.9, nesterov=nesterov, - filter_bias_and_bn=filter_bias_and_bn, + weight_decay_filter=weight_decay_filter, ) bs = 8 @@ -227,7 +227,7 @@ def test_param_lr_001_filter_bias_and_bn_optimizer(): weight_decay=1e-5, momentum=0.9, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -273,7 +273,7 @@ def test_param_lr_0001_filter_bias_and_bn_optimizer(): weight_decay=1e-5, momentum=0.9, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -315,7 +315,7 @@ def test_wrong_momentum_optimizer(momentum): momentum=momentum, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -357,7 +357,7 @@ def test_wrong_loss_scale_optimizer(loss_scale): momentum=0.9, loss_scale=loss_scale, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -400,7 +400,7 @@ def test_wrong_weight_decay_optimizer(weight_decay): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -442,7 +442,7 @@ def 
test_wrong_lr_optimizer(lr): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -488,7 +488,7 @@ def test_param_lr_01_filter_bias_and_bn_optimizer(): weight_decay=1e-5, momentum=0.9, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -530,7 +530,7 @@ def test_wrong_opt_optimizer(opt): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -579,7 +579,7 @@ def test_wrong_params_more_optimizer(): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -627,7 +627,7 @@ def test_wrong_params_input_optimizer(): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -681,7 +681,7 @@ def test_mode_mult_single_optimizer(mode): weight_decay=1e-5, momentum=0.9, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 diff --git a/tests/modules/test_optim.py b/tests/modules/test_optim.py index 007cbb87f..56bc61244 100644 --- a/tests/modules/test_optim.py +++ b/tests/modules/test_optim.py @@ -43,8 +43,8 @@ def construct(self, x): @pytest.mark.parametrize("opt", ["sgd", "momentum"]) @pytest.mark.parametrize("nesterov", [True, False]) -@pytest.mark.parametrize("filter_bias_and_bn", [True, False]) -def test_sgd_optimizer(opt, nesterov, filter_bias_and_bn): +@pytest.mark.parametrize("weight_decay_filter", ["disable", "auto", "norm_and_bias"]) +def test_sgd_optimizer(opt, nesterov, weight_decay_filter): network = SimpleCNN(in_channels=1, num_classes=10) net_loss = nn.SoftmaxCrossEntropyWithLogits(sparse=True, reduction="mean") @@ -55,7 +55,7 @@ def test_sgd_optimizer(opt, nesterov, filter_bias_and_bn): weight_decay=1e-5, momentum=0.9, nesterov=nesterov, - filter_bias_and_bn=filter_bias_and_bn, + weight_decay_filter=weight_decay_filter, ) bs = 8 @@ -171,7 +171,7 @@ def 
test_param_lr_001_filter_bias_and_bn_optimizer(): ] net_loss = nn.SoftmaxCrossEntropyWithLogits(sparse=True, reduction="mean") net_opt = create_optimizer( - group_params, "adamW", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, filter_bias_and_bn=False + group_params, "adamW", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, weight_decay_filter="auto" ) bs = 8 @@ -203,7 +203,7 @@ def test_param_lr_0001_filter_bias_and_bn_optimizer(): ] net_loss = nn.SoftmaxCrossEntropyWithLogits(sparse=True, reduction="mean") net_opt = create_optimizer( - group_params, "adamW", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, filter_bias_and_bn=False + group_params, "adamW", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, weight_decay_filter="auto" ) bs = 8 @@ -237,7 +237,7 @@ def test_wrong_momentum_optimizer(momentum): momentum=momentum, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -271,7 +271,7 @@ def test_wrong_loss_scale_optimizer(loss_scale): momentum=0.9, loss_scale=loss_scale, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -306,7 +306,7 @@ def test_wrong_weight_decay_optimizer(weight_decay): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -340,7 +340,7 @@ def test_wrong_lr_optimizer(lr): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -372,7 +372,7 @@ def test_param_lr_01_filter_bias_and_bn_optimizer(): ] net_loss = nn.SoftmaxCrossEntropyWithLogits(sparse=True, reduction="mean") net_opt = create_optimizer( - group_params, "momentum", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, filter_bias_and_bn=False + group_params, "momentum", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, weight_decay_filter="auto" ) bs = 8 @@ -406,7 +406,7 @@ def test_wrong_opt_optimizer(opt): 
momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=True, + weight_decay_filter="disable", ) bs = 8 @@ -447,7 +447,7 @@ def test_wrong_params_more_optimizer(): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -487,7 +487,7 @@ def test_wrong_params_input_optimizer(): momentum=0.9, loss_scale=1.0, nesterov=False, - filter_bias_and_bn=False, + weight_decay_filter="auto", ) bs = 8 @@ -527,7 +527,7 @@ def test_mode_mult_single_optimizer(mode): ] net_loss = nn.SoftmaxCrossEntropyWithLogits(sparse=True, reduction="mean") net_opt = create_optimizer( - group_params, "momentum", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, filter_bias_and_bn=False + group_params, "momentum", lr=0.01, weight_decay=1e-5, momentum=0.9, nesterov=False, weight_decay_filter="auto" ) bs = 8 diff --git a/train.py b/train.py index 16d943de1..0406d90a1 100644 --- a/train.py +++ b/train.py @@ -216,7 +216,7 @@ def main(): weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, loss_scale=optimizer_loss_scale, checkpoint_path=opt_ckpt_path, eps=args.eps, diff --git a/train_with_func.py b/train_with_func.py index 4b64e9345..f9040c3e0 100644 --- a/train_with_func.py +++ b/train_with_func.py @@ -227,7 +227,7 @@ def main(): weight_decay=args.weight_decay, momentum=args.momentum, nesterov=args.use_nesterov, - filter_bias_and_bn=args.filter_bias_and_bn, + weight_decay_filter=args.weight_decay_filter, loss_scale=1.0, eps=args.eps, )