====================weight_decay_scale====================
backbone/stage0/block0/conv1/weight: 1.0
backbone/stage0/block0/conv2/weight: 1.0
backbone/stage0/block0/conv3/weight: 1.0
backbone/stage0/block0/downsample/conv/weight: 1.0
backbone/stage0/block0/downsample/norm/bias: 0
backbone/stage0/block0/downsample/norm/moving_mean: 0
backbone/stage0/block0/downsample/norm/moving_variance: 0
backbone/stage0/block0/downsample/norm/scale: 0
backbone/stage0/block0/norm1/bias: 0
backbone/stage0/block0/norm1/moving_mean: 0
backbone/stage0/block0/norm1/moving_variance: 0
backbone/stage0/block0/norm1/scale: 0
backbone/stage0/block0/norm2/bias: 0
backbone/stage0/block0/norm2/moving_mean: 0
backbone/stage0/block0/norm2/moving_variance: 0
backbone/stage0/block0/norm2/scale: 0
backbone/stage0/block0/norm3/bias: 0
backbone/stage0/block0/norm3/moving_mean: 0
backbone/stage0/block0/norm3/moving_variance: 0
backbone/stage0/block0/norm3/scale: 0
backbone/stage0/block1/conv1/weight: 1.0
backbone/stage0/block1/conv2/weight: 1.0
backbone/stage0/block1/conv3/weight: 1.0
backbone/stage0/block1/norm1/bias: 0
backbone/stage0/block1/norm1/moving_mean: 0
backbone/stage0/block1/norm1/moving_variance: 0
backbone/stage0/block1/norm1/scale: 0
backbone/stage0/block1/norm2/bias: 0
backbone/stage0/block1/norm2/moving_mean: 0
backbone/stage0/block1/norm2/moving_variance: 0
backbone/stage0/block1/norm2/scale: 0
backbone/stage0/block1/norm3/bias: 0
backbone/stage0/block1/norm3/moving_mean: 0
backbone/stage0/block1/norm3/moving_variance: 0
backbone/stage0/block1/norm3/scale: 0
backbone/stage0/block2/conv1/weight: 1.0
backbone/stage0/block2/conv2/weight: 1.0
backbone/stage0/block2/conv3/weight: 1.0
backbone/stage0/block2/norm1/bias: 0
backbone/stage0/block2/norm1/moving_mean: 0
backbone/stage0/block2/norm1/moving_variance: 0
backbone/stage0/block2/norm1/scale: 0
backbone/stage0/block2/norm2/bias: 0
backbone/stage0/block2/norm2/moving_mean: 0
backbone/stage0/block2/norm2/moving_variance: 0
backbone/stage0/block2/norm2/scale: 0
backbone/stage0/block2/norm3/bias: 0
backbone/stage0/block2/norm3/moving_mean: 0
backbone/stage0/block2/norm3/moving_variance: 0
backbone/stage0/block2/norm3/scale: 0
backbone/stage1/block0/conv1/weight: 1.0
backbone/stage1/block0/conv2/weight: 1.0
backbone/stage1/block0/conv3/weight: 1.0
backbone/stage1/block0/downsample/conv/weight: 1.0
backbone/stage1/block0/downsample/norm/bias: 0
backbone/stage1/block0/downsample/norm/moving_mean: 0
backbone/stage1/block0/downsample/norm/moving_variance: 0
backbone/stage1/block0/downsample/norm/scale: 0
backbone/stage1/block0/norm1/bias: 0
backbone/stage1/block0/norm1/moving_mean: 0
backbone/stage1/block0/norm1/moving_variance: 0
backbone/stage1/block0/norm1/scale: 0
backbone/stage1/block0/norm2/bias: 0
backbone/stage1/block0/norm2/moving_mean: 0
backbone/stage1/block0/norm2/moving_variance: 0
backbone/stage1/block0/norm2/scale: 0
backbone/stage1/block0/norm3/bias: 0
backbone/stage1/block0/norm3/moving_mean: 0
backbone/stage1/block0/norm3/moving_variance: 0
backbone/stage1/block0/norm3/scale: 0
backbone/stage1/block1/conv1/weight: 1.0
backbone/stage1/block1/conv2/weight: 1.0
backbone/stage1/block1/conv3/weight: 1.0
backbone/stage1/block1/norm1/bias: 0
backbone/stage1/block1/norm1/moving_mean: 0
backbone/stage1/block1/norm1/moving_variance: 0
backbone/stage1/block1/norm1/scale: 0
backbone/stage1/block1/norm2/bias: 0
backbone/stage1/block1/norm2/moving_mean: 0
backbone/stage1/block1/norm2/moving_variance: 0
backbone/stage1/block1/norm2/scale: 0
backbone/stage1/block1/norm3/bias: 0
backbone/stage1/block1/norm3/moving_mean: 0
backbone/stage1/block1/norm3/moving_variance: 0
backbone/stage1/block1/norm3/scale: 0
backbone/stage1/block2/conv1/weight: 1.0
backbone/stage1/block2/conv2/weight: 1.0
backbone/stage1/block2/conv3/weight: 1.0
backbone/stage1/block2/norm1/bias: 0
backbone/stage1/block2/norm1/moving_mean: 0
backbone/stage1/block2/norm1/moving_variance: 0
backbone/stage1/block2/norm1/scale: 0
backbone/stage1/block2/norm2/bias: 0
backbone/stage1/block2/norm2/moving_mean: 0
backbone/stage1/block2/norm2/moving_variance: 0
backbone/stage1/block2/norm2/scale: 0
backbone/stage1/block2/norm3/bias: 0
backbone/stage1/block2/norm3/moving_mean: 0
backbone/stage1/block2/norm3/moving_variance: 0
backbone/stage1/block2/norm3/scale: 0
backbone/stage1/block3/conv1/weight: 1.0
backbone/stage1/block3/conv2/weight: 1.0
backbone/stage1/block3/conv3/weight: 1.0
backbone/stage1/block3/norm1/bias: 0
backbone/stage1/block3/norm1/moving_mean: 0
backbone/stage1/block3/norm1/moving_variance: 0
backbone/stage1/block3/norm1/scale: 0
backbone/stage1/block3/norm2/bias: 0
backbone/stage1/block3/norm2/moving_mean: 0
backbone/stage1/block3/norm2/moving_variance: 0
backbone/stage1/block3/norm2/scale: 0
backbone/stage1/block3/norm3/bias: 0
backbone/stage1/block3/norm3/moving_mean: 0
backbone/stage1/block3/norm3/moving_variance: 0
backbone/stage1/block3/norm3/scale: 0
backbone/stage2/block0/conv1/weight: 1.0
backbone/stage2/block0/conv2/weight: 1.0
backbone/stage2/block0/conv3/weight: 1.0
backbone/stage2/block0/downsample/conv/weight: 1.0
backbone/stage2/block0/downsample/norm/bias: 0
backbone/stage2/block0/downsample/norm/moving_mean: 0
backbone/stage2/block0/downsample/norm/moving_variance: 0
backbone/stage2/block0/downsample/norm/scale: 0
backbone/stage2/block0/norm1/bias: 0
backbone/stage2/block0/norm1/moving_mean: 0
backbone/stage2/block0/norm1/moving_variance: 0
backbone/stage2/block0/norm1/scale: 0
backbone/stage2/block0/norm2/bias: 0
backbone/stage2/block0/norm2/moving_mean: 0
backbone/stage2/block0/norm2/moving_variance: 0
backbone/stage2/block0/norm2/scale: 0
backbone/stage2/block0/norm3/bias: 0
backbone/stage2/block0/norm3/moving_mean: 0
backbone/stage2/block0/norm3/moving_variance: 0
backbone/stage2/block0/norm3/scale: 0
backbone/stage2/block1/conv1/weight: 1.0
backbone/stage2/block1/conv2/weight: 1.0
backbone/stage2/block1/conv3/weight: 1.0
backbone/stage2/block1/norm1/bias: 0
backbone/stage2/block1/norm1/moving_mean: 0
backbone/stage2/block1/norm1/moving_variance: 0
backbone/stage2/block1/norm1/scale: 0
backbone/stage2/block1/norm2/bias: 0
backbone/stage2/block1/norm2/moving_mean: 0
backbone/stage2/block1/norm2/moving_variance: 0
backbone/stage2/block1/norm2/scale: 0
backbone/stage2/block1/norm3/bias: 0
backbone/stage2/block1/norm3/moving_mean: 0
backbone/stage2/block1/norm3/moving_variance: 0
backbone/stage2/block1/norm3/scale: 0
backbone/stage2/block2/conv1/weight: 1.0
backbone/stage2/block2/conv2/weight: 1.0
backbone/stage2/block2/conv3/weight: 1.0
backbone/stage2/block2/norm1/bias: 0
backbone/stage2/block2/norm1/moving_mean: 0
backbone/stage2/block2/norm1/moving_variance: 0
backbone/stage2/block2/norm1/scale: 0
backbone/stage2/block2/norm2/bias: 0
backbone/stage2/block2/norm2/moving_mean: 0
backbone/stage2/block2/norm2/moving_variance: 0
backbone/stage2/block2/norm2/scale: 0
backbone/stage2/block2/norm3/bias: 0
backbone/stage2/block2/norm3/moving_mean: 0
backbone/stage2/block2/norm3/moving_variance: 0
backbone/stage2/block2/norm3/scale: 0
backbone/stage2/block3/conv1/weight: 1.0
backbone/stage2/block3/conv2/weight: 1.0
backbone/stage2/block3/conv3/weight: 1.0
backbone/stage2/block3/norm1/bias: 0
backbone/stage2/block3/norm1/moving_mean: 0
backbone/stage2/block3/norm1/moving_variance: 0
backbone/stage2/block3/norm1/scale: 0
backbone/stage2/block3/norm2/bias: 0
backbone/stage2/block3/norm2/moving_mean: 0
backbone/stage2/block3/norm2/moving_variance: 0
backbone/stage2/block3/norm2/scale: 0
backbone/stage2/block3/norm3/bias: 0
backbone/stage2/block3/norm3/moving_mean: 0
backbone/stage2/block3/norm3/moving_variance: 0
backbone/stage2/block3/norm3/scale: 0
backbone/stage2/block4/conv1/weight: 1.0
backbone/stage2/block4/conv2/weight: 1.0
backbone/stage2/block4/conv3/weight: 1.0
backbone/stage2/block4/norm1/bias: 0
backbone/stage2/block4/norm1/moving_mean: 0
backbone/stage2/block4/norm1/moving_variance: 0
backbone/stage2/block4/norm1/scale: 0
backbone/stage2/block4/norm2/bias: 0
backbone/stage2/block4/norm2/moving_mean: 0
backbone/stage2/block4/norm2/moving_variance: 0
backbone/stage2/block4/norm2/scale: 0
backbone/stage2/block4/norm3/bias: 0
backbone/stage2/block4/norm3/moving_mean: 0
backbone/stage2/block4/norm3/moving_variance: 0
backbone/stage2/block4/norm3/scale: 0
backbone/stage2/block5/conv1/weight: 1.0
backbone/stage2/block5/conv2/weight: 1.0
backbone/stage2/block5/conv3/weight: 1.0
backbone/stage2/block5/norm1/bias: 0
backbone/stage2/block5/norm1/moving_mean: 0
backbone/stage2/block5/norm1/moving_variance: 0
backbone/stage2/block5/norm1/scale: 0
backbone/stage2/block5/norm2/bias: 0
backbone/stage2/block5/norm2/moving_mean: 0
backbone/stage2/block5/norm2/moving_variance: 0
backbone/stage2/block5/norm2/scale: 0
backbone/stage2/block5/norm3/bias: 0
backbone/stage2/block5/norm3/moving_mean: 0
backbone/stage2/block5/norm3/moving_variance: 0
backbone/stage2/block5/norm3/scale: 0
backbone/stage3/block0/conv1/weight: 1.0
backbone/stage3/block0/conv2/weight: 1.0
backbone/stage3/block0/conv3/weight: 1.0
backbone/stage3/block0/downsample/conv/weight: 1.0
backbone/stage3/block0/downsample/norm/bias: 0
backbone/stage3/block0/downsample/norm/moving_mean: 0
backbone/stage3/block0/downsample/norm/moving_variance: 0
backbone/stage3/block0/downsample/norm/scale: 0
backbone/stage3/block0/norm1/bias: 0
backbone/stage3/block0/norm1/moving_mean: 0
backbone/stage3/block0/norm1/moving_variance: 0
backbone/stage3/block0/norm1/scale: 0
backbone/stage3/block0/norm2/bias: 0
backbone/stage3/block0/norm2/moving_mean: 0
backbone/stage3/block0/norm2/moving_variance: 0
backbone/stage3/block0/norm2/scale: 0
backbone/stage3/block0/norm3/bias: 0
backbone/stage3/block0/norm3/moving_mean: 0
backbone/stage3/block0/norm3/moving_variance: 0
backbone/stage3/block0/norm3/scale: 0
backbone/stage3/block1/conv1/weight: 1.0
backbone/stage3/block1/conv2/weight: 1.0
backbone/stage3/block1/conv3/weight: 1.0
backbone/stage3/block1/norm1/bias: 0
backbone/stage3/block1/norm1/moving_mean: 0
backbone/stage3/block1/norm1/moving_variance: 0
backbone/stage3/block1/norm1/scale: 0
backbone/stage3/block1/norm2/bias: 0
backbone/stage3/block1/norm2/moving_mean: 0
backbone/stage3/block1/norm2/moving_variance: 0
backbone/stage3/block1/norm2/scale: 0
backbone/stage3/block1/norm3/bias: 0
backbone/stage3/block1/norm3/moving_mean: 0
backbone/stage3/block1/norm3/moving_variance: 0
backbone/stage3/block1/norm3/scale: 0
backbone/stage3/block2/conv1/weight: 1.0
backbone/stage3/block2/conv2/weight: 1.0
backbone/stage3/block2/conv3/weight: 1.0
backbone/stage3/block2/norm1/bias: 0
backbone/stage3/block2/norm1/moving_mean: 0
backbone/stage3/block2/norm1/moving_variance: 0
backbone/stage3/block2/norm1/scale: 0
backbone/stage3/block2/norm2/bias: 0
backbone/stage3/block2/norm2/moving_mean: 0
backbone/stage3/block2/norm2/moving_variance: 0
backbone/stage3/block2/norm2/scale: 0
backbone/stage3/block2/norm3/bias: 0
backbone/stage3/block2/norm3/moving_mean: 0
backbone/stage3/block2/norm3/moving_variance: 0
backbone/stage3/block2/norm3/scale: 0
backbone/stem/conv1/weight: 1.0
backbone/stem/norm1/bias: 0
backbone/stem/norm1/moving_mean: 0
backbone/stem/norm1/moving_variance: 0
backbone/stem/norm1/scale: 0
classifier/bias: 1.0
classifier/weight: 1.0
