sonebu
moving over from github
5096607
Top:
epoch
state_dict
arch
optimizer_state_dict
optimizer_type
compression_sched
extras
-------------------------------------
arch: ai85simplenet
-------------------------------------
extras: {'current_top1': 55.76, 'best_top1': 55.76, 'best_epoch': 291}
-------------------------------------
state_dict:
conv1
output_shift: [-0.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [8.]
bias_bits: [8.]
bias
total # of elements, shape: 16 , [16]
# of unique elements: 16
min, max, mean: -0.19168334 , 0.36834052 , 0.07247388
weight
total # of elements, shape: 432 , [16, 3, 3, 3]
# of unique elements: 432
min, max, mean: -0.802268 , 0.7458835 , -0.0010856437
conv2
output_shift: [-1.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [4.]
bias_bits: [8.]
bias
total # of elements, shape: 20 , [20]
# of unique elements: 20
min, max, mean: -0.43049204 , 0.47276396 , 0.15015088
weight
total # of elements, shape: 2880 , [20, 16, 3, 3]
# of unique elements: 2880
min, max, mean: -0.6489339 , 0.44373256 , -0.0075482004
conv3
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 20 , [20]
# of unique elements: 20
min, max, mean: -0.16107927 , 0.64212 , 0.16932115
weight
total # of elements, shape: 3600 , [20, 20, 3, 3]
# of unique elements: 3600
min, max, mean: -0.6594693 , 0.4297285 , -0.0048244996
conv4
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 20 , [20]
# of unique elements: 20
min, max, mean: -0.2788192 , 0.36745375 , 0.08209655
weight
total # of elements, shape: 3600 , [20, 20, 3, 3]
# of unique elements: 3600
min, max, mean: -0.3781386 , 0.35877833 , -0.004330597
conv5
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 20 , [20]
# of unique elements: 20
min, max, mean: -0.4778669 , 0.69232625 , 0.1373336
weight
total # of elements, shape: 3600 , [20, 20, 3, 3]
# of unique elements: 3600
min, max, mean: -0.48527744 , 0.3855096 , -2.4955074e-05
conv6
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 20 , [20]
# of unique elements: 20
min, max, mean: -0.1993689 , 0.68981844 , 0.19056796
weight
total # of elements, shape: 3600 , [20, 20, 3, 3]
# of unique elements: 3600
min, max, mean: -0.32661057 , 0.3896761 , -0.0005324371
conv7
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 44 , [44]
# of unique elements: 44
min, max, mean: -0.33314848 , 0.5373695 , 0.05712423
weight
total # of elements, shape: 7920 , [44, 20, 3, 3]
# of unique elements: 7917
min, max, mean: -0.29842344 , 0.26807493 , -0.0036170066
conv8
output_shift: [-3.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 48 , [48]
# of unique elements: 48
min, max, mean: -0.35770896 , 0.9294356 , 0.1538872
weight
total # of elements, shape: 19008 , [48, 44, 3, 3]
# of unique elements: 19005
min, max, mean: -0.25119358 , 0.22448556 , -0.00043370738
conv9
output_shift: [-3.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 48 , [48]
# of unique elements: 48
min, max, mean: -0.51157075 , 0.6982333 , 0.19713795
weight
total # of elements, shape: 20736 , [48, 48, 3, 3]
# of unique elements: 20728
min, max, mean: -0.19476362 , 0.19595417 , -0.0007558516
conv10
output_shift: [-3.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [2.]
bias_bits: [8.]
bias
total # of elements, shape: 96 , [96]
# of unique elements: 96
min, max, mean: -0.49737096 , 0.5452776 , -0.09346354
weight
total # of elements, shape: 41472 , [96, 48, 3, 3]
# of unique elements: 41434
min, max, mean: -0.1662616 , 0.32571185 , 0.003046196
conv11
output_shift: [-1.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [4.]
bias_bits: [8.]
bias
total # of elements, shape: 512 , [512]
# of unique elements: 512
min, max, mean: -0.7622132 , 0.6625604 , -0.025022728
weight
total # of elements, shape: 49152 , [512, 96, 1, 1]
# of unique elements: 49130
min, max, mean: -0.5251649 , 0.55524755 , -0.0027382441
conv12
output_shift: [-2.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [4.]
bias_bits: [8.]
bias
total # of elements, shape: 128 , [128]
# of unique elements: 128
min, max, mean: -0.276329 , 0.391946 , 0.09177708
weight
total # of elements, shape: 65536 , [128, 512, 1, 1]
# of unique elements: 65501
min, max, mean: -0.48823273 , 0.35944995 , -0.0032784953
conv13
output_shift: [-0.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [4.]
bias_bits: [8.]
bias
total # of elements, shape: 128 , [128]
# of unique elements: 128
min, max, mean: -1.1315831 , 1.3784926 , 0.32567012
weight
total # of elements, shape: 147456 , [128, 128, 3, 3]
# of unique elements: 147257
min, max, mean: -1.3093278 , 1.2955139 , -2.2848448e-05
conv14
output_shift: [1.]
adjust_output_shift: [1.]
quantize_activation: [1.]
shift_quantile: [0.985]
weight bits: [4.]
bias_bits: [8.]
bias
total # of elements, shape: 100 , [100]
# of unique elements: 100
min, max, mean: -0.2843461 , 0.25533894 , -0.0070921965
weight
total # of elements, shape: 12800 , [100, 128, 1, 1]
# of unique elements: 12799
min, max, mean: -3.512657 , 1.6331301 , -0.21426365