summaryrefslogtreecommitdiff
path: root/results/snapshot_no_outln_v1
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_no_outln_v1')
-rw-r--r--results/snapshot_no_outln_v1/run_s123.log51
-rw-r--r--results/snapshot_no_outln_v1/run_s42.log51
-rw-r--r--results/snapshot_no_outln_v1/run_s456.log51
-rw-r--r--results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json1824
-rw-r--r--results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json1824
-rw-r--r--results/snapshot_no_outln_v1/snapshot_noLN_s123.json4766
-rw-r--r--results/snapshot_no_outln_v1/snapshot_noLN_s42.json4766
-rw-r--r--results/snapshot_no_outln_v1/snapshot_noLN_s456.json4766
8 files changed, 18099 insertions, 0 deletions
diff --git a/results/snapshot_no_outln_v1/run_s123.log b/results/snapshot_no_outln_v1/run_s123.log
new file mode 100644
index 0000000..a946d6d
--- /dev/null
+++ b/results/snapshot_no_outln_v1/run_s123.log
@@ -0,0 +1,51 @@
+NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=123
+
+=== BP training (NO out_ln) ===
+ [BP-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016
+ [BP-noLN] Ep 1: ||h_L||=3.456e+01 ||g||=1.382e-04 acc=0.4355
+ [BP-noLN] Ep 5: ||h_L||=5.193e+01 ||g||=9.721e-05 acc=0.5049
+ [BP-noLN] Ep 10: ||h_L||=6.115e+01 ||g||=8.778e-05 acc=0.5430
+ [BP-noLN] Ep 15: ||h_L||=6.668e+01 ||g||=8.387e-05 acc=0.5586
+ [BP-noLN] Ep 20: ||h_L||=6.880e+01 ||g||=8.997e-05 acc=0.5176
+ [BP-noLN] Ep 25: ||h_L||=7.092e+01 ||g||=8.184e-05 acc=0.5850
+ [BP-noLN] Ep 30: ||h_L||=7.285e+01 ||g||=7.960e-05 acc=0.5693
+ [BP-noLN] Ep 35: ||h_L||=7.522e+01 ||g||=8.247e-05 acc=0.5869
+ [BP-noLN] Ep 40: ||h_L||=7.551e+01 ||g||=8.186e-05 acc=0.6201
+ [BP-noLN] Ep 45: ||h_L||=7.421e+01 ||g||=8.565e-05 acc=0.5918
+ [BP-noLN] Ep 50: ||h_L||=7.473e+01 ||g||=9.094e-05 acc=0.5840
+ [BP-noLN] Ep 55: ||h_L||=7.556e+01 ||g||=8.896e-05 acc=0.6143
+ [BP-noLN] Ep 60: ||h_L||=7.545e+01 ||g||=9.015e-05 acc=0.6396
+ [BP-noLN] Ep 65: ||h_L||=7.509e+01 ||g||=9.009e-05 acc=0.6455
+ [BP-noLN] Ep 70: ||h_L||=7.466e+01 ||g||=9.170e-05 acc=0.6230
+ [BP-noLN] Ep 75: ||h_L||=7.410e+01 ||g||=1.030e-04 acc=0.6455
+ [BP-noLN] Ep 80: ||h_L||=7.313e+01 ||g||=1.043e-04 acc=0.6309
+ [BP-noLN] Ep 85: ||h_L||=7.275e+01 ||g||=1.035e-04 acc=0.6396
+ [BP-noLN] Ep 90: ||h_L||=7.262e+01 ||g||=1.079e-04 acc=0.6445
+ [BP-noLN] Ep 95: ||h_L||=7.256e+01 ||g||=1.087e-04 acc=0.6377
+ [BP-noLN] Ep 100: ||h_L||=7.248e+01 ||g||=1.082e-04 acc=0.6396
+
+=== DFA training (NO out_ln) ===
+ [DFA-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016
+ [DFA-noLN] Ep 1: ||h_L||=1.231e+03 ||g||=6.461e-04 acc=0.2129 γ=0.0130
+ [DFA-noLN] Ep 5: ||h_L||=1.290e+04 ||g||=7.423e-04 acc=0.2080 γ=-0.0053
+ [DFA-noLN] Ep 10: ||h_L||=6.970e+04 ||g||=7.399e-04 acc=0.2031 γ=-0.0038
+ [DFA-noLN] Ep 15: ||h_L||=2.144e+05 ||g||=7.383e-04 acc=0.1807 γ=0.0158
+ [DFA-noLN] Ep 20: ||h_L||=5.289e+05 ||g||=7.379e-04 acc=0.2295 γ=0.0205
+ [DFA-noLN] Ep 25: ||h_L||=1.047e+06 ||g||=7.582e-04 acc=0.1729 γ=-0.0056
+ [DFA-noLN] Ep 30: ||h_L||=1.809e+06 ||g||=7.676e-04 acc=0.1934 γ=0.0171
+ [DFA-noLN] Ep 35: ||h_L||=2.741e+06 ||g||=7.757e-04 acc=0.1504 γ=0.0181
+ [DFA-noLN] Ep 40: ||h_L||=3.868e+06 ||g||=7.547e-04 acc=0.1377 γ=0.0036
+ [DFA-noLN] Ep 45: ||h_L||=5.087e+06 ||g||=7.677e-04 acc=0.2246 γ=0.0148
+ [DFA-noLN] Ep 50: ||h_L||=6.378e+06 ||g||=7.632e-04 acc=0.2002 γ=-0.0010
+ [DFA-noLN] Ep 55: ||h_L||=7.652e+06 ||g||=7.547e-04 acc=0.0908 γ=0.0198
+ [DFA-noLN] Ep 60: ||h_L||=8.786e+06 ||g||=7.196e-04 acc=0.1670 γ=0.0255
+ [DFA-noLN] Ep 65: ||h_L||=9.795e+06 ||g||=7.598e-04 acc=0.1699 γ=0.0191
+ [DFA-noLN] Ep 70: ||h_L||=1.063e+07 ||g||=7.313e-04 acc=0.2422 γ=0.0235
+ [DFA-noLN] Ep 75: ||h_L||=1.127e+07 ||g||=7.316e-04 acc=0.2490 γ=0.0445
+ [DFA-noLN] Ep 80: ||h_L||=1.173e+07 ||g||=7.425e-04 acc=0.1904 γ=0.0283
+ [DFA-noLN] Ep 85: ||h_L||=1.203e+07 ||g||=7.233e-04 acc=0.2500 γ=0.0402
+ [DFA-noLN] Ep 90: ||h_L||=1.216e+07 ||g||=7.064e-04 acc=0.3096 γ=0.0335
+ [DFA-noLN] Ep 95: ||h_L||=1.218e+07 ||g||=7.087e-04 acc=0.2920 γ=0.0295
+ [DFA-noLN] Ep 100: ||h_L||=1.218e+07 ||g||=7.086e-04 acc=0.3135 γ=0.0273
+
+Saved results/snapshot_no_outln_v1/snapshot_noLN_s123.json
diff --git a/results/snapshot_no_outln_v1/run_s42.log b/results/snapshot_no_outln_v1/run_s42.log
new file mode 100644
index 0000000..81d2970
--- /dev/null
+++ b/results/snapshot_no_outln_v1/run_s42.log
@@ -0,0 +1,51 @@
+NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=42
+
+=== BP training (NO out_ln) ===
+ [BP-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123
+ [BP-noLN] Ep 1: ||h_L||=3.310e+01 ||g||=1.421e-04 acc=0.4229
+ [BP-noLN] Ep 5: ||h_L||=5.238e+01 ||g||=9.984e-05 acc=0.5010
+ [BP-noLN] Ep 10: ||h_L||=6.111e+01 ||g||=8.972e-05 acc=0.5518
+ [BP-noLN] Ep 15: ||h_L||=6.640e+01 ||g||=8.892e-05 acc=0.5195
+ [BP-noLN] Ep 20: ||h_L||=6.977e+01 ||g||=8.730e-05 acc=0.5488
+ [BP-noLN] Ep 25: ||h_L||=7.080e+01 ||g||=8.598e-05 acc=0.5547
+ [BP-noLN] Ep 30: ||h_L||=7.441e+01 ||g||=8.621e-05 acc=0.5723
+ [BP-noLN] Ep 35: ||h_L||=7.537e+01 ||g||=7.991e-05 acc=0.6025
+ [BP-noLN] Ep 40: ||h_L||=7.552e+01 ||g||=8.747e-05 acc=0.5859
+ [BP-noLN] Ep 45: ||h_L||=7.571e+01 ||g||=8.227e-05 acc=0.5918
+ [BP-noLN] Ep 50: ||h_L||=7.514e+01 ||g||=9.716e-05 acc=0.5811
+ [BP-noLN] Ep 55: ||h_L||=7.693e+01 ||g||=9.600e-05 acc=0.6006
+ [BP-noLN] Ep 60: ||h_L||=7.581e+01 ||g||=9.903e-05 acc=0.6113
+ [BP-noLN] Ep 65: ||h_L||=7.549e+01 ||g||=1.009e-04 acc=0.6221
+ [BP-noLN] Ep 70: ||h_L||=7.530e+01 ||g||=1.088e-04 acc=0.6074
+ [BP-noLN] Ep 75: ||h_L||=7.454e+01 ||g||=1.082e-04 acc=0.6143
+ [BP-noLN] Ep 80: ||h_L||=7.426e+01 ||g||=1.162e-04 acc=0.6123
+ [BP-noLN] Ep 85: ||h_L||=7.353e+01 ||g||=1.161e-04 acc=0.6084
+ [BP-noLN] Ep 90: ||h_L||=7.339e+01 ||g||=1.168e-04 acc=0.6123
+ [BP-noLN] Ep 95: ||h_L||=7.308e+01 ||g||=1.164e-04 acc=0.6143
+ [BP-noLN] Ep 100: ||h_L||=7.297e+01 ||g||=1.158e-04 acc=0.6162
+
+=== DFA training (NO out_ln) ===
+ [DFA-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123
+ [DFA-noLN] Ep 1: ||h_L||=1.560e+03 ||g||=6.859e-04 acc=0.1494 γ=0.0084
+ [DFA-noLN] Ep 5: ||h_L||=1.050e+04 ||g||=7.522e-04 acc=0.1748 γ=-0.0063
+ [DFA-noLN] Ep 10: ||h_L||=2.200e+04 ||g||=7.641e-04 acc=0.1445 γ=-0.0167
+ [DFA-noLN] Ep 15: ||h_L||=1.004e+05 ||g||=7.608e-04 acc=0.1738 γ=-0.0118
+ [DFA-noLN] Ep 20: ||h_L||=3.150e+05 ||g||=7.782e-04 acc=0.2070 γ=0.0027
+ [DFA-noLN] Ep 25: ||h_L||=6.817e+05 ||g||=7.884e-04 acc=0.1572 γ=0.0340
+ [DFA-noLN] Ep 30: ||h_L||=1.298e+06 ||g||=7.771e-04 acc=0.1299 γ=0.0393
+ [DFA-noLN] Ep 35: ||h_L||=2.143e+06 ||g||=7.980e-04 acc=0.0996 γ=0.0196
+ [DFA-noLN] Ep 40: ||h_L||=3.180e+06 ||g||=7.691e-04 acc=0.1016 γ=-0.0085
+ [DFA-noLN] Ep 45: ||h_L||=4.347e+06 ||g||=7.934e-04 acc=0.1582 γ=0.0262
+ [DFA-noLN] Ep 50: ||h_L||=5.552e+06 ||g||=7.869e-04 acc=0.2197 γ=0.0165
+ [DFA-noLN] Ep 55: ||h_L||=6.742e+06 ||g||=7.851e-04 acc=0.1885 γ=0.0046
+ [DFA-noLN] Ep 60: ||h_L||=7.801e+06 ||g||=7.600e-04 acc=0.1572 γ=0.0045
+ [DFA-noLN] Ep 65: ||h_L||=8.775e+06 ||g||=7.795e-04 acc=0.2031 γ=0.0088
+ [DFA-noLN] Ep 70: ||h_L||=9.556e+06 ||g||=7.968e-04 acc=0.1836 γ=0.0093
+ [DFA-noLN] Ep 75: ||h_L||=1.016e+07 ||g||=7.656e-04 acc=0.2490 γ=0.0168
+ [DFA-noLN] Ep 80: ||h_L||=1.064e+07 ||g||=7.633e-04 acc=0.2764 γ=0.0198
+ [DFA-noLN] Ep 85: ||h_L||=1.095e+07 ||g||=7.466e-04 acc=0.2773 γ=0.0195
+ [DFA-noLN] Ep 90: ||h_L||=1.107e+07 ||g||=7.453e-04 acc=0.2695 γ=0.0131
+ [DFA-noLN] Ep 95: ||h_L||=1.113e+07 ||g||=7.446e-04 acc=0.3105 γ=0.0146
+ [DFA-noLN] Ep 100: ||h_L||=1.113e+07 ||g||=7.392e-04 acc=0.3320 γ=0.0164
+
+Saved results/snapshot_no_outln_v1/snapshot_noLN_s42.json
diff --git a/results/snapshot_no_outln_v1/run_s456.log b/results/snapshot_no_outln_v1/run_s456.log
new file mode 100644
index 0000000..a0a3bd0
--- /dev/null
+++ b/results/snapshot_no_outln_v1/run_s456.log
@@ -0,0 +1,51 @@
+NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=456
+
+=== BP training (NO out_ln) ===
+ [BP-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918
+ [BP-noLN] Ep 1: ||h_L||=3.410e+01 ||g||=1.500e-04 acc=0.4365
+ [BP-noLN] Ep 5: ||h_L||=5.250e+01 ||g||=1.052e-04 acc=0.4961
+ [BP-noLN] Ep 10: ||h_L||=6.330e+01 ||g||=8.751e-05 acc=0.5596
+ [BP-noLN] Ep 15: ||h_L||=6.619e+01 ||g||=8.857e-05 acc=0.5215
+ [BP-noLN] Ep 20: ||h_L||=7.009e+01 ||g||=8.610e-05 acc=0.5420
+ [BP-noLN] Ep 25: ||h_L||=7.285e+01 ||g||=8.470e-05 acc=0.5723
+ [BP-noLN] Ep 30: ||h_L||=7.493e+01 ||g||=8.152e-05 acc=0.5938
+ [BP-noLN] Ep 35: ||h_L||=7.640e+01 ||g||=7.781e-05 acc=0.6074
+ [BP-noLN] Ep 40: ||h_L||=7.799e+01 ||g||=8.443e-05 acc=0.5938
+ [BP-noLN] Ep 45: ||h_L||=7.734e+01 ||g||=7.914e-05 acc=0.6143
+ [BP-noLN] Ep 50: ||h_L||=7.667e+01 ||g||=8.950e-05 acc=0.5996
+ [BP-noLN] Ep 55: ||h_L||=7.591e+01 ||g||=9.021e-05 acc=0.6201
+ [BP-noLN] Ep 60: ||h_L||=7.667e+01 ||g||=8.730e-05 acc=0.6338
+ [BP-noLN] Ep 65: ||h_L||=7.629e+01 ||g||=9.670e-05 acc=0.6230
+ [BP-noLN] Ep 70: ||h_L||=7.612e+01 ||g||=9.637e-05 acc=0.6260
+ [BP-noLN] Ep 75: ||h_L||=7.544e+01 ||g||=9.639e-05 acc=0.6338
+ [BP-noLN] Ep 80: ||h_L||=7.434e+01 ||g||=9.999e-05 acc=0.6455
+ [BP-noLN] Ep 85: ||h_L||=7.429e+01 ||g||=1.013e-04 acc=0.6348
+ [BP-noLN] Ep 90: ||h_L||=7.381e+01 ||g||=1.076e-04 acc=0.6348
+ [BP-noLN] Ep 95: ||h_L||=7.380e+01 ||g||=1.084e-04 acc=0.6436
+ [BP-noLN] Ep 100: ||h_L||=7.373e+01 ||g||=1.088e-04 acc=0.6465
+
+=== DFA training (NO out_ln) ===
+ [DFA-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918
+ [DFA-noLN] Ep 1: ||h_L||=1.507e+03 ||g||=6.424e-04 acc=0.2246 γ=0.0136
+ [DFA-noLN] Ep 5: ||h_L||=1.140e+04 ||g||=7.475e-04 acc=0.2314 γ=-0.0000
+ [DFA-noLN] Ep 10: ||h_L||=2.845e+04 ||g||=7.444e-04 acc=0.1895 γ=-0.0067
+ [DFA-noLN] Ep 15: ||h_L||=8.676e+04 ||g||=7.381e-04 acc=0.2549 γ=0.0039
+ [DFA-noLN] Ep 20: ||h_L||=2.707e+05 ||g||=7.761e-04 acc=0.1670 γ=0.0171
+ [DFA-noLN] Ep 25: ||h_L||=6.628e+05 ||g||=7.894e-04 acc=0.1992 γ=0.0390
+ [DFA-noLN] Ep 30: ||h_L||=1.245e+06 ||g||=7.944e-04 acc=0.1963 γ=0.0162
+ [DFA-noLN] Ep 35: ||h_L||=2.131e+06 ||g||=8.014e-04 acc=0.1904 γ=0.0128
+ [DFA-noLN] Ep 40: ||h_L||=3.242e+06 ||g||=7.965e-04 acc=0.1855 γ=0.0227
+ [DFA-noLN] Ep 45: ||h_L||=4.568e+06 ||g||=8.172e-04 acc=0.1807 γ=0.0340
+ [DFA-noLN] Ep 50: ||h_L||=6.031e+06 ||g||=8.070e-04 acc=0.1133 γ=0.0064
+ [DFA-noLN] Ep 55: ||h_L||=7.447e+06 ||g||=7.821e-04 acc=0.1924 γ=0.0273
+ [DFA-noLN] Ep 60: ||h_L||=8.862e+06 ||g||=8.033e-04 acc=0.1650 γ=0.0210
+ [DFA-noLN] Ep 65: ||h_L||=1.008e+07 ||g||=8.274e-04 acc=0.1533 γ=0.0124
+ [DFA-noLN] Ep 70: ||h_L||=1.111e+07 ||g||=7.999e-04 acc=0.2148 γ=0.0337
+ [DFA-noLN] Ep 75: ||h_L||=1.197e+07 ||g||=7.703e-04 acc=0.1953 γ=0.0403
+ [DFA-noLN] Ep 80: ||h_L||=1.256e+07 ||g||=7.954e-04 acc=0.1445 γ=-0.0076
+ [DFA-noLN] Ep 85: ||h_L||=1.292e+07 ||g||=7.205e-04 acc=0.2607 γ=0.0257
+ [DFA-noLN] Ep 90: ||h_L||=1.306e+07 ||g||=7.565e-04 acc=0.2402 γ=0.0119
+ [DFA-noLN] Ep 95: ||h_L||=1.310e+07 ||g||=7.185e-04 acc=0.3164 γ=0.0157
+ [DFA-noLN] Ep 100: ||h_L||=1.310e+07 ||g||=7.178e-04 acc=0.3359 γ=0.0173
+
+Saved results/snapshot_no_outln_v1/snapshot_noLN_s456.json
diff --git a/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json
new file mode 100644
index 0000000..7e5cb37
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json
@@ -0,0 +1,1824 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0005561555735766888,
+ 0.0005519049009308219,
+ 0.0005482902633957565,
+ 0.0005436676437966526,
+ 0.000538847001735121
+ ],
+ "acc_eval": 0.1123046875,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 736.34716796875,
+ 1637.1044921875,
+ 2033.1922607421875,
+ 2161.380859375,
+ 2126.18505859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0006836718530394137,
+ 0.0006813183426856995,
+ 0.0006814387743361294,
+ 0.0006832550279796124,
+ 0.0006794488872401416
+ ],
+ "acc_eval": 0.1953125,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1106.3868408203125,
+ 2963.552001953125,
+ 4087.33837890625,
+ 4421.4921875,
+ 4265.1083984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007476353785023093,
+ 0.0007440777844749391,
+ 0.0007443943759426475,
+ 0.0007477496401406825,
+ 0.0007366884965449572
+ ],
+ "acc_eval": 0.1044921875,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1371.9425048828125,
+ 4214.05078125,
+ 6238.47265625,
+ 6697.2333984375,
+ 6399.22314453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000730870058760047,
+ 0.00072717375587672,
+ 0.0007270713686011732,
+ 0.0007290731882676482,
+ 0.0007233614451251924
+ ],
+ "acc_eval": 0.1943359375,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1574.7962646484375,
+ 4805.0556640625,
+ 7044.64599609375,
+ 7593.78955078125,
+ 7215.32763671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007098641362972558,
+ 0.0007034889422357082,
+ 0.0007031699060462415,
+ 0.0007120345253497362,
+ 0.000694308546371758
+ ],
+ "acc_eval": 0.2451171875,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1726.088623046875,
+ 6184.34521484375,
+ 9521.791015625,
+ 10387.7236328125,
+ 9721.431640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007400272879749537,
+ 0.0007343650795519352,
+ 0.0007334973197430372,
+ 0.0007343514007516205,
+ 0.0007319966680370271
+ ],
+ "acc_eval": 0.212890625,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1902.689697265625,
+ 7697.52197265625,
+ 12328.0595703125,
+ 13597.1787109375,
+ 12504.158203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007165716378949583,
+ 0.0007126733544282615,
+ 0.0007124089752323925,
+ 0.0007126083364710212,
+ 0.0007107863784767687
+ ],
+ "acc_eval": 0.15625,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 2069.750244140625,
+ 10379.2958984375,
+ 16444.7421875,
+ 18267.94921875,
+ 16595.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007099996437318623,
+ 0.0007088935235515237,
+ 0.0007090346189215779,
+ 0.000710709486156702,
+ 0.0007023006328381598
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 2226.40673828125,
+ 12703.916015625,
+ 20184.30859375,
+ 22453.73828125,
+ 20183.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00072157580871135,
+ 0.0007210742915049195,
+ 0.0007212630589492619,
+ 0.0007244180305860937,
+ 0.0007163899717852473
+ ],
+ "acc_eval": 0.2236328125,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 2289.455078125,
+ 15611.2138671875,
+ 24559.412109375,
+ 27336.787109375,
+ 24451.6796875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007243232685141265,
+ 0.0007221215637400746,
+ 0.0007219284889288247,
+ 0.0007259267731569707,
+ 0.0007173537742346525
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 2396.09814453125,
+ 19678.587890625,
+ 30417.08203125,
+ 34140.70703125,
+ 30261.052734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007124242256395519,
+ 0.0007074667955748737,
+ 0.0007074963650666177,
+ 0.0007131542661227286,
+ 0.0007022957433946431
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 2467.864013671875,
+ 24019.642578125,
+ 41156.921875,
+ 46706.38671875,
+ 41256.71484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007333463290706277,
+ 0.0007277126424014568,
+ 0.0007268521003425121,
+ 0.000731462670955807,
+ 0.0007225224399007857
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 2518.561767578125,
+ 28957.451171875,
+ 55737.69140625,
+ 64112.609375,
+ 56246.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007202349370345473,
+ 0.0007073598098941147,
+ 0.0007049349951557815,
+ 0.0007059182389639318,
+ 0.0007044971571303904
+ ],
+ "acc_eval": 0.1513671875,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 2614.843994140625,
+ 34279.15625,
+ 74158.109375,
+ 86073.96875,
+ 75187.59375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007299556746147573,
+ 0.0007100331713445485,
+ 0.0007101728115230799,
+ 0.0007166104041971266,
+ 0.0007030466804280877
+ ],
+ "acc_eval": 0.24609375,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 2697.871337890625,
+ 41263.5390625,
+ 96222.8984375,
+ 112901.9765625,
+ 98551.3046875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007336065755225718,
+ 0.0007151410100050271,
+ 0.0007150733144953847,
+ 0.0007166287978179753,
+ 0.0007151660392992198
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 2815.983154296875,
+ 53842.3828125,
+ 126185.5625,
+ 149526.796875,
+ 130144.4765625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007365003693848848,
+ 0.0007177364313974977,
+ 0.0007168670417740941,
+ 0.000717108603566885,
+ 0.0007130720769055188
+ ],
+ "acc_eval": 0.150390625,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2928.448974609375,
+ 65162.98046875,
+ 153909.296875,
+ 184005.875,
+ 159483.03125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007613440393470228,
+ 0.000720723532140255,
+ 0.000720796815585345,
+ 0.0007208258030004799,
+ 0.0007211563643068075
+ ],
+ "acc_eval": 0.166015625,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2970.975341796875,
+ 76176.9609375,
+ 179093.75,
+ 216167.875,
+ 186723.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007602480472996831,
+ 0.0007191941258497536,
+ 0.0007163456757552922,
+ 0.0007164765265770257,
+ 0.0007142137037590146
+ ],
+ "acc_eval": 0.1796875,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 3078.336181640625,
+ 91839.40625,
+ 215980.015625,
+ 263515.15625,
+ 227071.515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007584959384985268,
+ 0.0007150565506890416,
+ 0.0007151922909542918,
+ 0.000715585716534406,
+ 0.0007152389152906835
+ ],
+ "acc_eval": 0.1767578125,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 3202.803466796875,
+ 104358.6875,
+ 248325.390625,
+ 305395.84375,
+ 262365.46875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007867171661928296,
+ 0.0007155268103815615,
+ 0.0007155817584134638,
+ 0.0007157608633860946,
+ 0.0007155768107622862
+ ],
+ "acc_eval": 0.138671875,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 3282.27490234375,
+ 117747.359375,
+ 284217.3125,
+ 351018.15625,
+ 300903.65625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007691550417803228,
+ 0.0007147297146730125,
+ 0.0007147309370338917,
+ 0.0007150261080823839,
+ 0.0007147534633986652
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 3394.945556640625,
+ 129443.9765625,
+ 317078.65625,
+ 393509.375,
+ 336658.40625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008442914695478976,
+ 0.0007179519161581993,
+ 0.0007190873729996383,
+ 0.000723545381333679,
+ 0.0007175213540904224
+ ],
+ "acc_eval": 0.1376953125,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 3484.2763671875,
+ 140426.171875,
+ 355086.84375,
+ 443148.09375,
+ 378501.53125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007702927687205374,
+ 0.0006826652679592371,
+ 0.0006794629734940827,
+ 0.0006826536264270544,
+ 0.0006794703076593578
+ ],
+ "acc_eval": 0.19140625,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 3529.414306640625,
+ 153612.265625,
+ 393522.9375,
+ 493183.03125,
+ 421284.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008731107809580863,
+ 0.0007047304534353316,
+ 0.0007038630428723991,
+ 0.000708943116478622,
+ 0.000701444165315479
+ ],
+ "acc_eval": 0.16796875,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 3604.90283203125,
+ 165405.75,
+ 423586.46875,
+ 533219.375,
+ 454992.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008110221242532134,
+ 0.0006812610663473606,
+ 0.0006812110659666359,
+ 0.0006817537359893322,
+ 0.0006813214858993888
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3761.85400390625,
+ 178944.296875,
+ 464984.875,
+ 587869.375,
+ 501438.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008038324886001647,
+ 0.0006578225293196738,
+ 0.0006502956384792924,
+ 0.000664222112391144,
+ 0.0006502254982478917
+ ],
+ "acc_eval": 0.240234375,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 3818.5869140625,
+ 193167.4375,
+ 505599.375,
+ 643764.4375,
+ 550033.3125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007956585614010692,
+ 0.0007038708426989615,
+ 0.0007025190279819071,
+ 0.0007078333292156458,
+ 0.0006988184759393334
+ ],
+ "acc_eval": 0.185546875,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 3924.1787109375,
+ 207801.1875,
+ 548741.125,
+ 701043.0625,
+ 599520.4375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009222823427990079,
+ 0.000673642847687006,
+ 0.0006724554114043713,
+ 0.0006726986612193286,
+ 0.0006725445855408907
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 4061.806884765625,
+ 222595.921875,
+ 590807.5,
+ 755718.75,
+ 646775.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008092334610410035,
+ 0.0007093537133187056,
+ 0.0007078479393385351,
+ 0.0007069098646752536,
+ 0.0007029378321021795
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 4216.11083984375,
+ 237549.296875,
+ 636429.5625,
+ 816954.9375,
+ 699524.9375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008620031294412911,
+ 0.0007326522027142346,
+ 0.00072627910412848,
+ 0.000725903722923249,
+ 0.0007269763154909015
+ ],
+ "acc_eval": 0.1533203125,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 4319.05029296875,
+ 251667.5,
+ 681409.75,
+ 874567.9375,
+ 748820.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008448463049717247,
+ 0.0007160686072893441,
+ 0.000714016379788518,
+ 0.0007141274982132018,
+ 0.0007095346227288246
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 4387.8330078125,
+ 268470.375,
+ 733153.125,
+ 943456.375,
+ 808793.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009849616326391697,
+ 0.0007160623208619654,
+ 0.0007154300110414624,
+ 0.0007152247708290815,
+ 0.0007160453242249787
+ ],
+ "acc_eval": 0.1884765625,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 4495.54638671875,
+ 291274.59375,
+ 806698.75,
+ 1039374.875,
+ 892062.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008646573405712843,
+ 0.000731874315533787,
+ 0.0007177238585427403,
+ 0.0007205329020507634,
+ 0.0007192457560449839
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 4596.96337890625,
+ 305228.46875,
+ 848072.5625,
+ 1092268.625,
+ 937583.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009474663529545069,
+ 0.0007221641135402024,
+ 0.000721680698916316,
+ 0.0007284134044311941,
+ 0.0007212713244371116
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 4724.111328125,
+ 321366.5,
+ 891238.9375,
+ 1149886.25,
+ 987910.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009131877450272441,
+ 0.0007397676818072796,
+ 0.0007398735033348203,
+ 0.0007397927111014724,
+ 0.0007406016811728477
+ ],
+ "acc_eval": 0.125,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 4865.970703125,
+ 344027.15625,
+ 946722.0625,
+ 1219714.625,
+ 1049445.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001010064734145999,
+ 0.0007341124583035707,
+ 0.0007336883572861552,
+ 0.0007345521007664502,
+ 0.0007338698487728834
+ ],
+ "acc_eval": 0.119140625,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 5003.3857421875,
+ 373410.21875,
+ 1026535.0625,
+ 1321456.25,
+ 1139824.625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010555180488154292,
+ 0.0007112861494533718,
+ 0.0007111895247362554,
+ 0.0007112334715202451,
+ 0.000711193191818893
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 5121.19287109375,
+ 405646.9375,
+ 1111111.125,
+ 1430716.625,
+ 1237074.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010308363707736135,
+ 0.0007563655963167548,
+ 0.0007560031372122467,
+ 0.000755665882024914,
+ 0.0007561628590337932
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 5212.7294921875,
+ 434054.15625,
+ 1180238.125,
+ 1518019.875,
+ 1314350.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001035128254443407,
+ 0.0007314062095247209,
+ 0.0007304889149963856,
+ 0.0007291524088941514,
+ 0.0007313747191801667
+ ],
+ "acc_eval": 0.140625,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 5322.74951171875,
+ 462000.6875,
+ 1248006.75,
+ 1606243.125,
+ 1392563.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009023830061778426,
+ 0.000720554031431675,
+ 0.0007195135112851858,
+ 0.0007197313825599849,
+ 0.0007196948863565922
+ ],
+ "acc_eval": 0.1708984375,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 5453.89111328125,
+ 498941.0625,
+ 1343521.0,
+ 1731177.375,
+ 1504101.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010444134240970016,
+ 0.0007362678297795355,
+ 0.0007352089160121977,
+ 0.0007340405718423426,
+ 0.0007357052527368069
+ ],
+ "acc_eval": 0.1328125,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 5515.6982421875,
+ 529817.75,
+ 1409505.625,
+ 1816151.0,
+ 1580539.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011280628386884928,
+ 0.0007231750059872866,
+ 0.0007211649208329618,
+ 0.000721275107935071,
+ 0.0007212632917799056
+ ],
+ "acc_eval": 0.1611328125,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 5617.26513671875,
+ 567492.4375,
+ 1498097.5,
+ 1931607.875,
+ 1684206.875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010544253746047616,
+ 0.0007354306289926171,
+ 0.0007348860381171107,
+ 0.0007349851075559855,
+ 0.0007350810337811708
+ ],
+ "acc_eval": 0.1416015625,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 5740.7978515625,
+ 596215.625,
+ 1561745.25,
+ 2014107.25,
+ 1758526.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010764201870188117,
+ 0.0007244387525133789,
+ 0.000723967794328928,
+ 0.000724096957128495,
+ 0.0007241644198074937
+ ],
+ "acc_eval": 0.19921875,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 5808.19677734375,
+ 630780.3125,
+ 1636034.875,
+ 2109305.75,
+ 1845552.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010526466649025679,
+ 0.0007206913433037698,
+ 0.0007207048474811018,
+ 0.0007211468764580786,
+ 0.0007207895396277308
+ ],
+ "acc_eval": 0.173828125,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 5868.3583984375,
+ 673578.625,
+ 1729325.25,
+ 2227518.0,
+ 1953361.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009479392319917679,
+ 0.0007091389270499349,
+ 0.0007090644794516265,
+ 0.0007082624360918999,
+ 0.0007085782708600163
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 5953.82421875,
+ 720273.0,
+ 1840695.5,
+ 2372038.0,
+ 2084658.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0014002618845552206,
+ 0.0007315247785300016,
+ 0.0007256051758304238,
+ 0.0007254919619299471,
+ 0.000725599646102637
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 6054.7861328125,
+ 758000.6875,
+ 1930354.375,
+ 2488163.75,
+ 2190582.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001109408913180232,
+ 0.0007018125616014004,
+ 0.0007016566814854741,
+ 0.000701890152413398,
+ 0.0007018494652584195
+ ],
+ "acc_eval": 0.203125,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 6155.0859375,
+ 790443.0,
+ 2009565.875,
+ 2590829.25,
+ 2285268.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010253023356199265,
+ 0.0007347314967773855,
+ 0.0007304528844542801,
+ 0.0007322027231566608,
+ 0.0007312395609915257
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 6216.64453125,
+ 830678.125,
+ 2088773.5,
+ 2691122.0,
+ 2376731.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010403504129499197,
+ 0.0006902964669279754,
+ 0.0006906419876031578,
+ 0.0006905900663696229,
+ 0.0006906461785547435
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 6252.98486328125,
+ 867790.1875,
+ 2159729.75,
+ 2781409.5,
+ 2460902.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011370684951543808,
+ 0.0007390088285319507,
+ 0.0007305812323465943,
+ 0.0007310720975510776,
+ 0.0007304322207346559
+ ],
+ "acc_eval": 0.15234375,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 6294.51611328125,
+ 897267.5625,
+ 2218282.5,
+ 2858224.75,
+ 2530432.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0013790406519547105,
+ 0.0007320911972783506,
+ 0.0007304649334400892,
+ 0.0007293879170902073,
+ 0.0007303770980797708
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 6312.2314453125,
+ 935570.375,
+ 2299086.0,
+ 2963619.0,
+ 2627515.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000999285257421434,
+ 0.0007227054447866976,
+ 0.0007246703025884926,
+ 0.0007245387532748282,
+ 0.0007243558065965772
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 6387.30322265625,
+ 977101.125,
+ 2387243.0,
+ 3077676.25,
+ 2733147.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001396833686158061,
+ 0.0007110408041626215,
+ 0.0007093287422321737,
+ 0.000708233390469104,
+ 0.0007085108081810176
+ ],
+ "acc_eval": 0.1787109375,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 6406.59033203125,
+ 1011753.1875,
+ 2450391.25,
+ 3158275.0,
+ 2807055.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0012408416951075196,
+ 0.0007304692408069968,
+ 0.000724659999832511,
+ 0.0007247650064527988,
+ 0.0007249858463183045
+ ],
+ "acc_eval": 0.130859375,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 6396.32080078125,
+ 1051044.375,
+ 2521085.5,
+ 3249326.75,
+ 2890642.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010854896390810609,
+ 0.0006957638543099165,
+ 0.0006896257400512695,
+ 0.0006964386557228863,
+ 0.0006897017010487616
+ ],
+ "acc_eval": 0.234375,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 6413.91357421875,
+ 1083474.5,
+ 2597945.5,
+ 3348271.5,
+ 2981405.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00098806235473603,
+ 0.000719150179065764,
+ 0.0007170068565756083,
+ 0.0007178731029853225,
+ 0.0007173708290793002
+ ],
+ "acc_eval": 0.205078125,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 6406.4228515625,
+ 1124429.875,
+ 2675529.5,
+ 3447474.25,
+ 3073241.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001149638439528644,
+ 0.0007225789595395327,
+ 0.0007212197524495423,
+ 0.0007210947806015611,
+ 0.0007211659685708582
+ ],
+ "acc_eval": 0.1494140625,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 6443.423828125,
+ 1166184.375,
+ 2758561.25,
+ 3551879.75,
+ 3171214.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001115654013119638,
+ 0.000685695675201714,
+ 0.0006846366450190544,
+ 0.0006861463189125061,
+ 0.0006862673326395452
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 6477.5,
+ 1208826.0,
+ 2842194.75,
+ 3654862.0,
+ 3267617.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000923235435038805,
+ 0.0006659153732471168,
+ 0.0006642267107963562,
+ 0.0006722065154463053,
+ 0.000664416525978595
+ ],
+ "acc_eval": 0.2353515625,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 6486.1689453125,
+ 1249377.0,
+ 2928293.75,
+ 3765881.75,
+ 3370835.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008846685523167253,
+ 0.0006866253679618239,
+ 0.000686973100528121,
+ 0.0006869880016893148,
+ 0.0006870955694466829
+ ],
+ "acc_eval": 0.2373046875,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 6499.3720703125,
+ 1291233.25,
+ 3012714.75,
+ 3873429.75,
+ 3471234.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009820004925131798,
+ 0.0007174524944275618,
+ 0.0007178467349149287,
+ 0.0007176626822911203,
+ 0.0007174718775786459
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 6486.14404296875,
+ 1327247.75,
+ 3088322.75,
+ 3971415.75,
+ 3562299.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010241338750347495,
+ 0.0007171124452725053,
+ 0.0007174332858994603,
+ 0.0007172181503847241,
+ 0.0007169945747591555
+ ],
+ "acc_eval": 0.18359375,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 6455.17236328125,
+ 1355067.375,
+ 3142698.25,
+ 4041006.5,
+ 3627490.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009781530825421214,
+ 0.0007034538430161774,
+ 0.000703376077581197,
+ 0.0007118352805264294,
+ 0.0007080681971274316
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 6454.62841796875,
+ 1384795.75,
+ 3199654.0,
+ 4114095.75,
+ 3696468.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009227422997355461,
+ 0.0007023688522167504,
+ 0.0007012909045442939,
+ 0.0007004260551184416,
+ 0.0007006779196672142
+ ],
+ "acc_eval": 0.21484375,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 6451.345703125,
+ 1420232.75,
+ 3260116.5,
+ 4190244.25,
+ 3768354.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008870494784787297,
+ 0.0007146014831960201,
+ 0.0007149986922740936,
+ 0.0007148014265112579,
+ 0.0007145918207243085
+ ],
+ "acc_eval": 0.197265625,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 6445.890625,
+ 1448264.875,
+ 3319505.0,
+ 4267505.0,
+ 3840047.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010003555798903108,
+ 0.0007171350298449397,
+ 0.0007168895681388676,
+ 0.0007169176824390888,
+ 0.0007170233875513077
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 6440.8212890625,
+ 1478082.75,
+ 3376291.25,
+ 4340727.0,
+ 3909334.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009646597318351269,
+ 0.0007130720769055188,
+ 0.0007134011830203235,
+ 0.0007131980964913964,
+ 0.0007129770237952471
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 6398.03955078125,
+ 1508487.5,
+ 3436526.25,
+ 4417271.5,
+ 3981251.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009445869363844395,
+ 0.0007122856914065778,
+ 0.0007126569980755448,
+ 0.0007124742260202765,
+ 0.0007122504175640643
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 6389.02392578125,
+ 1530834.625,
+ 3480246.5,
+ 4471170.0,
+ 4032576.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009853171650320292,
+ 0.0006874292739666998,
+ 0.0006876476109027863,
+ 0.0006881517474539578,
+ 0.0006880395230837166
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 6338.54443359375,
+ 1561198.875,
+ 3541681.5,
+ 4548099.0,
+ 4105499.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009333671187050641,
+ 0.0006952910916879773,
+ 0.0006947650690563023,
+ 0.0006940987077541649,
+ 0.0006943742628209293
+ ],
+ "acc_eval": 0.23046875,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 6280.18603515625,
+ 1585008.0,
+ 3589125.25,
+ 4608667.0,
+ 4162480.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009699579677544534,
+ 0.0007101434166543186,
+ 0.0007104446412995458,
+ 0.000710242718923837,
+ 0.0007100136135704815
+ ],
+ "acc_eval": 0.146484375,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 6252.455078125,
+ 1608187.875,
+ 3635014.75,
+ 4667478.5,
+ 4218253.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008955001248978078,
+ 0.0006863236776553094,
+ 0.0006864941096864641,
+ 0.000687020889017731,
+ 0.0006868807831779122
+ ],
+ "acc_eval": 0.2431640625,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 6201.6845703125,
+ 1619508.875,
+ 3661275.25,
+ 4700652.0,
+ 4249921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009069991065189242,
+ 0.0006539999740198255,
+ 0.0006531713879667222,
+ 0.0006594359292648733,
+ 0.000653320224955678
+ ],
+ "acc_eval": 0.2216796875,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 6182.8115234375,
+ 1632587.875,
+ 3679586.25,
+ 4722070.5,
+ 4271567.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009595821611583233,
+ 0.0007079984061419964,
+ 0.0007082773372530937,
+ 0.0007081056828610599,
+ 0.000707884959410876
+ ],
+ "acc_eval": 0.193359375,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 6153.7392578125,
+ 1653576.875,
+ 3722935.0,
+ 4776921.0,
+ 4323508.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008598894928582013,
+ 0.0007073319284245372,
+ 0.0007075938628986478,
+ 0.0007074539898894727,
+ 0.0007072555599734187
+ ],
+ "acc_eval": 0.201171875,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 6135.21240234375,
+ 1667474.375,
+ 3750912.75,
+ 4812450.5,
+ 4357575.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009454588289372623,
+ 0.0007068001432344317,
+ 0.0007069715647958219,
+ 0.0007067638216540217,
+ 0.0007065933896228671
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 6085.7109375,
+ 1679251.75,
+ 3774334.5,
+ 4840148.5,
+ 4384792.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008410231093876064,
+ 0.0006843701121397316,
+ 0.0006845371681265533,
+ 0.00068506138632074,
+ 0.0006849151104688644
+ ],
+ "acc_eval": 0.2578125,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 6042.693359375,
+ 1685705.5,
+ 3787479.75,
+ 4856211.0,
+ 4400193.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008572259685024619,
+ 0.0006840305286459625,
+ 0.0006841861759312451,
+ 0.0006847094628028572,
+ 0.0006845552125014365
+ ],
+ "acc_eval": 0.2568359375,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 6003.5390625,
+ 1702685.5,
+ 3813174.5,
+ 4888481.0,
+ 4430612.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008342780056409538,
+ 0.0006777377566322684,
+ 0.0006779460818506777,
+ 0.0006789933540858328,
+ 0.0006781259435229003
+ ],
+ "acc_eval": 0.2685546875,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 5948.60107421875,
+ 1714243.125,
+ 3830846.5,
+ 4910337.5,
+ 4451921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008218465954996645,
+ 0.0006832804065197706,
+ 0.0006831764476373792,
+ 0.0006826326716691256,
+ 0.0006829035119153559
+ ],
+ "acc_eval": 0.2529296875,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 5881.8525390625,
+ 1718113.375,
+ 3838036.5,
+ 4920025.5,
+ 4461931.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007958809728734195,
+ 0.000677398347761482,
+ 0.0006775528891012073,
+ 0.0006775871734134853,
+ 0.0006777321686968207
+ ],
+ "acc_eval": 0.2548828125,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 5816.7880859375,
+ 1723461.25,
+ 3850904.75,
+ 4936806.0,
+ 4478473.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008361428044736385,
+ 0.0006769691244699061,
+ 0.0006771331536583602,
+ 0.0006771665066480637,
+ 0.0006773129571229219
+ ],
+ "acc_eval": 0.251953125,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 5760.41845703125,
+ 1732135.25,
+ 3859576.0,
+ 4947171.0,
+ 4488986.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008036325452849269,
+ 0.0006821549613960087,
+ 0.0006806753808632493,
+ 0.0006799713592045009,
+ 0.0006802318384870887
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 5710.22998046875,
+ 1740014.25,
+ 3871992.25,
+ 4962337.5,
+ 4503463.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008278922759927809,
+ 0.0006754198693670332,
+ 0.000675307004712522,
+ 0.0006768241291865706,
+ 0.0006769676692783833
+ ],
+ "acc_eval": 0.26171875,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 5685.73828125,
+ 1745863.25,
+ 3880256.75,
+ 4973639.5,
+ 4514457.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008255501161329448,
+ 0.0006466225022450089,
+ 0.0006466452032327652,
+ 0.0006467151688411832,
+ 0.0006467655766755342
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 5637.498046875,
+ 1743128.375,
+ 3879796.5,
+ 4973009.0,
+ 4514424.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008148956694640219,
+ 0.0006465681362897158,
+ 0.0006463592289946973,
+ 0.0006491504609584808,
+ 0.0006464755861088634
+ ],
+ "acc_eval": 0.2587890625,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 5601.87744140625,
+ 1741859.375,
+ 3884447.75,
+ 4978445.5,
+ 4518886.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008254973217844963,
+ 0.0006783050484955311,
+ 0.0006774527719244361,
+ 0.0006768335006199777,
+ 0.0006770920008420944
+ ],
+ "acc_eval": 0.298828125,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 5587.505859375,
+ 1748285.875,
+ 3887730.5,
+ 4982144.0,
+ 4523151.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008113561780191958,
+ 0.0006764904828742146,
+ 0.000676542054861784,
+ 0.0006762324483133852,
+ 0.0006764894351363182
+ ],
+ "acc_eval": 0.2734375,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 5553.013671875,
+ 1748456.75,
+ 3890722.0,
+ 4986538.5,
+ 4527315.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007909060223028064,
+ 0.0006763285491615534,
+ 0.0006762049742974341,
+ 0.0006756742368452251,
+ 0.000675930583383888
+ ],
+ "acc_eval": 0.2861328125,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 5524.611328125,
+ 1748210.0,
+ 3893003.75,
+ 4989732.5,
+ 4530436.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000797618820797652,
+ 0.0006453269743360579,
+ 0.0006453663809224963,
+ 0.0006454290705733001,
+ 0.0006454723770730197
+ ],
+ "acc_eval": 0.28515625,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 5506.21923828125,
+ 1750958.0,
+ 3894639.5,
+ 4992073.0,
+ 4532399.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007834367570467293,
+ 0.0006762953125871718,
+ 0.0006754640489816666,
+ 0.0006748714949935675,
+ 0.0006751226610504091
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 5485.10791015625,
+ 1747546.25,
+ 3895030.0,
+ 4992480.5,
+ 4532805.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007779909064993262,
+ 0.0006450997898355126,
+ 0.0006451247027143836,
+ 0.0006455867551267147,
+ 0.0006452234229072928
+ ],
+ "acc_eval": 0.2890625,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 5464.07763671875,
+ 1749313.125,
+ 3894610.75,
+ 4991684.0,
+ 4532270.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008090221090242267,
+ 0.0006661301013082266,
+ 0.0006646219990216196,
+ 0.0006726695573888719,
+ 0.0006649038987234235
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 5451.2841796875,
+ 1749389.0,
+ 3894315.25,
+ 4990837.5,
+ 4531011.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007907215040177107,
+ 0.0006448677740991116,
+ 0.0006448915228247643,
+ 0.0006451430963352323,
+ 0.0006449950742535293
+ ],
+ "acc_eval": 0.2958984375,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 5437.77099609375,
+ 1750653.125,
+ 3895251.75,
+ 4992303.0,
+ 4532441.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007774807745590806,
+ 0.000676269584801048,
+ 0.0006763145211152732,
+ 0.0006763775018043816,
+ 0.000676501716952771
+ ],
+ "acc_eval": 0.2763671875,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 5427.34619140625,
+ 1751408.875,
+ 3894547.75,
+ 4991554.5,
+ 4532145.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797307334840298,
+ 0.000664835621137172,
+ 0.0006642266525886953,
+ 0.000671364541631192,
+ 0.0006645115208812058
+ ],
+ "acc_eval": 0.296875,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 5420.30615234375,
+ 1751757.5,
+ 3894027.5,
+ 4991042.0,
+ 4531674.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797667058184743,
+ 0.0006446840125136077,
+ 0.0006447113119065762,
+ 0.0006447701598517597,
+ 0.0006448116037063301
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 5416.81396484375,
+ 1751629.625,
+ 3893959.25,
+ 4991021.5,
+ 4531639.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007706825854256749,
+ 0.0006446407060138881,
+ 0.0006406756583601236,
+ 0.0006447536870837212,
+ 0.0006393496878445148
+ ],
+ "acc_eval": 0.306640625,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 5415.3095703125,
+ 1751552.75,
+ 3893897.0,
+ 4990973.0,
+ 4531587.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007776900893077254,
+ 0.0006458400748670101,
+ 0.0006446869228966534,
+ 0.0006466003833338618,
+ 0.0006447876221500337
+ ],
+ "acc_eval": 0.2978515625,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 5414.92822265625,
+ 1751530.25,
+ 3893876.5,
+ 4990954.0,
+ 4531568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007761479937471449,
+ 0.0006465426995418966,
+ 0.0006446881452575326,
+ 0.0006466349004767835,
+ 0.0006447875639423728
+ ],
+ "acc_eval": 0.294921875,
+ "epoch": 100
+ }
+ ],
+ "arch": "resmlp_noln",
+ "seed": 42
+} \ No newline at end of file
diff --git a/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json
new file mode 100644
index 0000000..7e5cb37
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json
@@ -0,0 +1,1824 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0005561555735766888,
+ 0.0005519049009308219,
+ 0.0005482902633957565,
+ 0.0005436676437966526,
+ 0.000538847001735121
+ ],
+ "acc_eval": 0.1123046875,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 736.34716796875,
+ 1637.1044921875,
+ 2033.1922607421875,
+ 2161.380859375,
+ 2126.18505859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0006836718530394137,
+ 0.0006813183426856995,
+ 0.0006814387743361294,
+ 0.0006832550279796124,
+ 0.0006794488872401416
+ ],
+ "acc_eval": 0.1953125,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1106.3868408203125,
+ 2963.552001953125,
+ 4087.33837890625,
+ 4421.4921875,
+ 4265.1083984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007476353785023093,
+ 0.0007440777844749391,
+ 0.0007443943759426475,
+ 0.0007477496401406825,
+ 0.0007366884965449572
+ ],
+ "acc_eval": 0.1044921875,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1371.9425048828125,
+ 4214.05078125,
+ 6238.47265625,
+ 6697.2333984375,
+ 6399.22314453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000730870058760047,
+ 0.00072717375587672,
+ 0.0007270713686011732,
+ 0.0007290731882676482,
+ 0.0007233614451251924
+ ],
+ "acc_eval": 0.1943359375,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1574.7962646484375,
+ 4805.0556640625,
+ 7044.64599609375,
+ 7593.78955078125,
+ 7215.32763671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007098641362972558,
+ 0.0007034889422357082,
+ 0.0007031699060462415,
+ 0.0007120345253497362,
+ 0.000694308546371758
+ ],
+ "acc_eval": 0.2451171875,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1726.088623046875,
+ 6184.34521484375,
+ 9521.791015625,
+ 10387.7236328125,
+ 9721.431640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007400272879749537,
+ 0.0007343650795519352,
+ 0.0007334973197430372,
+ 0.0007343514007516205,
+ 0.0007319966680370271
+ ],
+ "acc_eval": 0.212890625,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1902.689697265625,
+ 7697.52197265625,
+ 12328.0595703125,
+ 13597.1787109375,
+ 12504.158203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007165716378949583,
+ 0.0007126733544282615,
+ 0.0007124089752323925,
+ 0.0007126083364710212,
+ 0.0007107863784767687
+ ],
+ "acc_eval": 0.15625,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 2069.750244140625,
+ 10379.2958984375,
+ 16444.7421875,
+ 18267.94921875,
+ 16595.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007099996437318623,
+ 0.0007088935235515237,
+ 0.0007090346189215779,
+ 0.000710709486156702,
+ 0.0007023006328381598
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 2226.40673828125,
+ 12703.916015625,
+ 20184.30859375,
+ 22453.73828125,
+ 20183.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00072157580871135,
+ 0.0007210742915049195,
+ 0.0007212630589492619,
+ 0.0007244180305860937,
+ 0.0007163899717852473
+ ],
+ "acc_eval": 0.2236328125,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 2289.455078125,
+ 15611.2138671875,
+ 24559.412109375,
+ 27336.787109375,
+ 24451.6796875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007243232685141265,
+ 0.0007221215637400746,
+ 0.0007219284889288247,
+ 0.0007259267731569707,
+ 0.0007173537742346525
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 2396.09814453125,
+ 19678.587890625,
+ 30417.08203125,
+ 34140.70703125,
+ 30261.052734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007124242256395519,
+ 0.0007074667955748737,
+ 0.0007074963650666177,
+ 0.0007131542661227286,
+ 0.0007022957433946431
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 2467.864013671875,
+ 24019.642578125,
+ 41156.921875,
+ 46706.38671875,
+ 41256.71484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007333463290706277,
+ 0.0007277126424014568,
+ 0.0007268521003425121,
+ 0.000731462670955807,
+ 0.0007225224399007857
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 2518.561767578125,
+ 28957.451171875,
+ 55737.69140625,
+ 64112.609375,
+ 56246.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007202349370345473,
+ 0.0007073598098941147,
+ 0.0007049349951557815,
+ 0.0007059182389639318,
+ 0.0007044971571303904
+ ],
+ "acc_eval": 0.1513671875,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 2614.843994140625,
+ 34279.15625,
+ 74158.109375,
+ 86073.96875,
+ 75187.59375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007299556746147573,
+ 0.0007100331713445485,
+ 0.0007101728115230799,
+ 0.0007166104041971266,
+ 0.0007030466804280877
+ ],
+ "acc_eval": 0.24609375,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 2697.871337890625,
+ 41263.5390625,
+ 96222.8984375,
+ 112901.9765625,
+ 98551.3046875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007336065755225718,
+ 0.0007151410100050271,
+ 0.0007150733144953847,
+ 0.0007166287978179753,
+ 0.0007151660392992198
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 2815.983154296875,
+ 53842.3828125,
+ 126185.5625,
+ 149526.796875,
+ 130144.4765625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007365003693848848,
+ 0.0007177364313974977,
+ 0.0007168670417740941,
+ 0.000717108603566885,
+ 0.0007130720769055188
+ ],
+ "acc_eval": 0.150390625,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2928.448974609375,
+ 65162.98046875,
+ 153909.296875,
+ 184005.875,
+ 159483.03125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007613440393470228,
+ 0.000720723532140255,
+ 0.000720796815585345,
+ 0.0007208258030004799,
+ 0.0007211563643068075
+ ],
+ "acc_eval": 0.166015625,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2970.975341796875,
+ 76176.9609375,
+ 179093.75,
+ 216167.875,
+ 186723.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007602480472996831,
+ 0.0007191941258497536,
+ 0.0007163456757552922,
+ 0.0007164765265770257,
+ 0.0007142137037590146
+ ],
+ "acc_eval": 0.1796875,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 3078.336181640625,
+ 91839.40625,
+ 215980.015625,
+ 263515.15625,
+ 227071.515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007584959384985268,
+ 0.0007150565506890416,
+ 0.0007151922909542918,
+ 0.000715585716534406,
+ 0.0007152389152906835
+ ],
+ "acc_eval": 0.1767578125,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 3202.803466796875,
+ 104358.6875,
+ 248325.390625,
+ 305395.84375,
+ 262365.46875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007867171661928296,
+ 0.0007155268103815615,
+ 0.0007155817584134638,
+ 0.0007157608633860946,
+ 0.0007155768107622862
+ ],
+ "acc_eval": 0.138671875,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 3282.27490234375,
+ 117747.359375,
+ 284217.3125,
+ 351018.15625,
+ 300903.65625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007691550417803228,
+ 0.0007147297146730125,
+ 0.0007147309370338917,
+ 0.0007150261080823839,
+ 0.0007147534633986652
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 3394.945556640625,
+ 129443.9765625,
+ 317078.65625,
+ 393509.375,
+ 336658.40625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008442914695478976,
+ 0.0007179519161581993,
+ 0.0007190873729996383,
+ 0.000723545381333679,
+ 0.0007175213540904224
+ ],
+ "acc_eval": 0.1376953125,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 3484.2763671875,
+ 140426.171875,
+ 355086.84375,
+ 443148.09375,
+ 378501.53125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007702927687205374,
+ 0.0006826652679592371,
+ 0.0006794629734940827,
+ 0.0006826536264270544,
+ 0.0006794703076593578
+ ],
+ "acc_eval": 0.19140625,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 3529.414306640625,
+ 153612.265625,
+ 393522.9375,
+ 493183.03125,
+ 421284.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008731107809580863,
+ 0.0007047304534353316,
+ 0.0007038630428723991,
+ 0.000708943116478622,
+ 0.000701444165315479
+ ],
+ "acc_eval": 0.16796875,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 3604.90283203125,
+ 165405.75,
+ 423586.46875,
+ 533219.375,
+ 454992.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008110221242532134,
+ 0.0006812610663473606,
+ 0.0006812110659666359,
+ 0.0006817537359893322,
+ 0.0006813214858993888
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3761.85400390625,
+ 178944.296875,
+ 464984.875,
+ 587869.375,
+ 501438.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008038324886001647,
+ 0.0006578225293196738,
+ 0.0006502956384792924,
+ 0.000664222112391144,
+ 0.0006502254982478917
+ ],
+ "acc_eval": 0.240234375,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 3818.5869140625,
+ 193167.4375,
+ 505599.375,
+ 643764.4375,
+ 550033.3125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007956585614010692,
+ 0.0007038708426989615,
+ 0.0007025190279819071,
+ 0.0007078333292156458,
+ 0.0006988184759393334
+ ],
+ "acc_eval": 0.185546875,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 3924.1787109375,
+ 207801.1875,
+ 548741.125,
+ 701043.0625,
+ 599520.4375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009222823427990079,
+ 0.000673642847687006,
+ 0.0006724554114043713,
+ 0.0006726986612193286,
+ 0.0006725445855408907
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 4061.806884765625,
+ 222595.921875,
+ 590807.5,
+ 755718.75,
+ 646775.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008092334610410035,
+ 0.0007093537133187056,
+ 0.0007078479393385351,
+ 0.0007069098646752536,
+ 0.0007029378321021795
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 4216.11083984375,
+ 237549.296875,
+ 636429.5625,
+ 816954.9375,
+ 699524.9375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008620031294412911,
+ 0.0007326522027142346,
+ 0.00072627910412848,
+ 0.000725903722923249,
+ 0.0007269763154909015
+ ],
+ "acc_eval": 0.1533203125,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 4319.05029296875,
+ 251667.5,
+ 681409.75,
+ 874567.9375,
+ 748820.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008448463049717247,
+ 0.0007160686072893441,
+ 0.000714016379788518,
+ 0.0007141274982132018,
+ 0.0007095346227288246
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 4387.8330078125,
+ 268470.375,
+ 733153.125,
+ 943456.375,
+ 808793.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009849616326391697,
+ 0.0007160623208619654,
+ 0.0007154300110414624,
+ 0.0007152247708290815,
+ 0.0007160453242249787
+ ],
+ "acc_eval": 0.1884765625,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 4495.54638671875,
+ 291274.59375,
+ 806698.75,
+ 1039374.875,
+ 892062.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008646573405712843,
+ 0.000731874315533787,
+ 0.0007177238585427403,
+ 0.0007205329020507634,
+ 0.0007192457560449839
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 4596.96337890625,
+ 305228.46875,
+ 848072.5625,
+ 1092268.625,
+ 937583.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009474663529545069,
+ 0.0007221641135402024,
+ 0.000721680698916316,
+ 0.0007284134044311941,
+ 0.0007212713244371116
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 4724.111328125,
+ 321366.5,
+ 891238.9375,
+ 1149886.25,
+ 987910.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009131877450272441,
+ 0.0007397676818072796,
+ 0.0007398735033348203,
+ 0.0007397927111014724,
+ 0.0007406016811728477
+ ],
+ "acc_eval": 0.125,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 4865.970703125,
+ 344027.15625,
+ 946722.0625,
+ 1219714.625,
+ 1049445.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001010064734145999,
+ 0.0007341124583035707,
+ 0.0007336883572861552,
+ 0.0007345521007664502,
+ 0.0007338698487728834
+ ],
+ "acc_eval": 0.119140625,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 5003.3857421875,
+ 373410.21875,
+ 1026535.0625,
+ 1321456.25,
+ 1139824.625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010555180488154292,
+ 0.0007112861494533718,
+ 0.0007111895247362554,
+ 0.0007112334715202451,
+ 0.000711193191818893
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 5121.19287109375,
+ 405646.9375,
+ 1111111.125,
+ 1430716.625,
+ 1237074.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010308363707736135,
+ 0.0007563655963167548,
+ 0.0007560031372122467,
+ 0.000755665882024914,
+ 0.0007561628590337932
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 5212.7294921875,
+ 434054.15625,
+ 1180238.125,
+ 1518019.875,
+ 1314350.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001035128254443407,
+ 0.0007314062095247209,
+ 0.0007304889149963856,
+ 0.0007291524088941514,
+ 0.0007313747191801667
+ ],
+ "acc_eval": 0.140625,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 5322.74951171875,
+ 462000.6875,
+ 1248006.75,
+ 1606243.125,
+ 1392563.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009023830061778426,
+ 0.000720554031431675,
+ 0.0007195135112851858,
+ 0.0007197313825599849,
+ 0.0007196948863565922
+ ],
+ "acc_eval": 0.1708984375,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 5453.89111328125,
+ 498941.0625,
+ 1343521.0,
+ 1731177.375,
+ 1504101.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010444134240970016,
+ 0.0007362678297795355,
+ 0.0007352089160121977,
+ 0.0007340405718423426,
+ 0.0007357052527368069
+ ],
+ "acc_eval": 0.1328125,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 5515.6982421875,
+ 529817.75,
+ 1409505.625,
+ 1816151.0,
+ 1580539.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011280628386884928,
+ 0.0007231750059872866,
+ 0.0007211649208329618,
+ 0.000721275107935071,
+ 0.0007212632917799056
+ ],
+ "acc_eval": 0.1611328125,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 5617.26513671875,
+ 567492.4375,
+ 1498097.5,
+ 1931607.875,
+ 1684206.875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010544253746047616,
+ 0.0007354306289926171,
+ 0.0007348860381171107,
+ 0.0007349851075559855,
+ 0.0007350810337811708
+ ],
+ "acc_eval": 0.1416015625,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 5740.7978515625,
+ 596215.625,
+ 1561745.25,
+ 2014107.25,
+ 1758526.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010764201870188117,
+ 0.0007244387525133789,
+ 0.000723967794328928,
+ 0.000724096957128495,
+ 0.0007241644198074937
+ ],
+ "acc_eval": 0.19921875,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 5808.19677734375,
+ 630780.3125,
+ 1636034.875,
+ 2109305.75,
+ 1845552.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010526466649025679,
+ 0.0007206913433037698,
+ 0.0007207048474811018,
+ 0.0007211468764580786,
+ 0.0007207895396277308
+ ],
+ "acc_eval": 0.173828125,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 5868.3583984375,
+ 673578.625,
+ 1729325.25,
+ 2227518.0,
+ 1953361.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009479392319917679,
+ 0.0007091389270499349,
+ 0.0007090644794516265,
+ 0.0007082624360918999,
+ 0.0007085782708600163
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 5953.82421875,
+ 720273.0,
+ 1840695.5,
+ 2372038.0,
+ 2084658.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0014002618845552206,
+ 0.0007315247785300016,
+ 0.0007256051758304238,
+ 0.0007254919619299471,
+ 0.000725599646102637
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 6054.7861328125,
+ 758000.6875,
+ 1930354.375,
+ 2488163.75,
+ 2190582.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001109408913180232,
+ 0.0007018125616014004,
+ 0.0007016566814854741,
+ 0.000701890152413398,
+ 0.0007018494652584195
+ ],
+ "acc_eval": 0.203125,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 6155.0859375,
+ 790443.0,
+ 2009565.875,
+ 2590829.25,
+ 2285268.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010253023356199265,
+ 0.0007347314967773855,
+ 0.0007304528844542801,
+ 0.0007322027231566608,
+ 0.0007312395609915257
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 6216.64453125,
+ 830678.125,
+ 2088773.5,
+ 2691122.0,
+ 2376731.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010403504129499197,
+ 0.0006902964669279754,
+ 0.0006906419876031578,
+ 0.0006905900663696229,
+ 0.0006906461785547435
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 6252.98486328125,
+ 867790.1875,
+ 2159729.75,
+ 2781409.5,
+ 2460902.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011370684951543808,
+ 0.0007390088285319507,
+ 0.0007305812323465943,
+ 0.0007310720975510776,
+ 0.0007304322207346559
+ ],
+ "acc_eval": 0.15234375,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 6294.51611328125,
+ 897267.5625,
+ 2218282.5,
+ 2858224.75,
+ 2530432.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0013790406519547105,
+ 0.0007320911972783506,
+ 0.0007304649334400892,
+ 0.0007293879170902073,
+ 0.0007303770980797708
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 6312.2314453125,
+ 935570.375,
+ 2299086.0,
+ 2963619.0,
+ 2627515.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000999285257421434,
+ 0.0007227054447866976,
+ 0.0007246703025884926,
+ 0.0007245387532748282,
+ 0.0007243558065965772
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 6387.30322265625,
+ 977101.125,
+ 2387243.0,
+ 3077676.25,
+ 2733147.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001396833686158061,
+ 0.0007110408041626215,
+ 0.0007093287422321737,
+ 0.000708233390469104,
+ 0.0007085108081810176
+ ],
+ "acc_eval": 0.1787109375,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 6406.59033203125,
+ 1011753.1875,
+ 2450391.25,
+ 3158275.0,
+ 2807055.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0012408416951075196,
+ 0.0007304692408069968,
+ 0.000724659999832511,
+ 0.0007247650064527988,
+ 0.0007249858463183045
+ ],
+ "acc_eval": 0.130859375,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 6396.32080078125,
+ 1051044.375,
+ 2521085.5,
+ 3249326.75,
+ 2890642.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010854896390810609,
+ 0.0006957638543099165,
+ 0.0006896257400512695,
+ 0.0006964386557228863,
+ 0.0006897017010487616
+ ],
+ "acc_eval": 0.234375,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 6413.91357421875,
+ 1083474.5,
+ 2597945.5,
+ 3348271.5,
+ 2981405.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00098806235473603,
+ 0.000719150179065764,
+ 0.0007170068565756083,
+ 0.0007178731029853225,
+ 0.0007173708290793002
+ ],
+ "acc_eval": 0.205078125,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 6406.4228515625,
+ 1124429.875,
+ 2675529.5,
+ 3447474.25,
+ 3073241.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001149638439528644,
+ 0.0007225789595395327,
+ 0.0007212197524495423,
+ 0.0007210947806015611,
+ 0.0007211659685708582
+ ],
+ "acc_eval": 0.1494140625,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 6443.423828125,
+ 1166184.375,
+ 2758561.25,
+ 3551879.75,
+ 3171214.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001115654013119638,
+ 0.000685695675201714,
+ 0.0006846366450190544,
+ 0.0006861463189125061,
+ 0.0006862673326395452
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 6477.5,
+ 1208826.0,
+ 2842194.75,
+ 3654862.0,
+ 3267617.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000923235435038805,
+ 0.0006659153732471168,
+ 0.0006642267107963562,
+ 0.0006722065154463053,
+ 0.000664416525978595
+ ],
+ "acc_eval": 0.2353515625,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 6486.1689453125,
+ 1249377.0,
+ 2928293.75,
+ 3765881.75,
+ 3370835.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008846685523167253,
+ 0.0006866253679618239,
+ 0.000686973100528121,
+ 0.0006869880016893148,
+ 0.0006870955694466829
+ ],
+ "acc_eval": 0.2373046875,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 6499.3720703125,
+ 1291233.25,
+ 3012714.75,
+ 3873429.75,
+ 3471234.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009820004925131798,
+ 0.0007174524944275618,
+ 0.0007178467349149287,
+ 0.0007176626822911203,
+ 0.0007174718775786459
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 6486.14404296875,
+ 1327247.75,
+ 3088322.75,
+ 3971415.75,
+ 3562299.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010241338750347495,
+ 0.0007171124452725053,
+ 0.0007174332858994603,
+ 0.0007172181503847241,
+ 0.0007169945747591555
+ ],
+ "acc_eval": 0.18359375,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 6455.17236328125,
+ 1355067.375,
+ 3142698.25,
+ 4041006.5,
+ 3627490.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009781530825421214,
+ 0.0007034538430161774,
+ 0.000703376077581197,
+ 0.0007118352805264294,
+ 0.0007080681971274316
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 6454.62841796875,
+ 1384795.75,
+ 3199654.0,
+ 4114095.75,
+ 3696468.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009227422997355461,
+ 0.0007023688522167504,
+ 0.0007012909045442939,
+ 0.0007004260551184416,
+ 0.0007006779196672142
+ ],
+ "acc_eval": 0.21484375,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 6451.345703125,
+ 1420232.75,
+ 3260116.5,
+ 4190244.25,
+ 3768354.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008870494784787297,
+ 0.0007146014831960201,
+ 0.0007149986922740936,
+ 0.0007148014265112579,
+ 0.0007145918207243085
+ ],
+ "acc_eval": 0.197265625,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 6445.890625,
+ 1448264.875,
+ 3319505.0,
+ 4267505.0,
+ 3840047.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010003555798903108,
+ 0.0007171350298449397,
+ 0.0007168895681388676,
+ 0.0007169176824390888,
+ 0.0007170233875513077
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 6440.8212890625,
+ 1478082.75,
+ 3376291.25,
+ 4340727.0,
+ 3909334.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009646597318351269,
+ 0.0007130720769055188,
+ 0.0007134011830203235,
+ 0.0007131980964913964,
+ 0.0007129770237952471
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 6398.03955078125,
+ 1508487.5,
+ 3436526.25,
+ 4417271.5,
+ 3981251.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009445869363844395,
+ 0.0007122856914065778,
+ 0.0007126569980755448,
+ 0.0007124742260202765,
+ 0.0007122504175640643
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 6389.02392578125,
+ 1530834.625,
+ 3480246.5,
+ 4471170.0,
+ 4032576.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009853171650320292,
+ 0.0006874292739666998,
+ 0.0006876476109027863,
+ 0.0006881517474539578,
+ 0.0006880395230837166
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 6338.54443359375,
+ 1561198.875,
+ 3541681.5,
+ 4548099.0,
+ 4105499.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009333671187050641,
+ 0.0006952910916879773,
+ 0.0006947650690563023,
+ 0.0006940987077541649,
+ 0.0006943742628209293
+ ],
+ "acc_eval": 0.23046875,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 6280.18603515625,
+ 1585008.0,
+ 3589125.25,
+ 4608667.0,
+ 4162480.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009699579677544534,
+ 0.0007101434166543186,
+ 0.0007104446412995458,
+ 0.000710242718923837,
+ 0.0007100136135704815
+ ],
+ "acc_eval": 0.146484375,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 6252.455078125,
+ 1608187.875,
+ 3635014.75,
+ 4667478.5,
+ 4218253.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008955001248978078,
+ 0.0006863236776553094,
+ 0.0006864941096864641,
+ 0.000687020889017731,
+ 0.0006868807831779122
+ ],
+ "acc_eval": 0.2431640625,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 6201.6845703125,
+ 1619508.875,
+ 3661275.25,
+ 4700652.0,
+ 4249921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009069991065189242,
+ 0.0006539999740198255,
+ 0.0006531713879667222,
+ 0.0006594359292648733,
+ 0.000653320224955678
+ ],
+ "acc_eval": 0.2216796875,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 6182.8115234375,
+ 1632587.875,
+ 3679586.25,
+ 4722070.5,
+ 4271567.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009595821611583233,
+ 0.0007079984061419964,
+ 0.0007082773372530937,
+ 0.0007081056828610599,
+ 0.000707884959410876
+ ],
+ "acc_eval": 0.193359375,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 6153.7392578125,
+ 1653576.875,
+ 3722935.0,
+ 4776921.0,
+ 4323508.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008598894928582013,
+ 0.0007073319284245372,
+ 0.0007075938628986478,
+ 0.0007074539898894727,
+ 0.0007072555599734187
+ ],
+ "acc_eval": 0.201171875,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 6135.21240234375,
+ 1667474.375,
+ 3750912.75,
+ 4812450.5,
+ 4357575.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009454588289372623,
+ 0.0007068001432344317,
+ 0.0007069715647958219,
+ 0.0007067638216540217,
+ 0.0007065933896228671
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 6085.7109375,
+ 1679251.75,
+ 3774334.5,
+ 4840148.5,
+ 4384792.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008410231093876064,
+ 0.0006843701121397316,
+ 0.0006845371681265533,
+ 0.00068506138632074,
+ 0.0006849151104688644
+ ],
+ "acc_eval": 0.2578125,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 6042.693359375,
+ 1685705.5,
+ 3787479.75,
+ 4856211.0,
+ 4400193.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008572259685024619,
+ 0.0006840305286459625,
+ 0.0006841861759312451,
+ 0.0006847094628028572,
+ 0.0006845552125014365
+ ],
+ "acc_eval": 0.2568359375,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 6003.5390625,
+ 1702685.5,
+ 3813174.5,
+ 4888481.0,
+ 4430612.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008342780056409538,
+ 0.0006777377566322684,
+ 0.0006779460818506777,
+ 0.0006789933540858328,
+ 0.0006781259435229003
+ ],
+ "acc_eval": 0.2685546875,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 5948.60107421875,
+ 1714243.125,
+ 3830846.5,
+ 4910337.5,
+ 4451921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008218465954996645,
+ 0.0006832804065197706,
+ 0.0006831764476373792,
+ 0.0006826326716691256,
+ 0.0006829035119153559
+ ],
+ "acc_eval": 0.2529296875,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 5881.8525390625,
+ 1718113.375,
+ 3838036.5,
+ 4920025.5,
+ 4461931.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007958809728734195,
+ 0.000677398347761482,
+ 0.0006775528891012073,
+ 0.0006775871734134853,
+ 0.0006777321686968207
+ ],
+ "acc_eval": 0.2548828125,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 5816.7880859375,
+ 1723461.25,
+ 3850904.75,
+ 4936806.0,
+ 4478473.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008361428044736385,
+ 0.0006769691244699061,
+ 0.0006771331536583602,
+ 0.0006771665066480637,
+ 0.0006773129571229219
+ ],
+ "acc_eval": 0.251953125,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 5760.41845703125,
+ 1732135.25,
+ 3859576.0,
+ 4947171.0,
+ 4488986.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008036325452849269,
+ 0.0006821549613960087,
+ 0.0006806753808632493,
+ 0.0006799713592045009,
+ 0.0006802318384870887
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 5710.22998046875,
+ 1740014.25,
+ 3871992.25,
+ 4962337.5,
+ 4503463.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008278922759927809,
+ 0.0006754198693670332,
+ 0.000675307004712522,
+ 0.0006768241291865706,
+ 0.0006769676692783833
+ ],
+ "acc_eval": 0.26171875,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 5685.73828125,
+ 1745863.25,
+ 3880256.75,
+ 4973639.5,
+ 4514457.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008255501161329448,
+ 0.0006466225022450089,
+ 0.0006466452032327652,
+ 0.0006467151688411832,
+ 0.0006467655766755342
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 5637.498046875,
+ 1743128.375,
+ 3879796.5,
+ 4973009.0,
+ 4514424.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008148956694640219,
+ 0.0006465681362897158,
+ 0.0006463592289946973,
+ 0.0006491504609584808,
+ 0.0006464755861088634
+ ],
+ "acc_eval": 0.2587890625,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 5601.87744140625,
+ 1741859.375,
+ 3884447.75,
+ 4978445.5,
+ 4518886.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008254973217844963,
+ 0.0006783050484955311,
+ 0.0006774527719244361,
+ 0.0006768335006199777,
+ 0.0006770920008420944
+ ],
+ "acc_eval": 0.298828125,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 5587.505859375,
+ 1748285.875,
+ 3887730.5,
+ 4982144.0,
+ 4523151.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008113561780191958,
+ 0.0006764904828742146,
+ 0.000676542054861784,
+ 0.0006762324483133852,
+ 0.0006764894351363182
+ ],
+ "acc_eval": 0.2734375,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 5553.013671875,
+ 1748456.75,
+ 3890722.0,
+ 4986538.5,
+ 4527315.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007909060223028064,
+ 0.0006763285491615534,
+ 0.0006762049742974341,
+ 0.0006756742368452251,
+ 0.000675930583383888
+ ],
+ "acc_eval": 0.2861328125,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 5524.611328125,
+ 1748210.0,
+ 3893003.75,
+ 4989732.5,
+ 4530436.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000797618820797652,
+ 0.0006453269743360579,
+ 0.0006453663809224963,
+ 0.0006454290705733001,
+ 0.0006454723770730197
+ ],
+ "acc_eval": 0.28515625,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 5506.21923828125,
+ 1750958.0,
+ 3894639.5,
+ 4992073.0,
+ 4532399.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007834367570467293,
+ 0.0006762953125871718,
+ 0.0006754640489816666,
+ 0.0006748714949935675,
+ 0.0006751226610504091
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 5485.10791015625,
+ 1747546.25,
+ 3895030.0,
+ 4992480.5,
+ 4532805.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007779909064993262,
+ 0.0006450997898355126,
+ 0.0006451247027143836,
+ 0.0006455867551267147,
+ 0.0006452234229072928
+ ],
+ "acc_eval": 0.2890625,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 5464.07763671875,
+ 1749313.125,
+ 3894610.75,
+ 4991684.0,
+ 4532270.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008090221090242267,
+ 0.0006661301013082266,
+ 0.0006646219990216196,
+ 0.0006726695573888719,
+ 0.0006649038987234235
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 5451.2841796875,
+ 1749389.0,
+ 3894315.25,
+ 4990837.5,
+ 4531011.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007907215040177107,
+ 0.0006448677740991116,
+ 0.0006448915228247643,
+ 0.0006451430963352323,
+ 0.0006449950742535293
+ ],
+ "acc_eval": 0.2958984375,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 5437.77099609375,
+ 1750653.125,
+ 3895251.75,
+ 4992303.0,
+ 4532441.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007774807745590806,
+ 0.000676269584801048,
+ 0.0006763145211152732,
+ 0.0006763775018043816,
+ 0.000676501716952771
+ ],
+ "acc_eval": 0.2763671875,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 5427.34619140625,
+ 1751408.875,
+ 3894547.75,
+ 4991554.5,
+ 4532145.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797307334840298,
+ 0.000664835621137172,
+ 0.0006642266525886953,
+ 0.000671364541631192,
+ 0.0006645115208812058
+ ],
+ "acc_eval": 0.296875,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 5420.30615234375,
+ 1751757.5,
+ 3894027.5,
+ 4991042.0,
+ 4531674.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797667058184743,
+ 0.0006446840125136077,
+ 0.0006447113119065762,
+ 0.0006447701598517597,
+ 0.0006448116037063301
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 5416.81396484375,
+ 1751629.625,
+ 3893959.25,
+ 4991021.5,
+ 4531639.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007706825854256749,
+ 0.0006446407060138881,
+ 0.0006406756583601236,
+ 0.0006447536870837212,
+ 0.0006393496878445148
+ ],
+ "acc_eval": 0.306640625,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 5415.3095703125,
+ 1751552.75,
+ 3893897.0,
+ 4990973.0,
+ 4531587.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007776900893077254,
+ 0.0006458400748670101,
+ 0.0006446869228966534,
+ 0.0006466003833338618,
+ 0.0006447876221500337
+ ],
+ "acc_eval": 0.2978515625,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 5414.92822265625,
+ 1751530.25,
+ 3893876.5,
+ 4990954.0,
+ 4531568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007761479937471449,
+ 0.0006465426995418966,
+ 0.0006446881452575326,
+ 0.0006466349004767835,
+ 0.0006447875639423728
+ ],
+ "acc_eval": 0.294921875,
+ "epoch": 100
+ }
+ ],
+ "arch": "resmlp_noln",
+ "seed": 42
+} \ No newline at end of file
diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s123.json b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json
new file mode 100644
index 0000000..f3f6392
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json
@@ -0,0 +1,4766 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_no_outln_v1",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 123,
+ "depth": 4,
+ "d_hidden": 256
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "architecture": "ResidualMLP_NoOutLN",
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.690464973449707,
+ 8.719978332519531,
+ 8.73093318939209,
+ 8.75937271118164,
+ 8.790542602539062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005465824506245553,
+ 0.0005437708459794521,
+ 0.0005393712199293077,
+ 0.0005331890424713492,
+ 0.0005310169071890414
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.1015625,
+ "loss_eval": 2.3754236698150635,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 40.83987808227539,
+ 37.75401306152344,
+ 36.1661376953125,
+ 34.91564178466797,
+ 34.55687713623047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012231437722221017,
+ 0.00012846711615566164,
+ 0.00013815351121593267,
+ 0.00015655385504942387,
+ 0.0002070761693175882
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.435546875,
+ "loss_eval": 1.5918896198272705,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 54.60358810424805,
+ 49.46598434448242,
+ 46.75371170043945,
+ 44.21198272705078,
+ 42.52875900268555
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010624218703014776,
+ 0.00011056899529648945,
+ 0.0001174700737465173,
+ 0.00012732982577290386,
+ 0.00015480577712878585
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4755859375,
+ "loss_eval": 1.464656114578247,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 65.05919647216797,
+ 58.81830596923828,
+ 54.65021896362305,
+ 50.87609100341797,
+ 48.61247253417969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.24510313780047e-05,
+ 9.810000483412296e-05,
+ 0.00010529180872254074,
+ 0.00011547923350008205,
+ 0.00013095361646264791
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.509765625,
+ "loss_eval": 1.4144818782806396,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 71.89185333251953,
+ 63.81675338745117,
+ 58.61539077758789,
+ 53.633819580078125,
+ 50.85374450683594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.624486119719222e-05,
+ 0.00010101673979079351,
+ 0.00010665278387023136,
+ 0.00011629729851847515,
+ 0.0001258883421542123
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5009765625,
+ "loss_eval": 1.4042909145355225,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 77.86115264892578,
+ 68.96236419677734,
+ 62.764793395996094,
+ 56.297122955322266,
+ 51.927825927734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.636285201646388e-05,
+ 9.12561226869002e-05,
+ 9.721348760649562e-05,
+ 0.0001029788691084832,
+ 0.00010866572119994089
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5048828125,
+ "loss_eval": 1.362424373626709,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 86.97894287109375,
+ 76.51913452148438,
+ 68.91358947753906,
+ 61.691619873046875,
+ 55.97148132324219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.555527165299281e-05,
+ 9.211624274030328e-05,
+ 9.770254109753296e-05,
+ 0.00010545850091148168,
+ 0.00011015798372682184
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4990234375,
+ "loss_eval": 1.4210331439971924,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 91.98681640625,
+ 80.48826599121094,
+ 72.19147491455078,
+ 63.2117919921875,
+ 57.618526458740234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.108472684398293e-05,
+ 8.69045325089246e-05,
+ 9.184813097817823e-05,
+ 9.785865404410288e-05,
+ 0.00010359002772020176
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.50390625,
+ "loss_eval": 1.395978569984436,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 97.7012939453125,
+ 84.81765747070312,
+ 75.55701446533203,
+ 65.7588119506836,
+ 58.28969955444336
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.22104630060494e-05,
+ 8.808301208773628e-05,
+ 9.288280853070319e-05,
+ 0.0001000006013782695,
+ 0.00010321019362891093
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.525390625,
+ "loss_eval": 1.3341916799545288,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 102.29643249511719,
+ 88.3180923461914,
+ 78.02013397216797,
+ 67.14125061035156,
+ 59.45139694213867
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.297000749735162e-05,
+ 8.909840107662603e-05,
+ 9.493192192167044e-05,
+ 0.00010043827933259308,
+ 0.00010197651863563806
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5166015625,
+ "loss_eval": 1.3378056287765503,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 107.60400390625,
+ 93.19139862060547,
+ 81.3952407836914,
+ 70.16273498535156,
+ 61.15400314331055
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.625297439517453e-05,
+ 8.249503298429772e-05,
+ 8.778223127592355e-05,
+ 9.526272333459929e-05,
+ 9.708418656373397e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.54296875,
+ "loss_eval": 1.3057411909103394,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 111.52012634277344,
+ 95.61714935302734,
+ 83.3553695678711,
+ 70.52283477783203,
+ 61.52479553222656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.589814777020365e-05,
+ 8.213706314563751e-05,
+ 8.74441975611262e-05,
+ 9.462270099902526e-05,
+ 9.573540592100471e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5400390625,
+ "loss_eval": 1.2877662181854248,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 116.06771850585938,
+ 99.79177856445312,
+ 86.30980682373047,
+ 72.20254516601562,
+ 62.78416442871094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.193555939011276e-05,
+ 7.673310028621927e-05,
+ 8.175434049917385e-05,
+ 8.827414421830326e-05,
+ 9.135493019130081e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5478515625,
+ "loss_eval": 1.2685296535491943,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 119.3271484375,
+ 102.65406799316406,
+ 88.69587707519531,
+ 74.90689849853516,
+ 63.780494689941406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.618113158969209e-05,
+ 8.220612653531134e-05,
+ 8.806472760625184e-05,
+ 9.463543392485008e-05,
+ 9.703192336019129e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.54296875,
+ "loss_eval": 1.276496410369873,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 123.31849670410156,
+ 105.7769775390625,
+ 90.95068359375,
+ 76.97051239013672,
+ 64.97062683105469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.194027421064675e-05,
+ 7.883367652539164e-05,
+ 8.381865336559713e-05,
+ 9.018390846904367e-05,
+ 8.924194844439626e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.552734375,
+ "loss_eval": 1.2604155540466309,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 127.73625946044922,
+ 109.2970199584961,
+ 94.82887268066406,
+ 79.42200469970703,
+ 66.68120574951172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.26957805454731e-05,
+ 7.816226570867002e-05,
+ 8.386534318560734e-05,
+ 9.044967737281695e-05,
+ 9.091151150641963e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.55859375,
+ "loss_eval": 1.2421667575836182,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 129.39227294921875,
+ 110.16195678710938,
+ 95.65125274658203,
+ 79.63654327392578,
+ 66.4422836303711
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.170928438426927e-05,
+ 7.703503069933504e-05,
+ 8.211386011680588e-05,
+ 8.873116166796535e-05,
+ 9.066827624337748e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615234375,
+ "loss_eval": 1.2539770603179932,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 132.24916076660156,
+ 113.025634765625,
+ 96.19522857666016,
+ 80.5164566040039,
+ 67.23816680908203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.194816862465814e-05,
+ 7.835567521397024e-05,
+ 8.341929060406983e-05,
+ 8.761802746448666e-05,
+ 8.926806913223118e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5732421875,
+ "loss_eval": 1.2596629858016968,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 136.37730407714844,
+ 116.11273956298828,
+ 98.82146453857422,
+ 81.83920288085938,
+ 67.72627258300781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.331569941015914e-05,
+ 7.95917512732558e-05,
+ 8.647916547488421e-05,
+ 9.198131010634825e-05,
+ 9.28269510040991e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.53515625,
+ "loss_eval": 1.2714436054229736,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 137.7354736328125,
+ 119.1905288696289,
+ 102.62776184082031,
+ 84.3735580444336,
+ 69.55421447753906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.105377881089225e-05,
+ 7.70094629842788e-05,
+ 8.26972391223535e-05,
+ 8.802180673228577e-05,
+ 8.82365129655227e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5498046875,
+ "loss_eval": 1.25264310836792,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 139.01124572753906,
+ 119.05533599853516,
+ 101.28179168701172,
+ 83.50191497802734,
+ 68.7996826171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.610249303979799e-05,
+ 8.31697034300305e-05,
+ 8.997280383482575e-05,
+ 9.514019620837644e-05,
+ 9.370686893817037e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.517578125,
+ "loss_eval": 1.2884626388549805,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 142.8061981201172,
+ 121.41246795654297,
+ 104.47654724121094,
+ 86.13514709472656,
+ 70.62234497070312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.287831977009773e-05,
+ 7.990973244886845e-05,
+ 8.473258640151471e-05,
+ 9.054663678398356e-05,
+ 9.23949119169265e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5498046875,
+ "loss_eval": 1.2458946704864502,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 145.03463745117188,
+ 124.42599487304688,
+ 105.64387512207031,
+ 87.60891723632812,
+ 71.11911010742188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.878219573991373e-05,
+ 7.463164365617558e-05,
+ 7.942628144519404e-05,
+ 8.418951620114967e-05,
+ 8.709819667274132e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5654296875,
+ "loss_eval": 1.2031928300857544,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 145.368896484375,
+ 124.08200073242188,
+ 106.14088439941406,
+ 87.3053970336914,
+ 70.22563171386719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.987902452237904e-05,
+ 7.564797124359757e-05,
+ 8.058137609623373e-05,
+ 8.513103239238262e-05,
+ 8.664488268550485e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5830078125,
+ "loss_eval": 1.2048817873001099,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 149.82542419433594,
+ 127.8211898803711,
+ 109.31559753417969,
+ 88.96003723144531,
+ 71.56672668457031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.123420073185116e-05,
+ 7.683804142288864e-05,
+ 8.418370271101594e-05,
+ 8.922854613047093e-05,
+ 8.777298353379592e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5654296875,
+ "loss_eval": 1.2408947944641113,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 151.1898193359375,
+ 128.61166381835938,
+ 110.0819320678711,
+ 89.33537292480469,
+ 70.91573333740234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.046251994324848e-05,
+ 7.593455666210502e-05,
+ 8.183503086911514e-05,
+ 8.78809587447904e-05,
+ 8.738410542719066e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5849609375,
+ "loss_eval": 1.2345162630081177,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 153.0899200439453,
+ 130.6381072998047,
+ 110.78546905517578,
+ 90.43073272705078,
+ 72.28581237792969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.224789442261681e-05,
+ 7.864048529881984e-05,
+ 8.493732457282022e-05,
+ 9.218508785124868e-05,
+ 9.127514931606129e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.548828125,
+ "loss_eval": 1.234302282333374,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 156.78964233398438,
+ 132.35365295410156,
+ 114.26016998291016,
+ 93.03483581542969,
+ 73.8830337524414
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.004363578744233e-05,
+ 7.51781408325769e-05,
+ 8.189951768144965e-05,
+ 8.64862377056852e-05,
+ 8.457603689748794e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.572265625,
+ "loss_eval": 1.226435661315918,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 154.7094268798828,
+ 132.68295288085938,
+ 112.78950500488281,
+ 91.68452453613281,
+ 72.69532012939453
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.871543155284598e-05,
+ 7.408537931041792e-05,
+ 7.912247383501381e-05,
+ 8.584219176555052e-05,
+ 8.712658018339425e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5693359375,
+ "loss_eval": 1.186962604522705,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 156.5343475341797,
+ 133.95303344726562,
+ 113.44208526611328,
+ 91.55599212646484,
+ 72.66578674316406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.697547360090539e-05,
+ 7.314077083719894e-05,
+ 7.949489372549579e-05,
+ 8.466470171697438e-05,
+ 8.366732799913734e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.595703125,
+ "loss_eval": 1.1845954656600952,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 158.63601684570312,
+ 134.8338165283203,
+ 115.27066802978516,
+ 93.78146362304688,
+ 72.8468017578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.742558616679162e-05,
+ 7.408189412672073e-05,
+ 7.9598423326388e-05,
+ 8.415436604991555e-05,
+ 8.754149166634306e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5693359375,
+ "loss_eval": 1.208282470703125,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 158.21023559570312,
+ 136.07545471191406,
+ 116.15364837646484,
+ 93.98001098632812,
+ 73.68004608154297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.207741873571649e-05,
+ 7.860636833356693e-05,
+ 8.520736446371302e-05,
+ 9.168307587970048e-05,
+ 8.956313104135916e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.2018094062805176,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 160.46771240234375,
+ 136.1265411376953,
+ 116.0124282836914,
+ 93.3584976196289,
+ 73.7890396118164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.191704207798466e-05,
+ 7.717879634583369e-05,
+ 8.299856563098729e-05,
+ 8.967710164142773e-05,
+ 8.699094178155065e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5810546875,
+ "loss_eval": 1.1889103651046753,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 160.90545654296875,
+ 137.0214080810547,
+ 115.83223724365234,
+ 94.28914642333984,
+ 73.96448516845703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.10546228219755e-05,
+ 7.790922973072156e-05,
+ 8.321165660163388e-05,
+ 8.87274945853278e-05,
+ 8.640237501822412e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.1516971588134766,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 163.9844207763672,
+ 138.9420166015625,
+ 118.25187683105469,
+ 94.9247817993164,
+ 73.99342346191406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.05249622114934e-05,
+ 7.705103053012863e-05,
+ 8.39303684188053e-05,
+ 8.84484761627391e-05,
+ 8.569705096306279e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1713684797286987,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 162.2567596435547,
+ 139.536376953125,
+ 118.07953643798828,
+ 96.10607147216797,
+ 75.22054290771484
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.98907533660531e-05,
+ 7.564698171336204e-05,
+ 8.246934885391966e-05,
+ 8.673300180817023e-05,
+ 8.65447727846913e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5869140625,
+ "loss_eval": 1.1986680030822754,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 163.85494995117188,
+ 140.6683807373047,
+ 120.20167541503906,
+ 96.79766845703125,
+ 74.6565933227539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.933045369805768e-05,
+ 7.555640331702307e-05,
+ 8.187161438399926e-05,
+ 8.634777623228729e-05,
+ 8.516138041159138e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.58203125,
+ "loss_eval": 1.17092764377594,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 163.91464233398438,
+ 141.8627166748047,
+ 120.35345458984375,
+ 96.861083984375,
+ 74.91275024414062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.821981514804065e-05,
+ 7.462653593393043e-05,
+ 7.9863122664392e-05,
+ 8.513165812473744e-05,
+ 8.408474968746305e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1603121757507324,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 166.6566162109375,
+ 142.48072814941406,
+ 120.16492462158203,
+ 96.4870376586914,
+ 75.0911636352539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.862134614493698e-05,
+ 7.509759598178789e-05,
+ 8.221028838306665e-05,
+ 8.709747635293752e-05,
+ 8.625433838460594e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.163398027420044,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 165.2766571044922,
+ 140.6273193359375,
+ 119.01939392089844,
+ 96.45698547363281,
+ 74.86931610107422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.741421384504065e-05,
+ 7.467559044016525e-05,
+ 8.113843068713322e-05,
+ 8.498551324009895e-05,
+ 8.365403482457623e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1174335479736328,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 166.8720703125,
+ 141.94195556640625,
+ 119.73834228515625,
+ 96.83306884765625,
+ 75.50749206542969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.83375183143653e-05,
+ 7.506174733862281e-05,
+ 8.1863887317013e-05,
+ 8.717682067072019e-05,
+ 8.521847485098988e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.128427267074585,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 166.10345458984375,
+ 140.8309783935547,
+ 119.59312438964844,
+ 96.5144271850586,
+ 75.01549530029297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.117655331967399e-05,
+ 7.808134250808507e-05,
+ 8.549879566999152e-05,
+ 9.121275070356205e-05,
+ 8.961764251580462e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.1407405138015747,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 168.5572052001953,
+ 144.19313049316406,
+ 121.29338836669922,
+ 98.18904113769531,
+ 75.74433898925781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.024689693935215e-05,
+ 7.835906581021845e-05,
+ 8.28477568575181e-05,
+ 8.988843183033168e-05,
+ 9.142952330876142e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5791015625,
+ "loss_eval": 1.188612699508667,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 167.82464599609375,
+ 142.2963104248047,
+ 120.96216583251953,
+ 98.01409149169922,
+ 76.0032730102539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.296045077964664e-05,
+ 7.839543832233176e-05,
+ 8.31817596917972e-05,
+ 9.021619916893542e-05,
+ 8.68452261784114e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.60546875,
+ "loss_eval": 1.1675610542297363,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 168.66015625,
+ 143.3383026123047,
+ 121.46915435791016,
+ 97.43902587890625,
+ 75.26473236083984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.207799353636801e-05,
+ 8.018259541131556e-05,
+ 8.563740993849933e-05,
+ 9.22580948099494e-05,
+ 9.03013497008942e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1672401428222656,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 168.55662536621094,
+ 142.82704162597656,
+ 120.73102569580078,
+ 96.30245971679688,
+ 74.20568084716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.172006007749587e-05,
+ 7.97949469415471e-05,
+ 8.564699237467721e-05,
+ 9.092836262425408e-05,
+ 9.031151421368122e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1739519834518433,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 169.05859375,
+ 143.376953125,
+ 122.22779083251953,
+ 98.1865234375,
+ 75.46460723876953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.164492853917181e-05,
+ 8.059864194365218e-05,
+ 8.811463339952752e-05,
+ 9.420064452569932e-05,
+ 9.068247891264036e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5869140625,
+ "loss_eval": 1.1654919385910034,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 167.85174560546875,
+ 143.98324584960938,
+ 121.09931945800781,
+ 97.61621856689453,
+ 75.3441390991211
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.121654198272154e-05,
+ 7.876066229073331e-05,
+ 8.58678831718862e-05,
+ 9.374372893944383e-05,
+ 8.886006980901584e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.1619040966033936,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 169.16136169433594,
+ 144.1681671142578,
+ 121.65021514892578,
+ 97.65489959716797,
+ 75.40325927734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.085441029630601e-05,
+ 7.872789865359664e-05,
+ 8.54654426802881e-05,
+ 9.159239561995491e-05,
+ 8.735150913707912e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.60546875,
+ "loss_eval": 1.1553215980529785,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 170.07469177246094,
+ 144.21502685546875,
+ 122.42488098144531,
+ 97.60433959960938,
+ 75.30228424072266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.460799679392949e-05,
+ 8.310206612804905e-05,
+ 8.914316276786849e-05,
+ 9.709167352411896e-05,
+ 9.34089912334457e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5947265625,
+ "loss_eval": 1.1511603593826294,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 169.58541870117188,
+ 143.38230895996094,
+ 121.96705627441406,
+ 97.77040100097656,
+ 74.732177734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.605904102092609e-05,
+ 8.306169183924794e-05,
+ 9.093777771340683e-05,
+ 9.604891965864226e-05,
+ 9.101478644879535e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.583984375,
+ "loss_eval": 1.150202751159668,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 169.28955078125,
+ 143.6193084716797,
+ 122.43891906738281,
+ 97.91162109375,
+ 75.27656555175781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.325071055674925e-05,
+ 8.037279621930793e-05,
+ 8.85110639501363e-05,
+ 9.169802797259763e-05,
+ 8.926681766752154e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.1172325611114502,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 170.01052856445312,
+ 143.45779418945312,
+ 122.65426635742188,
+ 98.24798583984375,
+ 75.68919372558594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.252323121065274e-05,
+ 8.011860336409882e-05,
+ 8.620596781838685e-05,
+ 9.34487470658496e-05,
+ 9.04093321878463e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1147592067718506,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 168.67430114746094,
+ 143.25802612304688,
+ 119.88789367675781,
+ 96.92530822753906,
+ 74.42180633544922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.410924445139244e-05,
+ 8.137265831464902e-05,
+ 8.864435949362814e-05,
+ 9.472777310293168e-05,
+ 9.015527029987425e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.625,
+ "loss_eval": 1.1209393739700317,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 169.25973510742188,
+ 142.8248291015625,
+ 120.75433349609375,
+ 96.85049438476562,
+ 74.96371459960938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.351540989475325e-05,
+ 8.063198038144037e-05,
+ 8.647661161376163e-05,
+ 9.411892096977681e-05,
+ 9.352037159260362e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1025673151016235,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 170.8097381591797,
+ 143.562744140625,
+ 121.1410903930664,
+ 97.70262145996094,
+ 75.55540466308594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.382583135040477e-05,
+ 8.104312291834503e-05,
+ 8.895712380763143e-05,
+ 9.191031131194904e-05,
+ 8.924967551138252e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1013734340667725,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 169.41827392578125,
+ 143.60491943359375,
+ 119.79347229003906,
+ 96.5761947631836,
+ 74.94788360595703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.506331166950986e-05,
+ 8.308376709464937e-05,
+ 9.05599954421632e-05,
+ 9.552844858262688e-05,
+ 9.322594269178808e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1202704906463623,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 169.0540008544922,
+ 144.03970336914062,
+ 121.87033081054688,
+ 98.80317687988281,
+ 76.42084503173828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.446128438459709e-05,
+ 8.153915405273438e-05,
+ 8.840708323987201e-05,
+ 9.388235048390925e-05,
+ 9.186066017718986e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.1205706596374512,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 168.36595153808594,
+ 141.80178833007812,
+ 120.2418212890625,
+ 96.8748779296875,
+ 75.01248168945312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.731275400146842e-05,
+ 8.405288099311292e-05,
+ 9.186116949422285e-05,
+ 9.942329052137211e-05,
+ 9.51286856434308e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1108977794647217,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 169.39569091796875,
+ 142.4537353515625,
+ 120.81804656982422,
+ 97.19158172607422,
+ 75.20236206054688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.883378566475585e-05,
+ 8.777670154813677e-05,
+ 9.416328248335049e-05,
+ 0.00010057339386548847,
+ 9.685986879048869e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1141078472137451,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 169.97256469726562,
+ 143.7432098388672,
+ 121.0943832397461,
+ 97.53318786621094,
+ 75.44910430908203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.617164374096319e-05,
+ 8.471525507047772e-05,
+ 9.014597890200093e-05,
+ 9.796666563488543e-05,
+ 9.110565588343889e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.0869580507278442,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 168.3030242919922,
+ 142.93931579589844,
+ 120.8933334350586,
+ 97.99317932128906,
+ 75.29071044921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.692870713071898e-05,
+ 8.63347522681579e-05,
+ 9.28592708078213e-05,
+ 9.994371794164181e-05,
+ 9.114396380027756e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6357421875,
+ "loss_eval": 1.102014183998108,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 168.24777221679688,
+ 142.03550720214844,
+ 120.25982666015625,
+ 97.82561492919922,
+ 75.54430389404297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.734074461041018e-05,
+ 8.487069862894714e-05,
+ 9.25088970689103e-05,
+ 9.827558096731082e-05,
+ 9.154371218755841e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.642578125,
+ "loss_eval": 1.0736993551254272,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 168.08807373046875,
+ 142.24661254882812,
+ 119.9559555053711,
+ 96.72630310058594,
+ 74.6895523071289
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.049221651162952e-05,
+ 8.925019210437313e-05,
+ 9.64810824370943e-05,
+ 0.00010555233166087419,
+ 9.567404049448669e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6328125,
+ "loss_eval": 1.0822858810424805,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 167.2539825439453,
+ 141.55946350097656,
+ 119.37681579589844,
+ 97.13011169433594,
+ 75.02286529541016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.919344352558255e-05,
+ 8.567116310587153e-05,
+ 9.377488458994776e-05,
+ 9.892786329146475e-05,
+ 9.566175140207633e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6328125,
+ "loss_eval": 1.1096018552780151,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 168.11643981933594,
+ 142.01052856445312,
+ 119.23418426513672,
+ 96.38211059570312,
+ 75.08849334716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.787172216922045e-05,
+ 8.574797539040446e-05,
+ 9.008680353872478e-05,
+ 9.943459735950455e-05,
+ 9.4872091722209e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6455078125,
+ "loss_eval": 1.1080338954925537,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 168.09153747558594,
+ 141.83984375,
+ 120.16891479492188,
+ 97.12582397460938,
+ 74.98177337646484
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.894716691225767e-05,
+ 8.66493719513528e-05,
+ 9.518097795080394e-05,
+ 0.00010154353367397562,
+ 9.530662646284327e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.1069355010986328,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 167.35382080078125,
+ 142.33642578125,
+ 120.0411148071289,
+ 96.53257751464844,
+ 75.0328598022461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.973265019245446e-05,
+ 8.856245403876528e-05,
+ 9.601243800716475e-05,
+ 0.00010215263318968937,
+ 9.676075569586828e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.63671875,
+ "loss_eval": 1.100548505783081,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 167.418701171875,
+ 140.93800354003906,
+ 119.4802017211914,
+ 96.3717269897461,
+ 74.67574310302734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.022025576792657e-05,
+ 8.782520308159292e-05,
+ 9.638317715143785e-05,
+ 0.0001046421384671703,
+ 9.856691031018272e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.63671875,
+ "loss_eval": 1.1227837800979614,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 166.9136962890625,
+ 140.45266723632812,
+ 119.06848907470703,
+ 95.9060287475586,
+ 74.79631042480469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.995362102519721e-05,
+ 8.583935414208099e-05,
+ 9.508246148470789e-05,
+ 0.00010096231562783942,
+ 9.634289017412812e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6416015625,
+ "loss_eval": 1.1006299257278442,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 165.4694366455078,
+ 139.69601440429688,
+ 117.53054809570312,
+ 95.05348205566406,
+ 74.65673065185547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.79753245296888e-05,
+ 8.487935701850802e-05,
+ 9.169900295091793e-05,
+ 9.879520075628534e-05,
+ 9.398034308105707e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.0988688468933105,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 165.3974609375,
+ 139.54141235351562,
+ 117.3493881225586,
+ 94.9970474243164,
+ 74.31880187988281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.893131260061637e-05,
+ 8.71433803695254e-05,
+ 9.492320532444865e-05,
+ 0.00010128845315193757,
+ 9.578587196301669e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6484375,
+ "loss_eval": 1.0860004425048828,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 165.16651916503906,
+ 138.63233947753906,
+ 117.15692138671875,
+ 94.41555786132812,
+ 74.16561889648438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.611902012489736e-05,
+ 9.412867802893743e-05,
+ 0.0001005554513540119,
+ 0.00010507499246159568,
+ 0.00010004997602663934
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.0985480546951294,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 166.48802185058594,
+ 139.67433166503906,
+ 117.13744354248047,
+ 94.41883087158203,
+ 74.25392150878906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.272679406218231e-05,
+ 9.101553587242961e-05,
+ 9.994471474783495e-05,
+ 0.00010372102406108752,
+ 9.65072977123782e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.63671875,
+ "loss_eval": 1.1026251316070557,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 164.66531372070312,
+ 138.62359619140625,
+ 117.72949981689453,
+ 95.40411376953125,
+ 74.5541763305664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.516917296219617e-05,
+ 9.385120938532054e-05,
+ 0.00010402742918813601,
+ 0.00010775420378195122,
+ 0.00010169474262511358
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6298828125,
+ "loss_eval": 1.1083872318267822,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 164.67889404296875,
+ 138.3468017578125,
+ 116.61951446533203,
+ 93.94100952148438,
+ 74.09746551513672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.641117165097967e-05,
+ 9.53027411014773e-05,
+ 0.0001029834384098649,
+ 0.0001086485426640138,
+ 0.0001005055892164819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6455078125,
+ "loss_eval": 1.1155339479446411,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 164.2607421875,
+ 138.0647735595703,
+ 116.18480682373047,
+ 93.95038604736328,
+ 73.88935089111328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.567768963985145e-05,
+ 9.307480650022626e-05,
+ 9.939757728716359e-05,
+ 0.00010579575609881431,
+ 9.849719936028123e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.1126312017440796,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 163.9792938232422,
+ 137.88185119628906,
+ 116.34628295898438,
+ 93.93537139892578,
+ 73.83805084228516
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.795045869192109e-05,
+ 9.678495553089306e-05,
+ 0.00010362159082433209,
+ 0.0001105417322833091,
+ 0.00010525066318223253
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.110876202583313,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 164.1384735107422,
+ 137.82691955566406,
+ 115.94445037841797,
+ 94.01095581054688,
+ 73.68436431884766
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.610311488155276e-05,
+ 9.507987851975486e-05,
+ 0.00010208813182543963,
+ 0.00010807226499309763,
+ 0.00010176940850215033
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6318359375,
+ "loss_eval": 1.1176977157592773,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 163.91049194335938,
+ 136.9142608642578,
+ 115.37925720214844,
+ 93.2219009399414,
+ 73.2654800415039
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.745997183723375e-05,
+ 9.566589869791642e-05,
+ 0.00010251311323372647,
+ 0.00011129804624943063,
+ 0.0001056971013895236
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6318359375,
+ "loss_eval": 1.1140623092651367,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 163.40182495117188,
+ 137.21026611328125,
+ 115.46720123291016,
+ 93.46426391601562,
+ 73.12786102294922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.96864221431315e-05,
+ 9.8639284260571e-05,
+ 0.0001043426527758129,
+ 0.00010869379184441641,
+ 0.00010685920278774574
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.1114736795425415,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 163.22100830078125,
+ 136.5157012939453,
+ 115.2002944946289,
+ 93.15667724609375,
+ 73.07371520996094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.870210876921192e-05,
+ 9.846940520219505e-05,
+ 0.0001080361835192889,
+ 0.0001128382355091162,
+ 0.00010244990698993206
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.1125456094741821,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 163.21449279785156,
+ 136.63999938964844,
+ 114.51496124267578,
+ 92.76043701171875,
+ 73.22138214111328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.551862265449017e-05,
+ 9.3683076556772e-05,
+ 0.00010453341383254156,
+ 0.00010722207662183791,
+ 0.00010129058500751853
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.0996887683868408,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 162.75770568847656,
+ 136.49710083007812,
+ 114.6112060546875,
+ 92.87682342529297,
+ 73.25039672851562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.870910096447915e-05,
+ 9.74184149526991e-05,
+ 0.00010446018859511241,
+ 0.00011418589565437287,
+ 0.00010412647679913789
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.1063097715377808,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 163.11697387695312,
+ 136.4162139892578,
+ 114.9229507446289,
+ 93.17060089111328,
+ 73.40281677246094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.790192077867687e-05,
+ 9.763163689058274e-05,
+ 0.00010599731467664242,
+ 0.00011016600910807028,
+ 0.00010507069964660332
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6435546875,
+ "loss_eval": 1.1009955406188965,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 162.4318389892578,
+ 136.2643280029297,
+ 114.47940826416016,
+ 92.43824005126953,
+ 72.75123596191406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.680798055138439e-05,
+ 9.524248889647424e-05,
+ 0.00010346775525249541,
+ 0.00010771532106446102,
+ 0.00010157373617403209
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.106760025024414,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 162.55992126464844,
+ 136.00660705566406,
+ 114.44908142089844,
+ 92.65226745605469,
+ 73.14122772216797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.55888138175942e-05,
+ 9.422176663065329e-05,
+ 0.00010130204464076087,
+ 0.0001082807284547016,
+ 0.00010286335600540042
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6435546875,
+ "loss_eval": 1.1080232858657837,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 162.33607482910156,
+ 136.22657775878906,
+ 114.64276885986328,
+ 92.26687622070312,
+ 72.99312591552734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.005892934510484e-05,
+ 9.746963041834533e-05,
+ 0.00010383747576270252,
+ 0.00010905141971306875,
+ 0.00010293527157045901
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6455078125,
+ "loss_eval": 1.0989083051681519,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 161.69874572753906,
+ 135.9654998779297,
+ 113.88583374023438,
+ 91.72888946533203,
+ 72.5824966430664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.02136744116433e-05,
+ 9.903020691126585e-05,
+ 0.0001059234855347313,
+ 0.00011399909999454394,
+ 0.00010543780081206933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6435546875,
+ "loss_eval": 1.1039698123931885,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 162.3827362060547,
+ 136.0760498046875,
+ 114.07840728759766,
+ 91.95870971679688,
+ 72.59473419189453
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.043919999385253e-05,
+ 9.950586536433548e-05,
+ 0.00010800046584336087,
+ 0.00011628754145931453,
+ 0.00010360861051594839
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6435546875,
+ "loss_eval": 1.1007411479949951,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 161.50054931640625,
+ 135.7166748046875,
+ 113.83382415771484,
+ 91.96630096435547,
+ 72.61833953857422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.075389243662357e-05,
+ 9.988105011871085e-05,
+ 0.00010788880899781361,
+ 0.00011431374150561169,
+ 0.00010596351057756692
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.64453125,
+ "loss_eval": 1.0992103815078735,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 161.48770141601562,
+ 135.71417236328125,
+ 114.12840270996094,
+ 91.98160552978516,
+ 72.64606475830078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.050803782884032e-05,
+ 9.805837908061221e-05,
+ 0.00010800142626976594,
+ 0.00011649157386273146,
+ 0.00010660875705070794
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.640625,
+ "loss_eval": 1.1021543741226196,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 162.0372314453125,
+ 135.4561767578125,
+ 114.00292205810547,
+ 91.83483123779297,
+ 72.68809509277344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.82204039953649e-05,
+ 9.769284224603325e-05,
+ 0.00010632916382746771,
+ 0.00011439422814873978,
+ 0.00010489066335139796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6416015625,
+ "loss_eval": 1.1001535654067993,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 161.88534545898438,
+ 135.54629516601562,
+ 113.90684509277344,
+ 91.81143188476562,
+ 72.64588165283203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.120439790422097e-05,
+ 9.779920219443738e-05,
+ 0.00010798833682201803,
+ 0.00011447365250205621,
+ 0.00010797424329211935
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.642578125,
+ "loss_eval": 1.0961315631866455,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 162.06427001953125,
+ 135.49281311035156,
+ 113.69275665283203,
+ 91.76304626464844,
+ 72.4867935180664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.100054739974439e-05,
+ 9.935065463650972e-05,
+ 0.00010879126784857363,
+ 0.00011589765199460089,
+ 0.00010837834270205349
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6416015625,
+ "loss_eval": 1.097299337387085,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 162.06063842773438,
+ 135.57981872558594,
+ 113.76399230957031,
+ 91.94515991210938,
+ 72.56278991699219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.139141184277833e-05,
+ 9.897649579215795e-05,
+ 0.00010867504897760227,
+ 0.0001159063758677803,
+ 0.00010943930828943849
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6376953125,
+ "loss_eval": 1.0986907482147217,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 161.8842315673828,
+ 135.4130859375,
+ 113.66045379638672,
+ 91.80276489257812,
+ 72.58989715576172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.080857125809416e-05,
+ 0.00010123007814399898,
+ 0.00010883246432058513,
+ 0.00011908033775398508,
+ 0.00010963032400468364
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.0988240242004395,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 161.86744689941406,
+ 135.38331604003906,
+ 113.66378784179688,
+ 91.70223236083984,
+ 72.4896240234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.091695392271504e-05,
+ 0.00010080484207719564,
+ 0.00010940106585621834,
+ 0.00011762498616008088,
+ 0.00010917771578533575
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.0987744331359863,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 161.89633178710938,
+ 135.33140563964844,
+ 113.67347717285156,
+ 91.68895721435547,
+ 72.49469757080078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.099576709559187e-05,
+ 0.00010038664186140522,
+ 0.0001086170959752053,
+ 0.00011788319534389302,
+ 0.00010914496670011431
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.0990701913833618,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 161.9002227783203,
+ 135.33474731445312,
+ 113.68601989746094,
+ 91.69290924072266,
+ 72.48957061767578
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.096309076994658e-05,
+ 0.00010059915803140029,
+ 0.00010838409070856869,
+ 0.00011784962407546118,
+ 0.00010893247235799208
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.098876953125,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 161.8989715576172,
+ 135.33889770507812,
+ 113.69281768798828,
+ 91.6856689453125,
+ 72.48480224609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.085259807761759e-05,
+ 0.00010061707871500403,
+ 0.00010823038610396907,
+ 0.00011745247320504859,
+ 0.00010919221676886082
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6396484375,
+ "loss_eval": 1.0987944602966309,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.690464973449707,
+ 8.719978332519531,
+ 8.73093318939209,
+ 8.75937271118164,
+ 8.790542602539062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005465824506245553,
+ 0.0005437708459794521,
+ 0.0005393712199293077,
+ 0.0005331890424713492,
+ 0.0005310169071890414
+ ],
+ "gamma_dfa": 0.007568402143078856,
+ "gamma_dfa_per_layer": [
+ 0.002326551591977477,
+ 0.0009101498289965093,
+ -0.013218702748417854,
+ 0.04025560989975929
+ ],
+ "acc_eval": 0.1015625,
+ "loss_eval": 2.3754236698150635,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 536.5761108398438,
+ 845.265625,
+ 979.7896118164062,
+ 1192.0323486328125,
+ 1230.83935546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006465085316449404,
+ 0.0006462159799411893,
+ 0.0006460825679823756,
+ 0.0006459451396949589,
+ 0.0006460213917307556
+ ],
+ "gamma_dfa": 0.013024769607000053,
+ "gamma_dfa_per_layer": [
+ 0.035579413175582886,
+ -0.0025600260123610497,
+ -0.0014369464479386806,
+ 0.020516637712717056
+ ],
+ "acc_eval": 0.212890625,
+ "loss_eval": 8.137651443481445,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 886.7508544921875,
+ 1871.2640380859375,
+ 2198.631591796875,
+ 2689.22412109375,
+ 2904.254150390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007187994197010994,
+ 0.0007172312471084297,
+ 0.0007172476034611464,
+ 0.0007177897496148944,
+ 0.000717311049811542
+ ],
+ "gamma_dfa": 0.004487544531002641,
+ "gamma_dfa_per_layer": [
+ 0.04744107276201248,
+ -0.011962954886257648,
+ -0.02088175155222416,
+ 0.003353811800479889
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 16.637451171875,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1117.1649169921875,
+ 3064.644775390625,
+ 3849.060546875,
+ 4987.09130859375,
+ 5690.720703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000734492321498692,
+ 0.0007317167473956943,
+ 0.0007317643612623215,
+ 0.0007318624993786216,
+ 0.0007319750147871673
+ ],
+ "gamma_dfa": 0.0065072893630713224,
+ "gamma_dfa_per_layer": [
+ 0.0597357451915741,
+ -0.0063293795101344585,
+ -0.033218011260032654,
+ 0.0058408030308783054
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 29.753459930419922,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1279.7017822265625,
+ 4015.093017578125,
+ 5594.23828125,
+ 7459.69091796875,
+ 8727.64453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007434640428982675,
+ 0.0007419881876558065,
+ 0.0007416673470288515,
+ 0.000741377065423876,
+ 0.0007413675775751472
+ ],
+ "gamma_dfa": 0.0072651703376322985,
+ "gamma_dfa_per_layer": [
+ 0.07467889785766602,
+ -0.02277005836367607,
+ -0.009787362068891525,
+ -0.013060796074569225
+ ],
+ "acc_eval": 0.1640625,
+ "loss_eval": 54.22368621826172,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1399.06787109375,
+ 4862.35302734375,
+ 9250.7666015625,
+ 10789.8828125,
+ 12902.6591796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007491935975849628,
+ 0.0007442779606208205,
+ 0.0007423132774420083,
+ 0.0007422835915349424,
+ 0.0007422153139486909
+ ],
+ "gamma_dfa": -0.005301014054566622,
+ "gamma_dfa_per_layer": [
+ 0.06516245007514954,
+ -0.03411812335252762,
+ -0.034175027161836624,
+ -0.01807335577905178
+ ],
+ "acc_eval": 0.2080078125,
+ "loss_eval": 62.78772735595703,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1478.1070556640625,
+ 5865.33935546875,
+ 15407.5283203125,
+ 16717.609375,
+ 19284.30078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000746070989407599,
+ 0.0007320672739297152,
+ 0.0007320406148210168,
+ 0.0007324790931306779,
+ 0.0007322196033783257
+ ],
+ "gamma_dfa": -0.0043716938234865665,
+ "gamma_dfa_per_layer": [
+ 0.0889529138803482,
+ -0.03475068882107735,
+ -0.06096648424863815,
+ -0.010722516104578972
+ ],
+ "acc_eval": 0.21875,
+ "loss_eval": 84.72342681884766,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 1569.764892578125,
+ 7991.109375,
+ 22041.46484375,
+ 23657.2890625,
+ 27372.69140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007371728424914181,
+ 0.0007328476058319211,
+ 0.0007317248382605612,
+ 0.0007321859593503177,
+ 0.0007314819958992302
+ ],
+ "gamma_dfa": -0.006586531409993768,
+ "gamma_dfa_per_layer": [
+ 0.08020298182964325,
+ -0.038106564432382584,
+ -0.05412164330482483,
+ -0.014320899732410908
+ ],
+ "acc_eval": 0.21484375,
+ "loss_eval": 87.40310668945312,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 1649.8133544921875,
+ 12248.005859375,
+ 30825.916015625,
+ 32827.55078125,
+ 38153.3828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007630810141563416,
+ 0.0007434195140376687,
+ 0.0007433100836351514,
+ 0.0007435025763697922,
+ 0.0007434298167936504
+ ],
+ "gamma_dfa": -0.0035092607140541077,
+ "gamma_dfa_per_layer": [
+ 0.1012866348028183,
+ -0.029570601880550385,
+ -0.04660683125257492,
+ -0.039146244525909424
+ ],
+ "acc_eval": 0.1708984375,
+ "loss_eval": 157.51614379882812,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 1712.73193359375,
+ 20302.939453125,
+ 43360.37109375,
+ 46000.90234375,
+ 53154.84765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007849909015931189,
+ 0.0007540763472206891,
+ 0.0007541946833953261,
+ 0.0007542177918367088,
+ 0.0007542550447396934
+ ],
+ "gamma_dfa": 0.006478439085185528,
+ "gamma_dfa_per_layer": [
+ 0.1487787812948227,
+ -0.03583626449108124,
+ -0.0212298221886158,
+ -0.06579893827438354
+ ],
+ "acc_eval": 0.138671875,
+ "loss_eval": 512.7744750976562,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 1763.957763671875,
+ 29818.015625,
+ 57092.5546875,
+ 60514.234375,
+ 69695.1015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00080581457586959,
+ 0.0007400442264042795,
+ 0.0007398677407763898,
+ 0.0007363590411841869,
+ 0.0007358043803833425
+ ],
+ "gamma_dfa": -0.003822646103799343,
+ "gamma_dfa_per_layer": [
+ 0.1044168770313263,
+ -0.0318819060921669,
+ -0.054846249520778656,
+ -0.03297930583357811
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 288.6083984375,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 1841.6363525390625,
+ 43646.69921875,
+ 76665.53125,
+ 80991.453125,
+ 91946.4765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008064995636232197,
+ 0.0007405033684335649,
+ 0.0007410499965772033,
+ 0.0007410682155750692,
+ 0.0007410107646137476
+ ],
+ "gamma_dfa": -0.005903353448957205,
+ "gamma_dfa_per_layer": [
+ 0.15344271063804626,
+ -0.06077828258275986,
+ -0.0893951952457428,
+ -0.02688264660537243
+ ],
+ "acc_eval": 0.1630859375,
+ "loss_eval": 462.175537109375,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 1938.4581298828125,
+ 63804.453125,
+ 101178.828125,
+ 106970.6171875,
+ 119676.0390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008472055778838694,
+ 0.0007312041707336903,
+ 0.0007307010819204152,
+ 0.0007308369968086481,
+ 0.000730738160200417
+ ],
+ "gamma_dfa": 0.015948185697197914,
+ "gamma_dfa_per_layer": [
+ 0.19398558139801025,
+ -0.05326637625694275,
+ -0.057601772248744965,
+ -0.019324690103530884
+ ],
+ "acc_eval": 0.1572265625,
+ "loss_eval": 481.7687072753906,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 2059.50390625,
+ 86267.453125,
+ 127668.078125,
+ 134690.953125,
+ 148832.21875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008536268142051995,
+ 0.0007572658942081034,
+ 0.0007572331232950091,
+ 0.0007572534959763288,
+ 0.0007572824251838028
+ ],
+ "gamma_dfa": 0.007115887477993965,
+ "gamma_dfa_per_layer": [
+ 0.19894848763942719,
+ -0.06199394166469574,
+ -0.04606857895851135,
+ -0.06242241710424423
+ ],
+ "acc_eval": 0.162109375,
+ "loss_eval": 442.7697448730469,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 2162.650390625,
+ 111971.2421875,
+ 158544.5,
+ 167081.546875,
+ 183230.21875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009137325105257332,
+ 0.0007456843741238117,
+ 0.0007456432213075459,
+ 0.0007455914164893329,
+ 0.0007455993909388781
+ ],
+ "gamma_dfa": 0.008699490688741207,
+ "gamma_dfa_per_layer": [
+ 0.22433382272720337,
+ -0.07114191353321075,
+ -0.07720339298248291,
+ -0.041190553456544876
+ ],
+ "acc_eval": 0.16796875,
+ "loss_eval": 631.255859375,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 2287.1767578125,
+ 140028.015625,
+ 188737.5625,
+ 197952.296875,
+ 214414.0625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000864461821038276,
+ 0.0007380775641649961,
+ 0.0007383264601230621,
+ 0.000738749688025564,
+ 0.0007389392121694982
+ ],
+ "gamma_dfa": 0.01581217348575592,
+ "gamma_dfa_per_layer": [
+ 0.21350334584712982,
+ -0.05864371731877327,
+ -0.039877790957689285,
+ -0.051733143627643585
+ ],
+ "acc_eval": 0.1806640625,
+ "loss_eval": 720.0626220703125,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2390.364013671875,
+ 180786.796875,
+ 233030.703125,
+ 243522.09375,
+ 260648.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010889085242524743,
+ 0.0007420245674438775,
+ 0.0007420974434353411,
+ 0.0007420690963044763,
+ 0.0007420206675305963
+ ],
+ "gamma_dfa": 0.01692677615210414,
+ "gamma_dfa_per_layer": [
+ 0.22792349755764008,
+ -0.06613948941230774,
+ -0.0679212138056755,
+ -0.026155689731240273
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 1348.43115234375,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2525.60009765625,
+ 226341.015625,
+ 282575.21875,
+ 294521.5,
+ 313155.65625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010620173998177052,
+ 0.0007694299565628171,
+ 0.0007695311214774847,
+ 0.0007694744854234159,
+ 0.000769737409427762
+ ],
+ "gamma_dfa": 0.012939120642840862,
+ "gamma_dfa_per_layer": [
+ 0.24798060953617096,
+ -0.07888300716876984,
+ -0.03452270105481148,
+ -0.0828184187412262
+ ],
+ "acc_eval": 0.1572265625,
+ "loss_eval": 1277.5867919921875,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 2738.423828125,
+ 284434.5625,
+ 346282.90625,
+ 359909.125,
+ 379330.46875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009644942474551499,
+ 0.0007429496035911143,
+ 0.0007425086805596948,
+ 0.0007422671769745648,
+ 0.0007426248048432171
+ ],
+ "gamma_dfa": 0.02641105931252241,
+ "gamma_dfa_per_layer": [
+ 0.2637922763824463,
+ -0.06210581958293915,
+ -0.05640384927392006,
+ -0.039638370275497437
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 802.8688354492188,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 2890.100830078125,
+ 346858.71875,
+ 414202.09375,
+ 429987.3125,
+ 451374.3125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010854159481823444,
+ 0.0007560763042420149,
+ 0.0007561030797660351,
+ 0.0007562912651337683,
+ 0.0007561809034086764
+ ],
+ "gamma_dfa": -0.006043614819645882,
+ "gamma_dfa_per_layer": [
+ 0.18550744652748108,
+ -0.07387037575244904,
+ -0.0915735587477684,
+ -0.04423797130584717
+ ],
+ "acc_eval": 0.0927734375,
+ "loss_eval": 2067.48974609375,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 3048.9677734375,
+ 416326.4375,
+ 488715.9375,
+ 506779.0,
+ 528907.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001142722088843584,
+ 0.0007379497401416302,
+ 0.0007378923473879695,
+ 0.0007379662129096687,
+ 0.0007378893787972629
+ ],
+ "gamma_dfa": 0.020490088500082493,
+ "gamma_dfa_per_layer": [
+ 0.21813809871673584,
+ -0.053681232035160065,
+ -0.04219571128487587,
+ -0.040300801396369934
+ ],
+ "acc_eval": 0.2294921875,
+ "loss_eval": 1929.7166748046875,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 3216.734619140625,
+ 499057.0,
+ 577401.1875,
+ 597297.0,
+ 620542.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014556541573256254,
+ 0.0007413470884785056,
+ 0.0007413764833472669,
+ 0.0007412104168906808,
+ 0.0007420589681714773
+ ],
+ "gamma_dfa": 0.03948488784953952,
+ "gamma_dfa_per_layer": [
+ 0.27680304646492004,
+ -0.05157003924250603,
+ -0.039460550993680954,
+ -0.02783290483057499
+ ],
+ "acc_eval": 0.1474609375,
+ "loss_eval": 2699.9052734375,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 3342.216064453125,
+ 584495.625,
+ 665696.625,
+ 687533.1875,
+ 710813.9375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001884044730104506,
+ 0.0007584495469927788,
+ 0.0007583577535115182,
+ 0.0007583281840197742,
+ 0.0007583273691125214
+ ],
+ "gamma_dfa": 0.004080784507095814,
+ "gamma_dfa_per_layer": [
+ 0.1770291030406952,
+ -0.056366197764873505,
+ -0.057933274656534195,
+ -0.046406492590904236
+ ],
+ "acc_eval": 0.2373046875,
+ "loss_eval": 1742.9925537109375,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 3566.038818359375,
+ 674756.3125,
+ 760463.3125,
+ 784571.125,
+ 808618.6875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001965342788025737,
+ 0.0007340435404330492,
+ 0.0007341310847550631,
+ 0.0007343373727053404,
+ 0.0007337987190112472
+ ],
+ "gamma_dfa": 0.030578704085201025,
+ "gamma_dfa_per_layer": [
+ 0.24771088361740112,
+ -0.05749209225177765,
+ -0.04569869861006737,
+ -0.022205276414752007
+ ],
+ "acc_eval": 0.1611328125,
+ "loss_eval": 2397.3916015625,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 3779.54296875,
+ 786509.5,
+ 877152.1875,
+ 903987.8125,
+ 928449.375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016364307375624776,
+ 0.0007935749599710107,
+ 0.000793365528807044,
+ 0.0007934189052321017,
+ 0.0007935216999612749
+ ],
+ "gamma_dfa": 0.01740677817724645,
+ "gamma_dfa_per_layer": [
+ 0.2701166570186615,
+ -0.0851234570145607,
+ 0.004913746379315853,
+ -0.12027983367443085
+ ],
+ "acc_eval": 0.12109375,
+ "loss_eval": 4908.0458984375,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3969.119873046875,
+ 900145.9375,
+ 993945.75,
+ 1023047.9375,
+ 1047156.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012235429603606462,
+ 0.0007582573452964425,
+ 0.0007582195685245097,
+ 0.000758210604544729,
+ 0.0007582050748169422
+ ],
+ "gamma_dfa": -0.005556041374802589,
+ "gamma_dfa_per_layer": [
+ 0.2166597992181778,
+ -0.09299580752849579,
+ -0.09515514969825745,
+ -0.05073300749063492
+ ],
+ "acc_eval": 0.1728515625,
+ "loss_eval": 3738.029541015625,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 4167.24169921875,
+ 1027096.125,
+ 1126300.25,
+ 1158199.625,
+ 1183064.875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015538743464276195,
+ 0.0007320540607906878,
+ 0.0007321767043322325,
+ 0.0007325086044147611,
+ 0.0007322292076423764
+ ],
+ "gamma_dfa": 0.013890675269067287,
+ "gamma_dfa_per_layer": [
+ 0.25793927907943726,
+ -0.09288333356380463,
+ -0.07571414113044739,
+ -0.03377910330891609
+ ],
+ "acc_eval": 0.10546875,
+ "loss_eval": 6202.408203125,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 4332.73046875,
+ 1157313.5,
+ 1261637.875,
+ 1297158.5,
+ 1323617.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015948566142469645,
+ 0.0007783056935295463,
+ 0.00077825813787058,
+ 0.0007782406755723059,
+ 0.0007781987660564482
+ ],
+ "gamma_dfa": 0.02306488621979952,
+ "gamma_dfa_per_layer": [
+ 0.2585013508796692,
+ -0.07491485029459,
+ -0.058371271938085556,
+ -0.03295568376779556
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 4646.37451171875,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 4508.3486328125,
+ 1310938.125,
+ 1421261.875,
+ 1460382.75,
+ 1487384.375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001599438488483429,
+ 0.0007645513396710157,
+ 0.0007644708384759724,
+ 0.00076470518251881,
+ 0.0007645483710803092
+ ],
+ "gamma_dfa": 0.017900947481393814,
+ "gamma_dfa_per_layer": [
+ 0.24153774976730347,
+ -0.06473007053136826,
+ -0.06562119722366333,
+ -0.039582692086696625
+ ],
+ "acc_eval": 0.173828125,
+ "loss_eval": 5292.640625,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 4729.70556640625,
+ 1458380.25,
+ 1572980.125,
+ 1615003.0,
+ 1642261.875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014249716186895967,
+ 0.0007341640302911401,
+ 0.00073421117849648,
+ 0.0007345581543631852,
+ 0.0007344211917370558
+ ],
+ "gamma_dfa": 0.03120402991771698,
+ "gamma_dfa_per_layer": [
+ 0.2725849747657776,
+ -0.07284568250179291,
+ -0.05128118395805359,
+ -0.02364198863506317
+ ],
+ "acc_eval": 0.17578125,
+ "loss_eval": 4871.27001953125,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 4886.33984375,
+ 1617197.25,
+ 1735577.625,
+ 1780813.375,
+ 1808887.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018187292153015733,
+ 0.0007682304712943733,
+ 0.0007675564847886562,
+ 0.0007677674293518066,
+ 0.0007678233087062836
+ ],
+ "gamma_dfa": 0.017138252966105938,
+ "gamma_dfa_per_layer": [
+ 0.2494080811738968,
+ -0.08018361777067184,
+ -0.027287419885396957,
+ -0.07338403165340424
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 3960.6728515625,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 5119.7841796875,
+ 1765219.5,
+ 1886735.375,
+ 1934213.125,
+ 1961976.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0022127064876258373,
+ 0.000754481996409595,
+ 0.0007539362413808703,
+ 0.0007542265811935067,
+ 0.0007539446814917028
+ ],
+ "gamma_dfa": 0.0332237659022212,
+ "gamma_dfa_per_layer": [
+ 0.30639636516571045,
+ -0.08304375410079956,
+ -0.06092921271920204,
+ -0.029528334736824036
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 4306.7734375,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 5354.88720703125,
+ 1941186.125,
+ 2066860.125,
+ 2117348.25,
+ 2144884.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013304626336321235,
+ 0.0007719467394053936,
+ 0.0007719435379840434,
+ 0.0007721700239926577,
+ 0.0007720825960859656
+ ],
+ "gamma_dfa": 0.01764332875609398,
+ "gamma_dfa_per_layer": [
+ 0.2670303285121918,
+ -0.07338991016149521,
+ -0.05201137810945511,
+ -0.07105572521686554
+ ],
+ "acc_eval": 0.1845703125,
+ "loss_eval": 4018.3662109375,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 5519.78759765625,
+ 2116056.25,
+ 2246081.5,
+ 2300078.25,
+ 2327378.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016995095647871494,
+ 0.0007534062024205923,
+ 0.0007532716845162213,
+ 0.0007533822790719569,
+ 0.0007532139425165951
+ ],
+ "gamma_dfa": 0.021287068724632263,
+ "gamma_dfa_per_layer": [
+ 0.2717400789260864,
+ -0.08038187026977539,
+ -0.05876553803682327,
+ -0.04744439572095871
+ ],
+ "acc_eval": 0.216796875,
+ "loss_eval": 6509.134765625,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 5700.9130859375,
+ 2317603.75,
+ 2452612.5,
+ 2509779.5,
+ 2537064.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001880816649645567,
+ 0.0007947525009512901,
+ 0.0007945421966724098,
+ 0.0007944482495076954,
+ 0.0007949797436594963
+ ],
+ "gamma_dfa": 0.02851281687617302,
+ "gamma_dfa_per_layer": [
+ 0.2822743058204651,
+ -0.08248982578516006,
+ -0.05187612026929855,
+ -0.03385709226131439
+ ],
+ "acc_eval": 0.1337890625,
+ "loss_eval": 8231.9248046875,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 5855.8310546875,
+ 2515524.75,
+ 2653569.0,
+ 2713748.5,
+ 2740903.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018560283351689577,
+ 0.0007757823332212865,
+ 0.0007757038110867143,
+ 0.0007756180129945278,
+ 0.0007759004947729409
+ ],
+ "gamma_dfa": 0.018099953944329172,
+ "gamma_dfa_per_layer": [
+ 0.2729976773262024,
+ -0.08800812810659409,
+ -0.002550901612266898,
+ -0.11003883183002472
+ ],
+ "acc_eval": 0.150390625,
+ "loss_eval": 7247.7216796875,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 6036.9033203125,
+ 2711563.0,
+ 2854179.0,
+ 2918077.75,
+ 2945814.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001862754113972187,
+ 0.0007525583496317267,
+ 0.0007525330875068903,
+ 0.0007526627741754055,
+ 0.0007525623659603298
+ ],
+ "gamma_dfa": 0.02487885858863592,
+ "gamma_dfa_per_layer": [
+ 0.29685819149017334,
+ -0.08635345101356506,
+ -0.056181322783231735,
+ -0.054807983338832855
+ ],
+ "acc_eval": 0.1435546875,
+ "loss_eval": 7513.36376953125,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 6188.01611328125,
+ 2906995.5,
+ 3054202.25,
+ 3121279.0,
+ 3149996.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013340733712539077,
+ 0.0007529910071752965,
+ 0.0007524905377067626,
+ 0.0007527912384830415,
+ 0.0007525555556640029
+ ],
+ "gamma_dfa": 0.027058321982622147,
+ "gamma_dfa_per_layer": [
+ 0.25763267278671265,
+ -0.06575162708759308,
+ -0.04412994533777237,
+ -0.03951781243085861
+ ],
+ "acc_eval": 0.2431640625,
+ "loss_eval": 12329.697265625,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 6390.7060546875,
+ 3133419.5,
+ 3288636.0,
+ 3360502.75,
+ 3390539.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014776778407394886,
+ 0.0007607035804539919,
+ 0.0007607110310345888,
+ 0.0007606975850649178,
+ 0.000760715629439801
+ ],
+ "gamma_dfa": 0.022189474664628506,
+ "gamma_dfa_per_layer": [
+ 0.2616554796695709,
+ -0.07128072530031204,
+ -0.06259018927812576,
+ -0.039026666432619095
+ ],
+ "acc_eval": 0.173828125,
+ "loss_eval": 6832.28955078125,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 6548.68115234375,
+ 3356773.75,
+ 3517968.25,
+ 3593598.5,
+ 3624375.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002129003871232271,
+ 0.0007741872104816139,
+ 0.000774160900618881,
+ 0.0007743749301880598,
+ 0.0007743173046037555
+ ],
+ "gamma_dfa": 0.034090133383870125,
+ "gamma_dfa_per_layer": [
+ 0.3182219862937927,
+ -0.08398662507534027,
+ -0.06546281278133392,
+ -0.03241201490163803
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 5371.0859375,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 6723.9697265625,
+ 3592963.25,
+ 3757696.25,
+ 3837777.75,
+ 3868088.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018772021867334843,
+ 0.0007547365385107696,
+ 0.0007547002169303596,
+ 0.0007546909037046134,
+ 0.000754650856833905
+ ],
+ "gamma_dfa": 0.003609549254179001,
+ "gamma_dfa_per_layer": [
+ 0.282962441444397,
+ -0.10840916633605957,
+ -0.10053665935993195,
+ -0.05957841873168945
+ ],
+ "acc_eval": 0.1376953125,
+ "loss_eval": 8650.76953125,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 6887.81005859375,
+ 3829273.5,
+ 3999416.75,
+ 4084005.5,
+ 4113581.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020062020048499107,
+ 0.0007521071238443255,
+ 0.0007519447826780379,
+ 0.0007520412327721715,
+ 0.0007518909987993538
+ ],
+ "gamma_dfa": 0.01951257325708866,
+ "gamma_dfa_per_layer": [
+ 0.2743881344795227,
+ -0.08543786406517029,
+ -0.05402272939682007,
+ -0.056877247989177704
+ ],
+ "acc_eval": 0.1796875,
+ "loss_eval": 15509.98828125,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 7027.42626953125,
+ 4050130.5,
+ 4223340.0,
+ 4310667.5,
+ 4340882.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016777552664279938,
+ 0.0007508718408644199,
+ 0.0007508369744755328,
+ 0.0007509454735554755,
+ 0.0007508718408644199
+ ],
+ "gamma_dfa": 0.02786387037485838,
+ "gamma_dfa_per_layer": [
+ 0.2803051769733429,
+ -0.07360324263572693,
+ -0.04823639243841171,
+ -0.04701006039977074
+ ],
+ "acc_eval": 0.2275390625,
+ "loss_eval": 7618.71533203125,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 7157.845703125,
+ 4292685.0,
+ 4471049.5,
+ 4562175.0,
+ 4591811.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016224944265559316,
+ 0.0007538175559602678,
+ 0.0007538740755990148,
+ 0.0007538648205809295,
+ 0.0007538393838331103
+ ],
+ "gamma_dfa": 0.0053657907992601395,
+ "gamma_dfa_per_layer": [
+ 0.26428842544555664,
+ -0.10051027685403824,
+ -0.08806045353412628,
+ -0.05425453186035156
+ ],
+ "acc_eval": 0.166015625,
+ "loss_eval": 7869.64111328125,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 7275.4365234375,
+ 4532040.5,
+ 4714971.5,
+ 4809776.0,
+ 4839258.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002823092043399811,
+ 0.0007887987303547561,
+ 0.0007888769032433629,
+ 0.0007889135158620775,
+ 0.0007889300468377769
+ ],
+ "gamma_dfa": 0.008974121417850256,
+ "gamma_dfa_per_layer": [
+ 0.25932246446609497,
+ -0.10199789702892303,
+ 0.012336602434515953,
+ -0.13376468420028687
+ ],
+ "acc_eval": 0.091796875,
+ "loss_eval": 19789.41796875,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 7393.93212890625,
+ 4772152.5,
+ 4958566.0,
+ 5058113.0,
+ 5086560.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0019131727749481797,
+ 0.0007677456014789641,
+ 0.0007676532259210944,
+ 0.000767527730204165,
+ 0.0007678664987906814
+ ],
+ "gamma_dfa": 0.014807725325226784,
+ "gamma_dfa_per_layer": [
+ 0.23344306647777557,
+ -0.08349616825580597,
+ -0.0560825914144516,
+ -0.03463340550661087
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 12636.65625,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 7527.99462890625,
+ 5048336.0,
+ 5239027.5,
+ 5342244.0,
+ 5370085.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018555351998656988,
+ 0.000769329781178385,
+ 0.0007686647586524487,
+ 0.0007689501508139074,
+ 0.0007690390921197832
+ ],
+ "gamma_dfa": 0.004876136779785156,
+ "gamma_dfa_per_layer": [
+ 0.21739649772644043,
+ -0.08506827056407928,
+ -0.03674054145812988,
+ -0.07608313858509064
+ ],
+ "acc_eval": 0.232421875,
+ "loss_eval": 12248.12109375,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 7638.85693359375,
+ 5287113.0,
+ 5479795.0,
+ 5586404.5,
+ 5613225.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0025236238725483418,
+ 0.0007688805344514549,
+ 0.000768228666856885,
+ 0.0007684807060286403,
+ 0.0007685597520321608
+ ],
+ "gamma_dfa": -0.006854387931525707,
+ "gamma_dfa_per_layer": [
+ 0.17993390560150146,
+ -0.08751687407493591,
+ -0.030272338539361954,
+ -0.08956224471330643
+ ],
+ "acc_eval": 0.1796875,
+ "loss_eval": 18537.177734375,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 7754.390625,
+ 5527426.0,
+ 5724221.0,
+ 5833576.5,
+ 5860100.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020714402198791504,
+ 0.0007631001644767821,
+ 0.0007630567415617406,
+ 0.0007630541222169995,
+ 0.0007631017942912877
+ ],
+ "gamma_dfa": 0.02875693328678608,
+ "gamma_dfa_per_layer": [
+ 0.29564130306243896,
+ -0.08437579870223999,
+ -0.050235565751791,
+ -0.04600220546126366
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 10527.2578125,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 7888.46923828125,
+ 5787159.5,
+ 5987915.0,
+ 6101035.0,
+ 6127097.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0026283818297088146,
+ 0.0007835617288947105,
+ 0.0007836156873963773,
+ 0.000783648225478828,
+ 0.0007836673175916076
+ ],
+ "gamma_dfa": 0.011204172391444445,
+ "gamma_dfa_per_layer": [
+ 0.26796066761016846,
+ -0.10181419551372528,
+ 0.010023357346653938,
+ -0.13135313987731934
+ ],
+ "acc_eval": 0.0966796875,
+ "loss_eval": 15481.84375,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 7975.13671875,
+ 6029198.0,
+ 6234359.5,
+ 6352162.0,
+ 6377873.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001740386476740241,
+ 0.0007632866618223488,
+ 0.0007632256019860506,
+ 0.0007631148328073323,
+ 0.0007634586072526872
+ ],
+ "gamma_dfa": -0.000985240563750267,
+ "gamma_dfa_per_layer": [
+ 0.20569762587547302,
+ -0.0866088718175888,
+ -0.04746733605861664,
+ -0.07556238025426865
+ ],
+ "acc_eval": 0.2001953125,
+ "loss_eval": 12020.572265625,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 8109.23095703125,
+ 6280213.0,
+ 6488845.5,
+ 6610432.5,
+ 6636101.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018630403792485595,
+ 0.0007671525236219168,
+ 0.000766951881814748,
+ 0.0007671291241422296,
+ 0.0007672281353734434
+ ],
+ "gamma_dfa": -0.0027379142120480537,
+ "gamma_dfa_per_layer": [
+ 0.22697225213050842,
+ -0.10085368156433105,
+ -0.059774767607450485,
+ -0.0772954598069191
+ ],
+ "acc_eval": 0.13671875,
+ "loss_eval": 12490.904296875,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 8223.3388671875,
+ 6520398.5,
+ 6731145.5,
+ 6855487.0,
+ 6880542.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020134998485445976,
+ 0.0007573508773930371,
+ 0.0007573754992336035,
+ 0.0007574421470053494,
+ 0.0007576147909276187
+ ],
+ "gamma_dfa": 0.00887075625360012,
+ "gamma_dfa_per_layer": [
+ 0.260132372379303,
+ -0.08125708997249603,
+ -0.07711100578308105,
+ -0.06628125160932541
+ ],
+ "acc_eval": 0.12890625,
+ "loss_eval": 13286.50390625,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 8317.2099609375,
+ 6773551.0,
+ 6990263.5,
+ 7117609.5,
+ 7143509.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016349060460925102,
+ 0.000744542689062655,
+ 0.0007445236551575363,
+ 0.000744638848118484,
+ 0.0007445821538567543
+ ],
+ "gamma_dfa": 0.036132486537098885,
+ "gamma_dfa_per_layer": [
+ 0.35822737216949463,
+ -0.09246134012937546,
+ -0.05995674431324005,
+ -0.06127934157848358
+ ],
+ "acc_eval": 0.1318359375,
+ "loss_eval": 12961.923828125,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 8396.16015625,
+ 7036334.0,
+ 7256480.5,
+ 7388541.0,
+ 7414023.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016424244968220592,
+ 0.0007655483204871416,
+ 0.0007653584470972419,
+ 0.0007655261433683336,
+ 0.0007656112429685891
+ ],
+ "gamma_dfa": 0.00855250470340252,
+ "gamma_dfa_per_layer": [
+ 0.31318342685699463,
+ -0.11486171185970306,
+ -0.07210143655538559,
+ -0.0920102596282959
+ ],
+ "acc_eval": 0.0986328125,
+ "loss_eval": 14289.1396484375,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 8425.91796875,
+ 7268265.0,
+ 7491250.5,
+ 7626377.5,
+ 7651502.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014321975177153945,
+ 0.0007547372952103615,
+ 0.0007547161658294499,
+ 0.0007547704153694212,
+ 0.000754979089833796
+ ],
+ "gamma_dfa": 0.019777772948145866,
+ "gamma_dfa_per_layer": [
+ 0.3146383762359619,
+ -0.0827077254652977,
+ -0.0876566469669342,
+ -0.06516291201114655
+ ],
+ "acc_eval": 0.0908203125,
+ "loss_eval": 12761.185546875,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 8519.505859375,
+ 7514964.5,
+ 7741589.0,
+ 7880037.0,
+ 7905207.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017787133110687137,
+ 0.0007505406392738223,
+ 0.0007507357513532043,
+ 0.0007507326663471758,
+ 0.0007507237605750561
+ ],
+ "gamma_dfa": -0.012186199426651001,
+ "gamma_dfa_per_layer": [
+ 0.2306034117937088,
+ -0.11392365396022797,
+ -0.1025918573141098,
+ -0.06283269822597504
+ ],
+ "acc_eval": 0.1455078125,
+ "loss_eval": 8573.3310546875,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 8575.814453125,
+ 7701015.5,
+ 7930432.0,
+ 8070523.0,
+ 8095346.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013273135991767049,
+ 0.0007214294746518135,
+ 0.0007213159115053713,
+ 0.0007215962978079915,
+ 0.0007215975201688707
+ ],
+ "gamma_dfa": 0.02046024613082409,
+ "gamma_dfa_per_layer": [
+ 0.2830252945423126,
+ -0.09345690906047821,
+ -0.06962529569864273,
+ -0.038102105259895325
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 6201.162109375,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 8635.1220703125,
+ 7939687.0,
+ 8172801.5,
+ 8315327.5,
+ 8340462.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002125338651239872,
+ 0.0007551790331490338,
+ 0.0007551065064035356,
+ 0.0007549694273620844,
+ 0.000755314074922353
+ ],
+ "gamma_dfa": 0.019076894968748093,
+ "gamma_dfa_per_layer": [
+ 0.25508445501327515,
+ -0.07673472911119461,
+ -0.04303552210330963,
+ -0.059006623923778534
+ ],
+ "acc_eval": 0.1865234375,
+ "loss_eval": 12055.595703125,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 8706.6689453125,
+ 8158003.0,
+ 8394169.0,
+ 8539798.0,
+ 8565165.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001350156613625586,
+ 0.0007560249068774283,
+ 0.0007559725781902671,
+ 0.0007558663492091,
+ 0.0007561935926787555
+ ],
+ "gamma_dfa": 0.028152598068118095,
+ "gamma_dfa_per_layer": [
+ 0.28580546379089355,
+ -0.08475945889949799,
+ -0.05238167941570282,
+ -0.03605393320322037
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 12085.9541015625,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 8758.453125,
+ 8374766.0,
+ 8613513.0,
+ 8761622.0,
+ 8786363.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002377285622060299,
+ 0.0007197813247330487,
+ 0.0007195555372163653,
+ 0.0007198317907750607,
+ 0.000719684932846576
+ ],
+ "gamma_dfa": 0.025455349124968052,
+ "gamma_dfa_per_layer": [
+ 0.27419814467430115,
+ -0.08699844777584076,
+ -0.04594934359192848,
+ -0.0394289568066597
+ ],
+ "acc_eval": 0.1669921875,
+ "loss_eval": 13302.744140625,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 8795.5654296875,
+ 8572136.0,
+ 8812910.0,
+ 8963599.0,
+ 8987706.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015984047204256058,
+ 0.0007187420851550996,
+ 0.0007185072172433138,
+ 0.000718816474545747,
+ 0.000718718278221786
+ ],
+ "gamma_dfa": 0.020128127187490463,
+ "gamma_dfa_per_layer": [
+ 0.3066103458404541,
+ -0.1022094339132309,
+ -0.07834567129611969,
+ -0.04554273188114166
+ ],
+ "acc_eval": 0.1181640625,
+ "loss_eval": 6553.7236328125,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 8811.46875,
+ 8766653.0,
+ 9009529.0,
+ 9162389.0,
+ 9185680.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0019123096717521548,
+ 0.0007724921451881528,
+ 0.0007725215400569141,
+ 0.0007725482573732734,
+ 0.0007725649629719555
+ ],
+ "gamma_dfa": 0.03271363768726587,
+ "gamma_dfa_per_layer": [
+ 0.2947639226913452,
+ -0.08735189586877823,
+ -0.04557036980986595,
+ -0.030987106263637543
+ ],
+ "acc_eval": 0.18359375,
+ "loss_eval": 11607.7158203125,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 8860.6220703125,
+ 8977001.0,
+ 9224122.0,
+ 9379773.0,
+ 9402851.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013403806369751692,
+ 0.0007685344316996634,
+ 0.0007685531745664775,
+ 0.0007685986929573119,
+ 0.0007685821619816124
+ ],
+ "gamma_dfa": 0.020242065889760852,
+ "gamma_dfa_per_layer": [
+ 0.30239802598953247,
+ -0.09480112791061401,
+ -0.014634584076702595,
+ -0.11199405044317245
+ ],
+ "acc_eval": 0.1337890625,
+ "loss_eval": 9788.81640625,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 8904.9482421875,
+ 9185937.0,
+ 9436793.0,
+ 9595000.0,
+ 9618183.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012845145538449287,
+ 0.0007421535556204617,
+ 0.0007421503541991115,
+ 0.0007421293412335217,
+ 0.0007421668851748109
+ ],
+ "gamma_dfa": 0.02229973580688238,
+ "gamma_dfa_per_layer": [
+ 0.2927352786064148,
+ -0.08628389239311218,
+ -0.060364432632923126,
+ -0.05688801035284996
+ ],
+ "acc_eval": 0.1728515625,
+ "loss_eval": 8114.20458984375,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 8892.296875,
+ 9356716.0,
+ 9611136.0,
+ 9771064.0,
+ 9794530.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001351315644569695,
+ 0.0007599962409585714,
+ 0.0007597811054438353,
+ 0.0007599799428135157,
+ 0.0007600505487062037
+ ],
+ "gamma_dfa": 0.019069598987698555,
+ "gamma_dfa_per_layer": [
+ 0.29072487354278564,
+ -0.0944916158914566,
+ -0.05359811335802078,
+ -0.06635674834251404
+ ],
+ "acc_eval": 0.169921875,
+ "loss_eval": 8773.3408203125,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 8905.83984375,
+ 9511506.0,
+ 9766884.0,
+ 9928659.0,
+ 9951002.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017338081961497664,
+ 0.0007696599350310862,
+ 0.0007696837419643998,
+ 0.0007697126129642129,
+ 0.0007697291439399123
+ ],
+ "gamma_dfa": 0.028427925892174244,
+ "gamma_dfa_per_layer": [
+ 0.3319295644760132,
+ -0.09938425570726395,
+ 0.004324089735746384,
+ -0.12315769493579865
+ ],
+ "acc_eval": 0.1142578125,
+ "loss_eval": 12823.435546875,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 8944.53125,
+ 9692436.0,
+ 9950194.0,
+ 10113948.0,
+ 10136307.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017030658200383186,
+ 0.000714489258825779,
+ 0.0007141575333662331,
+ 0.0007145405979827046,
+ 0.0007144163828343153
+ ],
+ "gamma_dfa": 0.055724941194057465,
+ "gamma_dfa_per_layer": [
+ 0.3514706492424011,
+ -0.07685236632823944,
+ -0.031716104596853256,
+ -0.020002413541078568
+ ],
+ "acc_eval": 0.18359375,
+ "loss_eval": 10412.890625,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 8926.98828125,
+ 9838798.0,
+ 10099141.0,
+ 10264565.0,
+ 10286604.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015448650810867548,
+ 0.0007684402517043054,
+ 0.0007684584707021713,
+ 0.0007684882148168981,
+ 0.0007685049204155803
+ ],
+ "gamma_dfa": 0.032529132440686226,
+ "gamma_dfa_per_layer": [
+ 0.3082513213157654,
+ -0.0888272076845169,
+ -0.032446227967739105,
+ -0.056861355900764465
+ ],
+ "acc_eval": 0.19921875,
+ "loss_eval": 8345.18359375,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 8903.689453125,
+ 10005445.0,
+ 10266980.0,
+ 10434005.0,
+ 10454617.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017746278317645192,
+ 0.0007130402373149991,
+ 0.0007127230055630207,
+ 0.0007131076999939978,
+ 0.0007130174781195819
+ ],
+ "gamma_dfa": 0.05443635303527117,
+ "gamma_dfa_per_layer": [
+ 0.35508570075035095,
+ -0.08241431415081024,
+ -0.03841204196214676,
+ -0.01651393249630928
+ ],
+ "acc_eval": 0.140625,
+ "loss_eval": 7877.36181640625,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 8910.42578125,
+ 10173785.0,
+ 10439506.0,
+ 10609011.0,
+ 10630571.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011222161119803786,
+ 0.0007312637171708047,
+ 0.0007313191890716553,
+ 0.0007313672685995698,
+ 0.0007313768728636205
+ ],
+ "gamma_dfa": 0.023520448245108128,
+ "gamma_dfa_per_layer": [
+ 0.29335978627204895,
+ -0.08935706317424774,
+ -0.06947942078113556,
+ -0.04044150933623314
+ ],
+ "acc_eval": 0.2421875,
+ "loss_eval": 5653.23388671875,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 8876.2041015625,
+ 10317365.0,
+ 10586095.0,
+ 10757344.0,
+ 10779691.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011208312353119254,
+ 0.0007571111200377345,
+ 0.0007568965083919466,
+ 0.0007570943562313914,
+ 0.0007571595488116145
+ ],
+ "gamma_dfa": 0.025294490158557892,
+ "gamma_dfa_per_layer": [
+ 0.331506609916687,
+ -0.09467847645282745,
+ -0.06287634372711182,
+ -0.07277382910251617
+ ],
+ "acc_eval": 0.1884765625,
+ "loss_eval": 3869.094970703125,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 8852.7001953125,
+ 10449657.0,
+ 10719980.0,
+ 10891483.0,
+ 10913594.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001109768869355321,
+ 0.0007331773522309959,
+ 0.0007331601809710264,
+ 0.0007332302629947662,
+ 0.0007332285749725997
+ ],
+ "gamma_dfa": 0.03539558406919241,
+ "gamma_dfa_per_layer": [
+ 0.3268349766731262,
+ -0.08062416315078735,
+ -0.055393531918525696,
+ -0.04923494532704353
+ ],
+ "acc_eval": 0.2353515625,
+ "loss_eval": 7111.935546875,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 8827.3955078125,
+ 10582167.0,
+ 10855077.0,
+ 11028114.0,
+ 11050690.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001240618177689612,
+ 0.0007623998681083322,
+ 0.0007624404970556498,
+ 0.0007624777499586344,
+ 0.0007624629070051014
+ ],
+ "gamma_dfa": 0.03839550958946347,
+ "gamma_dfa_per_layer": [
+ 0.36802345514297485,
+ -0.09764832258224487,
+ -0.0042990874499082565,
+ -0.11249400675296783
+ ],
+ "acc_eval": 0.1357421875,
+ "loss_eval": 6752.0322265625,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 8814.1962890625,
+ 10696667.0,
+ 10971925.0,
+ 11146316.0,
+ 11168931.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001309843035414815,
+ 0.0007403214112855494,
+ 0.0007405314245261252,
+ 0.0007405264186672866,
+ 0.0007405087817460299
+ ],
+ "gamma_dfa": 0.038134077563881874,
+ "gamma_dfa_per_layer": [
+ 0.3364037275314331,
+ -0.08192241191864014,
+ -0.03633008152246475,
+ -0.06561492383480072
+ ],
+ "acc_eval": 0.212890625,
+ "loss_eval": 6998.021484375,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 8779.0400390625,
+ 10798076.0,
+ 11075004.0,
+ 11250115.0,
+ 11272600.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011087025050073862,
+ 0.0007316112169064581,
+ 0.0007316232076846063,
+ 0.0007316932315006852,
+ 0.00073169672396034
+ ],
+ "gamma_dfa": 0.04451032355427742,
+ "gamma_dfa_per_layer": [
+ 0.34500744938850403,
+ -0.07661331444978714,
+ -0.04388073831796646,
+ -0.04647210240364075
+ ],
+ "acc_eval": 0.2490234375,
+ "loss_eval": 3624.614013671875,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 8751.8486328125,
+ 10906611.0,
+ 11185716.0,
+ 11362176.0,
+ 11384611.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001067605335265398,
+ 0.0007393756532110274,
+ 0.0007396025466732681,
+ 0.000739598530344665,
+ 0.000739583745598793
+ ],
+ "gamma_dfa": 0.03648093156516552,
+ "gamma_dfa_per_layer": [
+ 0.31906285881996155,
+ -0.07843812555074692,
+ -0.051880721002817154,
+ -0.0428202860057354
+ ],
+ "acc_eval": 0.2509765625,
+ "loss_eval": 2816.3427734375,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 8743.0078125,
+ 10999747.0,
+ 11279813.0,
+ 11457343.0,
+ 11479737.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010900371707975864,
+ 0.0007332717068493366,
+ 0.0007332694949582219,
+ 0.0007332508685067296,
+ 0.0007332859677262604
+ ],
+ "gamma_dfa": 0.03520212788134813,
+ "gamma_dfa_per_layer": [
+ 0.3010096549987793,
+ -0.07223288714885712,
+ -0.05185239389538765,
+ -0.036115862429142
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 3747.66748046875,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 8693.3349609375,
+ 11081850.0,
+ 11362476.0,
+ 11540274.0,
+ 11562006.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010161141399294138,
+ 0.0007433417486026883,
+ 0.0007432828424498439,
+ 0.000743163691367954,
+ 0.0007434578728862107
+ ],
+ "gamma_dfa": 0.04203554056584835,
+ "gamma_dfa_per_layer": [
+ 0.3622134029865265,
+ -0.08443501591682434,
+ -0.020812533795833588,
+ -0.08882369101047516
+ ],
+ "acc_eval": 0.1953125,
+ "loss_eval": 3283.453125,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 8679.0673828125,
+ 11176062.0,
+ 11458995.0,
+ 11637744.0,
+ 11660108.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010180213721469045,
+ 0.0007298000273294747,
+ 0.000729813240468502,
+ 0.0007298758719116449,
+ 0.0007298807031475008
+ ],
+ "gamma_dfa": 0.03867925424128771,
+ "gamma_dfa_per_layer": [
+ 0.3430703282356262,
+ -0.08001460134983063,
+ -0.05243712291121483,
+ -0.05590158700942993
+ ],
+ "acc_eval": 0.22265625,
+ "loss_eval": 3249.233154296875,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 8630.8896484375,
+ 11249126.0,
+ 11532709.0,
+ 11711592.0,
+ 11733760.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001043561496771872,
+ 0.0007425911608152092,
+ 0.0007425197982229292,
+ 0.0007423801580443978,
+ 0.000742721778806299
+ ],
+ "gamma_dfa": 0.028339628130197525,
+ "gamma_dfa_per_layer": [
+ 0.32279035449028015,
+ -0.09357395768165588,
+ -0.06377816200256348,
+ -0.05207972228527069
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 3085.4638671875,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 8578.060546875,
+ 11304050.0,
+ 11589802.0,
+ 11769234.0,
+ 11792299.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000967628788203001,
+ 0.0007289479253813624,
+ 0.0007289598579518497,
+ 0.0007290169014595449,
+ 0.0007290222565643489
+ ],
+ "gamma_dfa": 0.02121756039559841,
+ "gamma_dfa_per_layer": [
+ 0.31049084663391113,
+ -0.09504136443138123,
+ -0.07916043698787689,
+ -0.05141880363225937
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 1885.889404296875,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 8522.4794921875,
+ 11393685.0,
+ 11680880.0,
+ 11860855.0,
+ 11883774.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010794082190841436,
+ 0.0007521919906139374,
+ 0.0007519960636273026,
+ 0.0007521732477471232,
+ 0.0007522284286096692
+ ],
+ "gamma_dfa": 0.026587368920445442,
+ "gamma_dfa_per_layer": [
+ 0.37745779752731323,
+ -0.11168865859508514,
+ -0.0728297159075737,
+ -0.08658994734287262
+ ],
+ "acc_eval": 0.1220703125,
+ "loss_eval": 2588.15478515625,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 8482.1484375,
+ 11447732.0,
+ 11736021.0,
+ 11916302.0,
+ 11939110.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009376976522617042,
+ 0.0007250583730638027,
+ 0.000724694284144789,
+ 0.0007250410853885114,
+ 0.0007250093622133136
+ ],
+ "gamma_dfa": 0.0355191919952631,
+ "gamma_dfa_per_layer": [
+ 0.31943440437316895,
+ -0.07911509275436401,
+ -0.0536213181912899,
+ -0.04462122544646263
+ ],
+ "acc_eval": 0.2783203125,
+ "loss_eval": 1507.2919921875,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 8430.1455078125,
+ 11492522.0,
+ 11781554.0,
+ 11962317.0,
+ 11985175.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009387033060193062,
+ 0.0007079826318658888,
+ 0.0007078545750118792,
+ 0.0007080811192281544,
+ 0.0007080849609337747
+ ],
+ "gamma_dfa": 0.036465028300881386,
+ "gamma_dfa_per_layer": [
+ 0.3066443204879761,
+ -0.07488954067230225,
+ -0.03129498288035393,
+ -0.05459968373179436
+ ],
+ "acc_eval": 0.275390625,
+ "loss_eval": 1614.5029296875,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 8369.6298828125,
+ 11532036.0,
+ 11821641.0,
+ 12002443.0,
+ 12025323.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009389162878505886,
+ 0.0007232772768475115,
+ 0.0007233347278088331,
+ 0.0007233632495626807,
+ 0.000723376520909369
+ ],
+ "gamma_dfa": 0.040183850564062595,
+ "gamma_dfa_per_layer": [
+ 0.34539365768432617,
+ -0.08373545110225677,
+ -0.05380668863654137,
+ -0.04711611568927765
+ ],
+ "acc_eval": 0.25,
+ "loss_eval": 1501.9444580078125,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 8319.4169921875,
+ 11569238.0,
+ 11860199.0,
+ 12041371.0,
+ 12064573.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009176665917038918,
+ 0.0007041870849207044,
+ 0.0007039242191240191,
+ 0.0007042758516035974,
+ 0.0007042170618660748
+ ],
+ "gamma_dfa": 0.035514961928129196,
+ "gamma_dfa_per_layer": [
+ 0.2879785895347595,
+ -0.07180146872997284,
+ -0.037917762994766235,
+ -0.03619951009750366
+ ],
+ "acc_eval": 0.30859375,
+ "loss_eval": 1078.8165283203125,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 8282.478515625,
+ 11596869.0,
+ 11888039.0,
+ 12069453.0,
+ 12092582.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00098571612033993,
+ 0.000731602602172643,
+ 0.0007312855450436473,
+ 0.0007312477100640535,
+ 0.0007316134287975729
+ ],
+ "gamma_dfa": 0.04066215269267559,
+ "gamma_dfa_per_layer": [
+ 0.33381348848342896,
+ -0.08063024282455444,
+ -0.055662885308265686,
+ -0.034871749579906464
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 1841.648193359375,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 8242.1005859375,
+ 11624052.0,
+ 11916218.0,
+ 12098548.0,
+ 12121911.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009184937225654721,
+ 0.0007233315263874829,
+ 0.000723001197911799,
+ 0.0007232833886519074,
+ 0.0007232468342408538
+ ],
+ "gamma_dfa": 0.03233872726559639,
+ "gamma_dfa_per_layer": [
+ 0.2990570068359375,
+ -0.07802218198776245,
+ -0.04814079403877258,
+ -0.04353912174701691
+ ],
+ "acc_eval": 0.2890625,
+ "loss_eval": 980.395751953125,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 8216.91796875,
+ 11647355.0,
+ 11939175.0,
+ 12121172.0,
+ 12144056.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008776114555075765,
+ 0.0007067625410854816,
+ 0.0007066249381750822,
+ 0.0007068619015626609,
+ 0.0007068667327985168
+ ],
+ "gamma_dfa": 0.027417242527008057,
+ "gamma_dfa_per_layer": [
+ 0.28433892130851746,
+ -0.07622525095939636,
+ -0.050822652876377106,
+ -0.04762204736471176
+ ],
+ "acc_eval": 0.326171875,
+ "loss_eval": 776.0946044921875,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 8169.76513671875,
+ 11658648.0,
+ 11950474.0,
+ 12132456.0,
+ 12155182.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008986471802927554,
+ 0.0007065801764838398,
+ 0.0007064181263558567,
+ 0.000706693041138351,
+ 0.0007066999096423388
+ ],
+ "gamma_dfa": 0.03352018166333437,
+ "gamma_dfa_per_layer": [
+ 0.296892374753952,
+ -0.07546264678239822,
+ -0.04814247041940689,
+ -0.03920653089880943
+ ],
+ "acc_eval": 0.3095703125,
+ "loss_eval": 893.558349609375,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 8142.11669921875,
+ 11667783.0,
+ 11959690.0,
+ 12141714.0,
+ 12164439.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009172433638013899,
+ 0.0007064292440190911,
+ 0.0007062776712700725,
+ 0.0007065359968692064,
+ 0.000706541701219976
+ ],
+ "gamma_dfa": 0.03799809701740742,
+ "gamma_dfa_per_layer": [
+ 0.31104975938796997,
+ -0.07753260433673859,
+ -0.04483959078788757,
+ -0.03668517619371414
+ ],
+ "acc_eval": 0.2763671875,
+ "loss_eval": 918.902099609375,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 8113.36474609375,
+ 11673688.0,
+ 11965558.0,
+ 12147558.0,
+ 12170198.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009179572225548327,
+ 0.0007257050601765513,
+ 0.0007257269462570548,
+ 0.0007257769466377795,
+ 0.0007257869001477957
+ ],
+ "gamma_dfa": 0.03620104119181633,
+ "gamma_dfa_per_layer": [
+ 0.3097808361053467,
+ -0.07722775638103485,
+ -0.0500766858458519,
+ -0.03767222911119461
+ ],
+ "acc_eval": 0.2880859375,
+ "loss_eval": 1033.579833984375,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 8085.35595703125,
+ 11678927.0,
+ 11970798.0,
+ 12152808.0,
+ 12175446.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008720594923943281,
+ 0.0007061808719299734,
+ 0.0007060291827656329,
+ 0.0007062855875119567,
+ 0.0007062909426167607
+ ],
+ "gamma_dfa": 0.03221010882407427,
+ "gamma_dfa_per_layer": [
+ 0.2895042598247528,
+ -0.07448285818099976,
+ -0.04004380851984024,
+ -0.04613715782761574
+ ],
+ "acc_eval": 0.3046875,
+ "loss_eval": 827.44140625,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 8072.322265625,
+ 11682684.0,
+ 11974490.0,
+ 12156499.0,
+ 12179080.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008837314089760184,
+ 0.0007061065407469869,
+ 0.0007059663184918463,
+ 0.00070620869519189,
+ 0.000706215447280556
+ ],
+ "gamma_dfa": 0.026722624897956848,
+ "gamma_dfa_per_layer": [
+ 0.28959959745407104,
+ -0.08210700005292892,
+ -0.05253326892852783,
+ -0.048068828880786896
+ ],
+ "acc_eval": 0.291015625,
+ "loss_eval": 795.6766357421875,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 8063.02001953125,
+ 11684947.0,
+ 11976758.0,
+ 12158785.0,
+ 12181362.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008943622815422714,
+ 0.0007086708792485297,
+ 0.0007086790283210576,
+ 0.0007087094127200544,
+ 0.0007087020785547793
+ ],
+ "gamma_dfa": 0.02946585137397051,
+ "gamma_dfa_per_layer": [
+ 0.29232603311538696,
+ -0.08056485652923584,
+ -0.05102770775556564,
+ -0.042870063334703445
+ ],
+ "acc_eval": 0.2919921875,
+ "loss_eval": 839.8633422851562,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 8055.40576171875,
+ 11685775.0,
+ 11977584.0,
+ 12159594.0,
+ 12182165.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008769903797656298,
+ 0.0007059753406792879,
+ 0.0007058423361741006,
+ 0.0007060715579427779,
+ 0.0007060769130475819
+ ],
+ "gamma_dfa": 0.02765239030122757,
+ "gamma_dfa_per_layer": [
+ 0.2855387032032013,
+ -0.07872132211923599,
+ -0.051525406539440155,
+ -0.04468241333961487
+ ],
+ "acc_eval": 0.3115234375,
+ "loss_eval": 736.9282836914062,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 8050.93310546875,
+ 11685670.0,
+ 11977453.0,
+ 12159452.0,
+ 12182004.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008705379441380501,
+ 0.0007085780380293727,
+ 0.0007085860124789178,
+ 0.0007086164550855756,
+ 0.0007086091791279614
+ ],
+ "gamma_dfa": 0.026861276477575302,
+ "gamma_dfa_per_layer": [
+ 0.2898082733154297,
+ -0.07899712026119232,
+ -0.046087510883808136,
+ -0.05727853626012802
+ ],
+ "acc_eval": 0.302734375,
+ "loss_eval": 737.6731567382812,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 8048.384765625,
+ 11685821.0,
+ 11977554.0,
+ 12159347.0,
+ 12182068.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008696588920429349,
+ 0.0007085675024427474,
+ 0.0007085754186846316,
+ 0.0007086056284606457,
+ 0.0007085986435413361
+ ],
+ "gamma_dfa": 0.02852465771138668,
+ "gamma_dfa_per_layer": [
+ 0.2933640480041504,
+ -0.07862062007188797,
+ -0.04777185618877411,
+ -0.05287294089794159
+ ],
+ "acc_eval": 0.30859375,
+ "loss_eval": 716.3431396484375,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 8047.294921875,
+ 11685550.0,
+ 11977281.0,
+ 12159072.0,
+ 12181796.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000868224713485688,
+ 0.0007059023482725024,
+ 0.0007057614857330918,
+ 0.0007060033385641873,
+ 0.0007060095085762441
+ ],
+ "gamma_dfa": 0.026804575696587563,
+ "gamma_dfa_per_layer": [
+ 0.2827316224575043,
+ -0.07767541706562042,
+ -0.051301658153533936,
+ -0.046536244451999664
+ ],
+ "acc_eval": 0.32421875,
+ "loss_eval": 693.041259765625,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 8047.01025390625,
+ 11685479.0,
+ 11977214.0,
+ 12159006.0,
+ 12181733.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008688519592396915,
+ 0.0007085604593157768,
+ 0.0007085682009346783,
+ 0.0007085984107106924,
+ 0.0007085916586220264
+ ],
+ "gamma_dfa": 0.027284779585897923,
+ "gamma_dfa_per_layer": [
+ 0.2883991003036499,
+ -0.07865853607654572,
+ -0.04951424151659012,
+ -0.05108720436692238
+ ],
+ "acc_eval": 0.3134765625,
+ "loss_eval": 705.9644775390625,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file
diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s42.json b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json
new file mode 100644
index 0000000..6bf0a61
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json
@@ -0,0 +1,4766 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_no_outln_v1",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 42,
+ "depth": 4,
+ "d_hidden": 256
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "architecture": "ResidualMLP_NoOutLN",
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005561555735766888,
+ 0.0005519049009308219,
+ 0.0005482902633957565,
+ 0.0005436676437966526,
+ 0.000538847001735121
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.1123046875,
+ "loss_eval": 2.3168468475341797,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 39.5714225769043,
+ 36.241031646728516,
+ 34.50772476196289,
+ 33.32059097290039,
+ 33.10130310058594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001264682796318084,
+ 0.00013185068382881582,
+ 0.0001420896005583927,
+ 0.00016605440760031343,
+ 0.0002204339689342305
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4228515625,
+ "loss_eval": 1.6010748147964478,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 52.47050857543945,
+ 48.28652572631836,
+ 45.496219635009766,
+ 43.2078857421875,
+ 41.36874008178711
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010761933663161471,
+ 0.00011420303053455427,
+ 0.00012131234689150006,
+ 0.00013399586896412075,
+ 0.00016239506658166647
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.453125,
+ "loss_eval": 1.4937903881072998,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 62.092323303222656,
+ 56.274635314941406,
+ 52.64373016357422,
+ 49.852622985839844,
+ 46.636131286621094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010067893890663981,
+ 0.00010744533210527152,
+ 0.000112645146145951,
+ 0.00012268377759028226,
+ 0.00014184287283569574
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.46484375,
+ "loss_eval": 1.495908498764038,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 70.92781829833984,
+ 62.570072174072266,
+ 57.76173400878906,
+ 53.9067497253418,
+ 49.468414306640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.065420454135165e-05,
+ 9.659545321483165e-05,
+ 0.00010056291648652405,
+ 0.00010604548879200593,
+ 0.0001232008944498375
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5048828125,
+ "loss_eval": 1.4103548526763916,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 77.77008056640625,
+ 68.82622528076172,
+ 62.881927490234375,
+ 57.43979263305664,
+ 52.381675720214844
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.967184840003029e-05,
+ 9.561960905557498e-05,
+ 9.984008647734299e-05,
+ 0.0001043190059135668,
+ 0.00011724776413757354
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5009765625,
+ "loss_eval": 1.3900126218795776,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 84.3420639038086,
+ 73.14466094970703,
+ 66.25099182128906,
+ 60.290985107421875,
+ 54.196815490722656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.548566984245554e-05,
+ 9.279063669964671e-05,
+ 9.806034358916804e-05,
+ 0.00010389943781774491,
+ 0.00011231016833335161
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.509765625,
+ "loss_eval": 1.3721935749053955,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 91.67733764648438,
+ 79.67963409423828,
+ 70.7928466796875,
+ 63.614192962646484,
+ 56.76249694824219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.422173414146528e-05,
+ 9.07716530491598e-05,
+ 9.6989817393478e-05,
+ 0.00010211832704953849,
+ 0.00011144059681100771
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5166015625,
+ "loss_eval": 1.344391107559204,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 96.60388946533203,
+ 83.8042221069336,
+ 74.53706359863281,
+ 66.99102020263672,
+ 58.020408630371094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.360752690350637e-05,
+ 9.003488958114758e-05,
+ 9.634223533794284e-05,
+ 0.00010073634621221572,
+ 0.00010698751430027187
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5185546875,
+ "loss_eval": 1.3327906131744385,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 101.24382781982422,
+ 87.08720397949219,
+ 76.92607116699219,
+ 68.23351287841797,
+ 59.4285888671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.019094821065664e-05,
+ 8.715572766959667e-05,
+ 9.189714910462499e-05,
+ 9.61213736445643e-05,
+ 0.00010296071559423581
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.533203125,
+ "loss_eval": 1.3403639793395996,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 107.04126739501953,
+ 91.77833557128906,
+ 80.73109436035156,
+ 70.98918914794922,
+ 61.11309051513672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.710429053986445e-05,
+ 8.402510866289958e-05,
+ 8.972393698059022e-05,
+ 9.477136336499825e-05,
+ 9.921709715854377e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5517578125,
+ "loss_eval": 1.3021693229675293,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 111.9730224609375,
+ 94.8844985961914,
+ 83.01356506347656,
+ 72.39442443847656,
+ 61.61451721191406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.266257307492197e-05,
+ 8.069563045864925e-05,
+ 8.615722617832944e-05,
+ 8.979514677776024e-05,
+ 9.45624997257255e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5458984375,
+ "loss_eval": 1.298128604888916,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 116.69439697265625,
+ 99.29745483398438,
+ 84.83220672607422,
+ 72.58226013183594,
+ 61.799560546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.808519876562059e-05,
+ 8.509745384799317e-05,
+ 9.162558853859082e-05,
+ 9.594277798896655e-05,
+ 0.00010088863200508058
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5361328125,
+ "loss_eval": 1.327142596244812,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 118.57154083251953,
+ 100.65165710449219,
+ 86.92396545410156,
+ 75.52800750732422,
+ 63.40058898925781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.507520058425143e-05,
+ 8.161060395650566e-05,
+ 8.807337144389749e-05,
+ 9.307889558840543e-05,
+ 9.839278209256008e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.529296875,
+ "loss_eval": 1.301376223564148,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 123.16495513916016,
+ 104.0947265625,
+ 90.54090118408203,
+ 79.24758911132812,
+ 66.25940704345703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.567028660560027e-05,
+ 8.223088661907241e-05,
+ 8.735521987546235e-05,
+ 9.217277693096548e-05,
+ 9.719380614114925e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615234375,
+ "loss_eval": 1.2765182256698608,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 126.89250946044922,
+ 107.54840087890625,
+ 93.0474853515625,
+ 79.41374206542969,
+ 66.3965835571289
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.546511915279552e-05,
+ 8.2636863226071e-05,
+ 8.891599281923845e-05,
+ 9.294570190832019e-05,
+ 9.809954644879326e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.51953125,
+ "loss_eval": 1.300541877746582,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 130.00201416015625,
+ 110.14152526855469,
+ 95.71183776855469,
+ 81.57356262207031,
+ 68.07804107666016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.271749927895144e-05,
+ 7.90783524280414e-05,
+ 8.341569628100842e-05,
+ 8.888234879123047e-05,
+ 9.289903391618282e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.55859375,
+ "loss_eval": 1.253805160522461,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 132.4821014404297,
+ 112.55132293701172,
+ 96.15247344970703,
+ 82.20439147949219,
+ 67.68408203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.47043450246565e-05,
+ 8.161538426065817e-05,
+ 8.696810255059972e-05,
+ 9.05536362552084e-05,
+ 9.490203956374899e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5634765625,
+ "loss_eval": 1.2818918228149414,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 136.31614685058594,
+ 116.76542663574219,
+ 100.04906463623047,
+ 85.71382141113281,
+ 70.02954864501953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.14207926648669e-05,
+ 7.859354082029313e-05,
+ 8.420498488703743e-05,
+ 8.882852853275836e-05,
+ 9.116062574321404e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5595703125,
+ "loss_eval": 1.2435299158096313,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 138.36990356445312,
+ 117.38836669921875,
+ 101.75880432128906,
+ 86.79072570800781,
+ 70.66394805908203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.72569328546524e-05,
+ 8.451085159322247e-05,
+ 8.929366595111787e-05,
+ 9.467442578170449e-05,
+ 9.868820779956877e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.53515625,
+ "loss_eval": 1.3142390251159668,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 140.71449279785156,
+ 119.23265838623047,
+ 101.22541809082031,
+ 85.75491333007812,
+ 69.77205657958984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.5247859058436e-05,
+ 8.147219341481104e-05,
+ 8.72978416737169e-05,
+ 9.33377887122333e-05,
+ 9.715931082610041e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.548828125,
+ "loss_eval": 1.26747465133667,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 143.37794494628906,
+ 121.56777954101562,
+ 105.97654724121094,
+ 90.9666748046875,
+ 72.01183319091797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.179555541370064e-05,
+ 7.918629125924781e-05,
+ 8.409017755184323e-05,
+ 8.838798385113478e-05,
+ 9.469009819440544e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.564453125,
+ "loss_eval": 1.2752306461334229,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 144.44107055664062,
+ 122.94657135009766,
+ 106.18299102783203,
+ 89.72506713867188,
+ 71.56814575195312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.250273483805358e-05,
+ 7.833781273802742e-05,
+ 8.349631389137357e-05,
+ 8.67474009282887e-05,
+ 8.975700620794669e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.214519739151001,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 145.68658447265625,
+ 123.7938232421875,
+ 107.63272857666016,
+ 91.90914154052734,
+ 72.97653198242188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.909506919328123e-05,
+ 7.67810779507272e-05,
+ 8.248597441706806e-05,
+ 8.500050898874179e-05,
+ 8.80209991009906e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.578125,
+ "loss_eval": 1.2490482330322266,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 149.15159606933594,
+ 125.77446746826172,
+ 106.84111022949219,
+ 90.89909362792969,
+ 72.29488372802734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.051522698020563e-05,
+ 7.787953654769808e-05,
+ 8.355934551218525e-05,
+ 8.837382483761758e-05,
+ 9.125470387516543e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5634765625,
+ "loss_eval": 1.2157257795333862,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 149.9364776611328,
+ 126.3508529663086,
+ 107.00386047363281,
+ 89.69956970214844,
+ 70.79742431640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.40521791158244e-05,
+ 8.231549145421013e-05,
+ 8.598146814620122e-05,
+ 9.036294795805588e-05,
+ 9.211329597746953e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5546875,
+ "loss_eval": 1.2515935897827148,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 152.33641052246094,
+ 127.60247039794922,
+ 109.31637573242188,
+ 91.78147888183594,
+ 71.85491180419922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.096086483215913e-05,
+ 7.774732512189075e-05,
+ 8.330845594173297e-05,
+ 8.756548049859703e-05,
+ 9.018366108648479e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5791015625,
+ "loss_eval": 1.234102487564087,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 154.90924072265625,
+ 129.49365234375,
+ 111.0758285522461,
+ 94.2232666015625,
+ 73.4395523071289
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.217184611363336e-05,
+ 7.90508056525141e-05,
+ 8.487315790262073e-05,
+ 9.130351099884138e-05,
+ 9.386075544171035e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5693359375,
+ "loss_eval": 1.2473926544189453,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 155.88226318359375,
+ 130.6912384033203,
+ 111.4398193359375,
+ 93.5534896850586,
+ 73.1227035522461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.115830521797761e-05,
+ 7.749604992568493e-05,
+ 8.24403905426152e-05,
+ 8.617334970040247e-05,
+ 8.857186185196042e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5625,
+ "loss_eval": 1.232407569885254,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 155.35606384277344,
+ 131.03033447265625,
+ 112.69044494628906,
+ 95.1001968383789,
+ 74.01049041748047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.353001274168491e-05,
+ 8.054459613049403e-05,
+ 8.64928078954108e-05,
+ 8.998846897156909e-05,
+ 9.453124948777258e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.2427477836608887,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 157.87423706054688,
+ 132.91993713378906,
+ 114.23269653320312,
+ 96.04922485351562,
+ 74.40912628173828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.218361861305311e-05,
+ 8.000781963346526e-05,
+ 8.621480083093047e-05,
+ 9.079690062208101e-05,
+ 9.179109474644065e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.572265625,
+ "loss_eval": 1.2170917987823486,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 159.94407653808594,
+ 134.98342895507812,
+ 116.59188842773438,
+ 96.52700805664062,
+ 74.13409423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.996722368057817e-05,
+ 7.723316957708448e-05,
+ 8.291137055493891e-05,
+ 8.800445357337594e-05,
+ 8.874708146322519e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1662731170654297,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 159.40000915527344,
+ 134.68307495117188,
+ 115.32740783691406,
+ 95.89759826660156,
+ 73.79962158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.17860457370989e-05,
+ 7.931615255074576e-05,
+ 8.509325562044978e-05,
+ 8.835212793201208e-05,
+ 9.002821025205776e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5732421875,
+ "loss_eval": 1.1779483556747437,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 160.3310089111328,
+ 135.494140625,
+ 116.1007308959961,
+ 96.30546569824219,
+ 74.54843139648438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.925644993316382e-05,
+ 7.548897701781243e-05,
+ 8.256838918896392e-05,
+ 8.621955930721015e-05,
+ 8.84741239133291e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1561952829360962,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 161.94854736328125,
+ 135.6446075439453,
+ 116.58970642089844,
+ 96.99983978271484,
+ 74.31636810302734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.260960410349071e-05,
+ 8.003232505870983e-05,
+ 8.696899749338627e-05,
+ 9.040992881637067e-05,
+ 9.149286051979288e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5810546875,
+ "loss_eval": 1.1946098804473877,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 163.52120971679688,
+ 138.41390991210938,
+ 118.427490234375,
+ 98.19206237792969,
+ 75.36811828613281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.831327482359484e-05,
+ 7.447604730259627e-05,
+ 7.990537415025756e-05,
+ 8.471667388221249e-05,
+ 8.780926145846024e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.184380054473877,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 164.48324584960938,
+ 138.1424102783203,
+ 118.34252166748047,
+ 98.4327621459961,
+ 75.36869049072266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.150783494580537e-05,
+ 7.926567923277617e-05,
+ 8.36653562146239e-05,
+ 8.762039215071127e-05,
+ 8.95786433829926e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.2110118865966797,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 164.0553741455078,
+ 138.08517456054688,
+ 118.49005126953125,
+ 98.67227172851562,
+ 74.64473724365234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.029619155218825e-05,
+ 7.684711454203352e-05,
+ 8.26816976768896e-05,
+ 8.846465789247304e-05,
+ 9.003532613860443e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5908203125,
+ "loss_eval": 1.1644396781921387,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 165.32000732421875,
+ 138.64366149902344,
+ 119.2437515258789,
+ 99.25880432128906,
+ 75.45353698730469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.045984239084646e-05,
+ 7.836698205210268e-05,
+ 8.392294694203883e-05,
+ 8.778785559115931e-05,
+ 8.954900113167241e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5810546875,
+ "loss_eval": 1.18137526512146,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 164.7397918701172,
+ 138.3001251220703,
+ 117.6864242553711,
+ 97.29838562011719,
+ 73.79444122314453
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.162813562899828e-05,
+ 7.83513969508931e-05,
+ 8.275063009932637e-05,
+ 8.855803025653586e-05,
+ 8.704853098606691e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.583984375,
+ "loss_eval": 1.1727752685546875,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 166.1660919189453,
+ 138.93536376953125,
+ 118.51292419433594,
+ 97.88706970214844,
+ 75.51615905761719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.430704863509163e-05,
+ 8.242860349128023e-05,
+ 8.74657926033251e-05,
+ 9.10981761990115e-05,
+ 9.303457773057744e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.1664979457855225,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 167.8816375732422,
+ 140.1188201904297,
+ 119.77051544189453,
+ 99.83518981933594,
+ 75.69395446777344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.187369919847697e-05,
+ 7.945671677589417e-05,
+ 8.597246051067486e-05,
+ 8.931689808377996e-05,
+ 8.963213622337207e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.587890625,
+ "loss_eval": 1.19194757938385,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 168.21185302734375,
+ 141.76817321777344,
+ 121.40872192382812,
+ 100.61127471923828,
+ 76.76028442382812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.174632628448308e-05,
+ 7.968613499542698e-05,
+ 8.514403452863917e-05,
+ 8.922909910324961e-05,
+ 9.091905667446554e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1679599285125732,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 167.2344207763672,
+ 140.6108856201172,
+ 120.0829849243164,
+ 99.8038330078125,
+ 76.13324737548828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.436795567627996e-05,
+ 8.090144547168165e-05,
+ 8.729894761927426e-05,
+ 9.00863014976494e-05,
+ 8.991207869257778e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.595703125,
+ "loss_eval": 1.1705546379089355,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 167.59393310546875,
+ 140.7035369873047,
+ 120.24620056152344,
+ 99.91508483886719,
+ 75.96212005615234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.446305971825495e-05,
+ 8.234894630732015e-05,
+ 8.821392111713067e-05,
+ 9.209391282638535e-05,
+ 9.261125524062663e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5791015625,
+ "loss_eval": 1.1846892833709717,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 168.69448852539062,
+ 141.26541137695312,
+ 121.04974365234375,
+ 100.46004486083984,
+ 75.70881652832031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.222096610348672e-05,
+ 7.875960727687925e-05,
+ 8.227298530982807e-05,
+ 8.841860108077526e-05,
+ 9.022892481880262e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1577212810516357,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 169.7440185546875,
+ 142.39825439453125,
+ 121.89653778076172,
+ 100.77093505859375,
+ 76.56221008300781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.555038610007614e-05,
+ 8.296242594951764e-05,
+ 9.037082054419443e-05,
+ 9.527869406156242e-05,
+ 9.701496310299262e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5908203125,
+ "loss_eval": 1.1768805980682373,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 167.24928283691406,
+ 140.36639404296875,
+ 119.20468139648438,
+ 99.04094696044922,
+ 75.62102508544922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.741156878182665e-05,
+ 8.454316412098706e-05,
+ 9.005220636026934e-05,
+ 9.321123798144981e-05,
+ 9.260981460101902e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5908203125,
+ "loss_eval": 1.166186809539795,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 170.72845458984375,
+ 142.466796875,
+ 120.5933837890625,
+ 100.26793670654297,
+ 76.15065002441406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.659869879717007e-05,
+ 8.334196172654629e-05,
+ 9.012148075271398e-05,
+ 9.564686479279771e-05,
+ 9.513212717138231e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1720219850540161,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 169.83580017089844,
+ 141.82705688476562,
+ 121.11093139648438,
+ 100.64865112304688,
+ 76.17137145996094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.593600457767025e-05,
+ 8.458431693725288e-05,
+ 9.001771832117811e-05,
+ 9.566119115334004e-05,
+ 9.762388071976602e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.184555172920227,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 168.68116760253906,
+ 141.1621856689453,
+ 119.57838439941406,
+ 98.55834197998047,
+ 75.13648223876953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.207417704397812e-05,
+ 9.170681732939556e-05,
+ 9.716026397654787e-05,
+ 0.0001007765022222884,
+ 0.0001005034864647314
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5810546875,
+ "loss_eval": 1.1981369256973267,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 171.0980682373047,
+ 143.56202697753906,
+ 121.67494201660156,
+ 101.36307525634766,
+ 76.57723999023438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.634361099917442e-05,
+ 8.294743747683242e-05,
+ 8.85644112713635e-05,
+ 9.305671119363979e-05,
+ 9.303687693318352e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.1646153926849365,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 170.58717346191406,
+ 143.18809509277344,
+ 120.9772720336914,
+ 100.8180923461914,
+ 77.12872314453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.599191303597763e-05,
+ 8.41239161673002e-05,
+ 8.960344712249935e-05,
+ 9.63989004958421e-05,
+ 9.756541112437844e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.1623225212097168,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 169.49244689941406,
+ 142.66770935058594,
+ 122.00574493408203,
+ 101.84593963623047,
+ 77.40425109863281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.701734284637496e-05,
+ 8.374643221031874e-05,
+ 9.025474719237536e-05,
+ 9.504661284154281e-05,
+ 9.925573249347508e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59765625,
+ "loss_eval": 1.1574187278747559,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 169.3027801513672,
+ 143.11941528320312,
+ 120.9614486694336,
+ 101.5257797241211,
+ 77.17151641845703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.559885852970183e-05,
+ 8.217129652621225e-05,
+ 8.892706682672724e-05,
+ 9.235734614776447e-05,
+ 9.276533091906458e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.149141788482666,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 168.70281982421875,
+ 141.82730102539062,
+ 120.2729263305664,
+ 99.75395965576172,
+ 76.92571258544922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.91895727161318e-05,
+ 8.787367551121861e-05,
+ 9.60014876909554e-05,
+ 0.0001018140246742405,
+ 9.86503655440174e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6005859375,
+ "loss_eval": 1.1657415628433228,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 169.94361877441406,
+ 142.49684143066406,
+ 120.18767547607422,
+ 100.32206726074219,
+ 76.59700012207031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.673597428947687e-05,
+ 8.517439709976315e-05,
+ 9.201091597788036e-05,
+ 9.491065429756418e-05,
+ 9.497139399172738e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.170656442642212,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 168.98934936523438,
+ 142.45361328125,
+ 120.9234848022461,
+ 101.12970733642578,
+ 76.8805160522461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.979186193551868e-05,
+ 8.849770529195666e-05,
+ 9.661864896770567e-05,
+ 0.00010212804772891104,
+ 9.96212984318845e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59375,
+ "loss_eval": 1.153792142868042,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 169.1288604736328,
+ 141.414306640625,
+ 119.56535339355469,
+ 99.89313507080078,
+ 76.44340515136719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.042863919399679e-05,
+ 8.848145080264658e-05,
+ 9.505209163762629e-05,
+ 0.00010096383630298078,
+ 9.844720625551417e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1363590955734253,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 167.93479919433594,
+ 140.53518676757812,
+ 118.76004028320312,
+ 99.56035614013672,
+ 76.20387268066406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.038699888857082e-05,
+ 8.754427108215168e-05,
+ 9.549371316097677e-05,
+ 0.00010098952043335885,
+ 0.0001008743784041144
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.1666439771652222,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 168.28646850585938,
+ 140.67718505859375,
+ 118.55599975585938,
+ 98.98268127441406,
+ 75.81230163574219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.297240128740668e-05,
+ 8.875853382050991e-05,
+ 9.902577585307881e-05,
+ 0.00010285823373124003,
+ 0.00010488184489076957
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1589187383651733,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 168.05776977539062,
+ 140.5435791015625,
+ 119.5470962524414,
+ 99.72227478027344,
+ 76.00287628173828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.011830504983664e-05,
+ 8.830082515487447e-05,
+ 9.65106810326688e-05,
+ 0.00010251552885165438,
+ 0.00010001847840612754
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.157954216003418,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 168.4709014892578,
+ 140.92843627929688,
+ 119.31693267822266,
+ 98.76548767089844,
+ 75.95777893066406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.56209808262065e-05,
+ 9.390609193360433e-05,
+ 0.00010086362453876063,
+ 0.00010554264736128971,
+ 0.00010187114821746945
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.147390365600586,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 167.48707580566406,
+ 139.8479766845703,
+ 118.25393676757812,
+ 99.32323455810547,
+ 75.72100830078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.738139877095819e-05,
+ 9.79254036792554e-05,
+ 0.00010459231998538598,
+ 0.00011052342597395182,
+ 0.00010695838136598468
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5966796875,
+ "loss_eval": 1.1785132884979248,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 167.5928955078125,
+ 140.20948791503906,
+ 118.63544464111328,
+ 99.02739715576172,
+ 75.8176040649414
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.539798727724701e-05,
+ 9.423612937098369e-05,
+ 0.00010523338278289884,
+ 0.00010897681931965053,
+ 0.00010739201388787478
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.60546875,
+ "loss_eval": 1.1509130001068115,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 167.19003295898438,
+ 138.91221618652344,
+ 117.57588195800781,
+ 98.43026733398438,
+ 75.48680114746094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.238407463068143e-05,
+ 9.25329077290371e-05,
+ 0.00010089747956953943,
+ 0.00010575826308922842,
+ 0.00010581395326880738
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.151381254196167,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 165.7104034423828,
+ 138.99298095703125,
+ 117.33794403076172,
+ 98.08374786376953,
+ 75.52032470703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.850001177052036e-05,
+ 9.699742804514244e-05,
+ 0.00010492365981917828,
+ 0.00011017896758858114,
+ 0.00010667099559213966
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.151253581047058,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 165.87271118164062,
+ 138.727783203125,
+ 118.21571350097656,
+ 97.76729583740234,
+ 75.68400573730469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.00067898328416e-05,
+ 9.841559221968055e-05,
+ 0.00010505259706405923,
+ 0.00010942742665065452,
+ 0.00010504219244467095
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.60546875,
+ "loss_eval": 1.1535770893096924,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 165.17666625976562,
+ 138.45004272460938,
+ 117.10303497314453,
+ 97.36707305908203,
+ 75.38941192626953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.911191252991557e-05,
+ 9.853249503066763e-05,
+ 0.00010691725765354931,
+ 0.00011312783317407593,
+ 0.0001101552988984622
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59765625,
+ "loss_eval": 1.1582581996917725,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 165.94325256347656,
+ 138.6524200439453,
+ 117.50881958007812,
+ 97.7616958618164,
+ 75.20433807373047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.616734703537077e-05,
+ 9.347109880764037e-05,
+ 0.00010103159002028406,
+ 0.00010616267536533996,
+ 0.00010419132013339549
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1453883647918701,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 165.7154541015625,
+ 138.506591796875,
+ 117.28874206542969,
+ 97.05110168457031,
+ 75.29759979248047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.980780694400892e-05,
+ 9.973136184271425e-05,
+ 0.00010883707000175491,
+ 0.00011757094762288034,
+ 0.00011409710714360699
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1474578380584717,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 164.83221435546875,
+ 138.6868133544922,
+ 116.98916625976562,
+ 96.52086639404297,
+ 75.43351745605469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.988294575829059e-05,
+ 9.790070907911286e-05,
+ 0.00010740302968770266,
+ 0.00011267260560998693,
+ 0.0001108170035877265
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.143803358078003,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 164.63592529296875,
+ 137.5937042236328,
+ 116.08668518066406,
+ 96.16253662109375,
+ 74.92699432373047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.160200715996325e-05,
+ 0.00010001687769545242,
+ 0.00010771892993943766,
+ 0.00011699824244715273,
+ 0.00011338551848893985
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1410948038101196,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 164.91123962402344,
+ 137.8173828125,
+ 116.79219818115234,
+ 96.76990509033203,
+ 74.76392364501953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.93947362783365e-05,
+ 9.948704246198758e-05,
+ 0.00010810969251906499,
+ 0.00011499693209771067,
+ 0.0001114657279686071
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.1341216564178467,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 164.64288330078125,
+ 137.3013153076172,
+ 116.4471206665039,
+ 96.7668228149414,
+ 74.69876861572266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.85727204149589e-05,
+ 9.913302346831188e-05,
+ 0.00011003073450410739,
+ 0.00011727867240551859,
+ 0.00011272053234279156
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1379802227020264,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 163.62106323242188,
+ 137.2855682373047,
+ 115.62771606445312,
+ 95.8958969116211,
+ 74.53977966308594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.984863961813971e-05,
+ 9.98539908323437e-05,
+ 0.00010817578731803223,
+ 0.00011364965030224994,
+ 0.00011257777805440128
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.130206823348999,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 164.09976196289062,
+ 137.23387145996094,
+ 116.05545043945312,
+ 96.66761016845703,
+ 75.32057189941406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.984812302514911e-05,
+ 9.734687773743644e-05,
+ 0.00010578137880656868,
+ 0.00011179807916050777,
+ 0.0001108815340558067
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1422557830810547,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 162.94369506835938,
+ 136.59678649902344,
+ 115.43162536621094,
+ 95.96286010742188,
+ 74.39228057861328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.308777953265235e-05,
+ 0.00010392161493655294,
+ 0.00011047742736991495,
+ 0.00011820423969766125,
+ 0.00011209066724404693
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1316850185394287,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 163.14993286132812,
+ 136.48724365234375,
+ 115.7430648803711,
+ 96.20491790771484,
+ 74.71761322021484
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.024026803672314e-05,
+ 0.00010025065421359614,
+ 0.00011008324509020895,
+ 0.00011521186388563365,
+ 0.00011174430255778134
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.1380174160003662,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 163.56654357910156,
+ 136.04368591308594,
+ 114.58287048339844,
+ 95.99482727050781,
+ 74.26864624023438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.700806549517438e-05,
+ 0.0001051941653713584,
+ 0.00011597082630032673,
+ 0.0001224641309818253,
+ 0.00011469785385997966
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.1528915166854858,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 162.7240753173828,
+ 135.9139862060547,
+ 114.86207580566406,
+ 95.29146575927734,
+ 74.25565338134766
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.666816185927019e-05,
+ 0.0001055657266988419,
+ 0.00011615711264312267,
+ 0.00012476630217861384,
+ 0.00011797657498391345
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.1539390087127686,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 162.158203125,
+ 135.1398468017578,
+ 114.53036499023438,
+ 94.93306732177734,
+ 73.95748901367188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.333287016488612e-05,
+ 0.0001032597865560092,
+ 0.00011410381557652727,
+ 0.00012122129555791616,
+ 0.00011711813567671925
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1506534814834595,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 162.415283203125,
+ 135.51370239257812,
+ 114.56376647949219,
+ 94.92838287353516,
+ 74.06205749511719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.082158794626594e-05,
+ 0.00010185714199906215,
+ 0.00011048805754398927,
+ 0.00011587562767090276,
+ 0.0001120776214520447
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1497812271118164,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 161.77337646484375,
+ 135.19717407226562,
+ 114.20987701416016,
+ 94.77679443359375,
+ 73.99730682373047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.745426359586418e-05,
+ 0.00010718397970777005,
+ 0.00011704466305673122,
+ 0.00012522070028353482,
+ 0.00012164646614110097
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.155759572982788,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 161.48892211914062,
+ 135.2348175048828,
+ 114.12451171875,
+ 94.8083267211914,
+ 73.4517822265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.549259266350418e-05,
+ 0.00010579569061519578,
+ 0.00011430429003667086,
+ 0.00012098137813154608,
+ 0.00011664297198876739
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.15834379196167,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 161.6995849609375,
+ 135.2989959716797,
+ 114.2784194946289,
+ 94.69004821777344,
+ 73.529541015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.579937614034861e-05,
+ 0.00010731106885941699,
+ 0.00011613505921559408,
+ 0.00012203569349367172,
+ 0.00011712868581525981
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1583144664764404,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 161.00369262695312,
+ 134.7657012939453,
+ 114.10606384277344,
+ 94.362060546875,
+ 73.65673065185547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.818092075875029e-05,
+ 0.00010859747999347746,
+ 0.00011724254727596417,
+ 0.00012138402962591499,
+ 0.00011800935317296535
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1536951065063477,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 161.0053253173828,
+ 134.59410095214844,
+ 113.69575500488281,
+ 94.29032135009766,
+ 73.46531677246094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.722611866891384e-05,
+ 0.00010765776823973283,
+ 0.0001188350870506838,
+ 0.00012322816473897547,
+ 0.00011940464901272207
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.15749192237854,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 161.33126831054688,
+ 134.94166564941406,
+ 113.90135955810547,
+ 94.50862884521484,
+ 73.39297485351562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.938049333868548e-05,
+ 0.0001076548287528567,
+ 0.00011934098438359797,
+ 0.00012375488586258143,
+ 0.00011877582437591627
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.157106637954712,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 161.05789184570312,
+ 134.59825134277344,
+ 113.87554931640625,
+ 94.37042999267578,
+ 73.5987548828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.70072578638792e-05,
+ 0.00010533058957662433,
+ 0.00011765053932322189,
+ 0.00012162782513769343,
+ 0.00012223162048030645
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.1565823554992676,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 160.39405822753906,
+ 134.43434143066406,
+ 113.540283203125,
+ 94.05237579345703,
+ 73.39077758789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.608148684492335e-05,
+ 0.00010612589539960027,
+ 0.00011680866009555757,
+ 0.00012219352356623858,
+ 0.00011590561916818842
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.1539617776870728,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 160.60440063476562,
+ 134.6214141845703,
+ 113.45699310302734,
+ 93.85929870605469,
+ 73.18849182128906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.81277771643363e-05,
+ 0.00010970587754854932,
+ 0.00011871931201312691,
+ 0.00012303274706937373,
+ 0.00011832414020318538
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1519787311553955,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 160.69932556152344,
+ 134.37420654296875,
+ 113.30387115478516,
+ 93.87930297851562,
+ 73.2369384765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.748790762387216e-05,
+ 0.00010789754742290825,
+ 0.00011884274135809392,
+ 0.00012259349750820547,
+ 0.00012160756887169555
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1536774635314941,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 160.83596801757812,
+ 134.3319854736328,
+ 113.4552230834961,
+ 94.0063705444336,
+ 73.16248321533203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.70613255049102e-05,
+ 0.00010844107600860298,
+ 0.0001184809225378558,
+ 0.00012342457193881273,
+ 0.00011970168998232111
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.152658462524414,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 160.8366241455078,
+ 134.48265075683594,
+ 113.25139617919922,
+ 93.83488464355469,
+ 73.08296203613281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.66933585004881e-05,
+ 0.00010815998393809423,
+ 0.00011774426093325019,
+ 0.0001224545994773507,
+ 0.00011890953464899212
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1551861763000488,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 160.7191162109375,
+ 134.44659423828125,
+ 113.33219146728516,
+ 93.93790435791016,
+ 73.0753402709961
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.675837645772845e-05,
+ 0.00010675707017071545,
+ 0.00011643637844827026,
+ 0.00012197842443129048,
+ 0.0001190306429634802
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.15492582321167,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 160.51898193359375,
+ 134.29307556152344,
+ 113.27383422851562,
+ 94.04198455810547,
+ 73.003662109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.737682557897642e-05,
+ 0.00010710594506235793,
+ 0.00011601457663346082,
+ 0.0001232696376973763,
+ 0.0001181336774607189
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1535921096801758,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 160.5992431640625,
+ 134.43368530273438,
+ 113.30790710449219,
+ 94.0107192993164,
+ 73.01823425292969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.668481652624905e-05,
+ 0.00010705058230087161,
+ 0.0001163838169304654,
+ 0.0001232351060025394,
+ 0.00011791065480792895
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1539404392242432,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 160.6013946533203,
+ 134.46824645996094,
+ 113.25690460205078,
+ 93.99237060546875,
+ 73.00788879394531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.74524809862487e-05,
+ 0.00010689684131648391,
+ 0.00011608003114815801,
+ 0.00012245487596374005,
+ 0.00011877176439156756
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1537361145019531,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 160.6110076904297,
+ 134.44720458984375,
+ 113.29548645019531,
+ 93.96721649169922,
+ 72.96358489990234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.775274520507082e-05,
+ 0.00010722322622314095,
+ 0.00011578563862713054,
+ 0.00012414308730512857,
+ 0.00011851716408273205
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1537935733795166,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 160.61090087890625,
+ 134.45262145996094,
+ 113.2977066040039,
+ 93.9543685913086,
+ 72.96540069580078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.751630568644032e-05,
+ 0.00010700579878175631,
+ 0.00011575232201721519,
+ 0.0001240932324435562,
+ 0.00011847950372612104
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.153747320175171,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005561555735766888,
+ 0.0005519049009308219,
+ 0.0005482902633957565,
+ 0.0005436676437966526,
+ 0.000538847001735121
+ ],
+ "gamma_dfa": 0.008468771702609956,
+ "gamma_dfa_per_layer": [
+ 0.0002397641073912382,
+ 0.021293632686138153,
+ -0.0031478723976761103,
+ 0.015489562414586544
+ ],
+ "acc_eval": 0.1123046875,
+ "loss_eval": 2.3168468475341797,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 481.5912780761719,
+ 951.0988159179688,
+ 1076.1094970703125,
+ 1320.2431640625,
+ 1560.1331787109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006860869470983744,
+ 0.000686013896483928,
+ 0.0006859428831376135,
+ 0.0006858126726001501,
+ 0.0006857643602415919
+ ],
+ "gamma_dfa": 0.008383387292269617,
+ "gamma_dfa_per_layer": [
+ 0.030579306185245514,
+ 0.012463560327887535,
+ -0.009617818519473076,
+ 0.00010850117541849613
+ ],
+ "acc_eval": 0.1494140625,
+ "loss_eval": 6.441287040710449,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 803.455322265625,
+ 1877.8646240234375,
+ 2352.25390625,
+ 2999.778564453125,
+ 3690.3037109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007094781612977386,
+ 0.0007074660388752818,
+ 0.0007073783199302852,
+ 0.0007076358306221664,
+ 0.0007076164474710822
+ ],
+ "gamma_dfa": -0.002415801805909723,
+ "gamma_dfa_per_layer": [
+ 0.04413381963968277,
+ -0.0021541656460613012,
+ -0.028202872723340988,
+ -0.023439988493919373
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 9.331591606140137,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1023.6770629882812,
+ 2787.596923828125,
+ 3518.2734375,
+ 4732.96337890625,
+ 6139.98486328125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007535111508332193,
+ 0.00075019511859864,
+ 0.0007504230597987771,
+ 0.0007509100250899792,
+ 0.0007509145070798695
+ ],
+ "gamma_dfa": -0.004518487432505935,
+ "gamma_dfa_per_layer": [
+ 0.049626171588897705,
+ -0.0017164160963147879,
+ -0.029111474752426147,
+ -0.03687223047018051
+ ],
+ "acc_eval": 0.1943359375,
+ "loss_eval": 33.82752990722656,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1163.0250244140625,
+ 3340.40087890625,
+ 4668.20654296875,
+ 6551.25927734375,
+ 8839.166015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007571951719000936,
+ 0.0007542021339759231,
+ 0.0007538797217421234,
+ 0.0007539798971265554,
+ 0.0007538445643149316
+ ],
+ "gamma_dfa": -0.0057786391116678715,
+ "gamma_dfa_per_layer": [
+ 0.06502002477645874,
+ -0.02495962381362915,
+ -0.035328082740306854,
+ -0.02784687466919422
+ ],
+ "acc_eval": 0.1875,
+ "loss_eval": 50.81904983520508,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1288.871337890625,
+ 3822.7880859375,
+ 5365.59130859375,
+ 7605.025390625,
+ 10502.0478515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007548240246251225,
+ 0.0007521823281422257,
+ 0.0007521542138420045,
+ 0.00075240881415084,
+ 0.0007523542735725641
+ ],
+ "gamma_dfa": -0.006262022419832647,
+ "gamma_dfa_per_layer": [
+ 0.0670417994260788,
+ -0.00757558410987258,
+ -0.044654928147792816,
+ -0.03985937684774399
+ ],
+ "acc_eval": 0.1748046875,
+ "loss_eval": 41.77630615234375,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1393.3045654296875,
+ 4566.75341796875,
+ 6398.4619140625,
+ 9144.8193359375,
+ 12855.005859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007480952190235257,
+ 0.0007420883048325777,
+ 0.0007418331224471331,
+ 0.0007423029164783657,
+ 0.0007423472707159817
+ ],
+ "gamma_dfa": -0.012987596448510885,
+ "gamma_dfa_per_layer": [
+ 0.07368794828653336,
+ -0.022242246195673943,
+ -0.04769526422023773,
+ -0.05570082366466522
+ ],
+ "acc_eval": 0.2255859375,
+ "loss_eval": 34.67824172973633,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 1492.14599609375,
+ 4914.71142578125,
+ 7309.0888671875,
+ 10380.2900390625,
+ 14994.3798828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007586176507174969,
+ 0.0007474496378563344,
+ 0.0007472135475836694,
+ 0.0007474484154954553,
+ 0.0007475449237972498
+ ],
+ "gamma_dfa": -0.009481166722252965,
+ "gamma_dfa_per_layer": [
+ 0.07966121286153793,
+ -0.014550731517374516,
+ -0.05317254737019539,
+ -0.04986260086297989
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 47.53326416015625,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 1561.8521728515625,
+ 5346.5771484375,
+ 8036.01171875,
+ 11400.638671875,
+ 16846.158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007513429154641926,
+ 0.000743337906897068,
+ 0.0007433209684677422,
+ 0.0007435117149725556,
+ 0.0007433460559695959
+ ],
+ "gamma_dfa": -0.020332499407231808,
+ "gamma_dfa_per_layer": [
+ 0.07914174348115921,
+ -0.03499722480773926,
+ -0.0528150238096714,
+ -0.07265949249267578
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 44.3652458190918,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 1634.708740234375,
+ 5771.3779296875,
+ 9056.50390625,
+ 14017.43359375,
+ 18666.166015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007612781482748687,
+ 0.000746309058740735,
+ 0.0007445007795467973,
+ 0.000742616830393672,
+ 0.000742737902328372
+ ],
+ "gamma_dfa": -0.02017525304108858,
+ "gamma_dfa_per_layer": [
+ 0.07873347401618958,
+ -0.0398627370595932,
+ -0.05772021412849426,
+ -0.061851534992456436
+ ],
+ "acc_eval": 0.1962890625,
+ "loss_eval": 76.75175476074219,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 1703.975830078125,
+ 6538.35400390625,
+ 10825.435546875,
+ 18506.091796875,
+ 22004.94140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007676634704694152,
+ 0.0007641310803592205,
+ 0.0007641207776032388,
+ 0.0007640842813998461,
+ 0.0007641611155122519
+ ],
+ "gamma_dfa": -0.016695345751941204,
+ "gamma_dfa_per_layer": [
+ 0.08918984234333038,
+ -0.029809486120939255,
+ -0.06516598165035248,
+ -0.06099575757980347
+ ],
+ "acc_eval": 0.14453125,
+ "loss_eval": 82.11173248291016,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 1742.7552490234375,
+ 10617.021484375,
+ 14353.39453125,
+ 26320.365234375,
+ 29618.58984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007739505381323397,
+ 0.0007467114483006299,
+ 0.0007445442606694996,
+ 0.0007397353765554726,
+ 0.0007397329318337142
+ ],
+ "gamma_dfa": -0.01567553821951151,
+ "gamma_dfa_per_layer": [
+ 0.08600987493991852,
+ -0.03431041166186333,
+ -0.056060850620269775,
+ -0.05834076553583145
+ ],
+ "acc_eval": 0.1943359375,
+ "loss_eval": 223.91172790527344,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 1824.1932373046875,
+ 15453.6865234375,
+ 18834.18359375,
+ 34960.33984375,
+ 37989.41796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007750834338366985,
+ 0.0007619780953973532,
+ 0.0007621922995895147,
+ 0.0007620578981004655,
+ 0.0007621044642291963
+ ],
+ "gamma_dfa": -0.010786167811602354,
+ "gamma_dfa_per_layer": [
+ 0.12150975316762924,
+ -0.02778821997344494,
+ -0.057943932712078094,
+ -0.07892227172851562
+ ],
+ "acc_eval": 0.2236328125,
+ "loss_eval": 176.59576416015625,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 1874.6923828125,
+ 24413.89453125,
+ 27520.30859375,
+ 49373.3984375,
+ 52416.24609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007790470262989402,
+ 0.0007622907287441194,
+ 0.0007622726843692362,
+ 0.0007622543489560485,
+ 0.0007623030105605721
+ ],
+ "gamma_dfa": -0.014462455175817013,
+ "gamma_dfa_per_layer": [
+ 0.12855470180511475,
+ -0.04145955294370651,
+ -0.05751717463135719,
+ -0.08742779493331909
+ ],
+ "acc_eval": 0.1787109375,
+ "loss_eval": 262.8403625488281,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 1946.8936767578125,
+ 36272.8125,
+ 40333.21875,
+ 69530.5,
+ 73388.2890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008108754991553724,
+ 0.0007635678630322218,
+ 0.0007621092372573912,
+ 0.0007623478886671364,
+ 0.0007624892168678343
+ ],
+ "gamma_dfa": -0.0001736646518111229,
+ "gamma_dfa_per_layer": [
+ 0.17327094078063965,
+ -0.03242593631148338,
+ -0.06580278277397156,
+ -0.0757368803024292
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 413.348876953125,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 2032.87255859375,
+ 51780.58984375,
+ 56919.1484375,
+ 94829.1484375,
+ 100403.8828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008237292058765888,
+ 0.0007614542846567929,
+ 0.0007608170853927732,
+ 0.0007589491433463991,
+ 0.0007590141030959785
+ ],
+ "gamma_dfa": -0.011795124970376492,
+ "gamma_dfa_per_layer": [
+ 0.1382066011428833,
+ -0.05588943883776665,
+ -0.061218664050102234,
+ -0.06827899813652039
+ ],
+ "acc_eval": 0.173828125,
+ "loss_eval": 476.64752197265625,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2114.94287109375,
+ 69492.1875,
+ 75388.1796875,
+ 119789.3125,
+ 127585.7109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000832556514069438,
+ 0.0007537039346061647,
+ 0.000749573518987745,
+ 0.0007496002363041043,
+ 0.0007496204925701022
+ ],
+ "gamma_dfa": 0.0006226245313882828,
+ "gamma_dfa_per_layer": [
+ 0.18075576424598694,
+ -0.03305089473724365,
+ -0.06780679523944855,
+ -0.07740757614374161
+ ],
+ "acc_eval": 0.1982421875,
+ "loss_eval": 537.6473388671875,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2253.870849609375,
+ 95625.234375,
+ 102645.28125,
+ 154236.78125,
+ 164149.109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008362202788703144,
+ 0.0007716236286796629,
+ 0.0007702361326664686,
+ 0.0007688606856390834,
+ 0.0007688601035624743
+ ],
+ "gamma_dfa": 0.0006011892110109329,
+ "gamma_dfa_per_layer": [
+ 0.16114464402198792,
+ -0.029663734138011932,
+ -0.06491248309612274,
+ -0.06416366994380951
+ ],
+ "acc_eval": 0.1640625,
+ "loss_eval": 581.9083251953125,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 2351.805419921875,
+ 125897.7421875,
+ 133955.1875,
+ 192500.78125,
+ 204528.875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009331249166280031,
+ 0.0007676270324736834,
+ 0.000767629942856729,
+ 0.0007676497916691005,
+ 0.0007678864640183747
+ ],
+ "gamma_dfa": 0.0174247776158154,
+ "gamma_dfa_per_layer": [
+ 0.2389061450958252,
+ -0.028650319203734398,
+ -0.08226999640464783,
+ -0.058286719024181366
+ ],
+ "acc_eval": 0.18359375,
+ "loss_eval": 913.2538452148438,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 2513.170166015625,
+ 162182.9375,
+ 171449.59375,
+ 239781.78125,
+ 254673.765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010568156139925122,
+ 0.0007681881543248892,
+ 0.0007537052151747048,
+ 0.0007537882192991674,
+ 0.0007537372293882072
+ ],
+ "gamma_dfa": -0.005793072283267975,
+ "gamma_dfa_per_layer": [
+ 0.16605031490325928,
+ -0.03780411183834076,
+ -0.07320450246334076,
+ -0.07821398973464966
+ ],
+ "acc_eval": 0.16796875,
+ "loss_eval": 1265.55859375,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 2644.6826171875,
+ 207142.84375,
+ 218342.21875,
+ 296423.21875,
+ 314992.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011496657971292734,
+ 0.0007783269393257797,
+ 0.0007782486500218511,
+ 0.0007782430038787425,
+ 0.0007782124448567629
+ ],
+ "gamma_dfa": 0.0026588989421725273,
+ "gamma_dfa_per_layer": [
+ 0.23294636607170105,
+ -0.04264959320425987,
+ -0.083626389503479,
+ -0.09603478759527206
+ ],
+ "acc_eval": 0.20703125,
+ "loss_eval": 1426.623046875,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 2796.434814453125,
+ 252884.71875,
+ 265445.65625,
+ 352069.8125,
+ 373355.1875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001035262132063508,
+ 0.0007528892601840198,
+ 0.0007526214467361569,
+ 0.0007527145207859576,
+ 0.0007528204005211592
+ ],
+ "gamma_dfa": 0.006789525970816612,
+ "gamma_dfa_per_layer": [
+ 0.22278103232383728,
+ -0.04876326024532318,
+ -0.07404369860887527,
+ -0.07281596958637238
+ ],
+ "acc_eval": 0.1640625,
+ "loss_eval": 1487.587158203125,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 2927.763671875,
+ 309847.03125,
+ 323644.75,
+ 419166.875,
+ 443365.71875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010502212680876255,
+ 0.0007627566810697317,
+ 0.0007627056329511106,
+ 0.000762629380915314,
+ 0.0007625716971233487
+ ],
+ "gamma_dfa": 0.02364537864923477,
+ "gamma_dfa_per_layer": [
+ 0.29678860306739807,
+ -0.041244715452194214,
+ -0.08115403354167938,
+ -0.07980833947658539
+ ],
+ "acc_eval": 0.169921875,
+ "loss_eval": 920.2720947265625,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 3096.798583984375,
+ 369599.1875,
+ 385129.65625,
+ 491132.78125,
+ 518903.8125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001009905245155096,
+ 0.0007581011741422117,
+ 0.0007581054233014584,
+ 0.0007580683450214565,
+ 0.0007581928512081504
+ ],
+ "gamma_dfa": 0.003264583647251129,
+ "gamma_dfa_per_layer": [
+ 0.2218201905488968,
+ -0.04958157241344452,
+ -0.07964619994163513,
+ -0.07953408360481262
+ ],
+ "acc_eval": 0.2001953125,
+ "loss_eval": 1496.309814453125,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 3268.982666015625,
+ 428585.28125,
+ 445459.5625,
+ 561163.625,
+ 592376.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001033863751217723,
+ 0.0007647433667443693,
+ 0.0007646661251783371,
+ 0.0007653636857867241,
+ 0.0007653713691979647
+ ],
+ "gamma_dfa": -0.0003395974636077881,
+ "gamma_dfa_per_layer": [
+ 0.2477388083934784,
+ -0.05594494938850403,
+ -0.08699506521224976,
+ -0.10615718364715576
+ ],
+ "acc_eval": 0.1669921875,
+ "loss_eval": 1579.9014892578125,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3455.88134765625,
+ 503646.0,
+ 521880.0,
+ 646881.0,
+ 681678.4375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001110030454583466,
+ 0.000788405304774642,
+ 0.0007884047226980329,
+ 0.0007886688108555973,
+ 0.0007884959923103452
+ ],
+ "gamma_dfa": 0.03397770132869482,
+ "gamma_dfa_per_layer": [
+ 0.325829416513443,
+ -0.034700896590948105,
+ -0.09419499337673187,
+ -0.061022721230983734
+ ],
+ "acc_eval": 0.1572265625,
+ "loss_eval": 3785.62744140625,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 3642.92626953125,
+ 585772.8125,
+ 606436.25,
+ 744826.125,
+ 783648.0625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014668661169707775,
+ 0.0007638748502358794,
+ 0.000763841497246176,
+ 0.0007643977296538651,
+ 0.000764367519877851
+ ],
+ "gamma_dfa": 0.01312381774187088,
+ "gamma_dfa_per_layer": [
+ 0.23922428488731384,
+ -0.0393734946846962,
+ -0.07718683779239655,
+ -0.07016868144273758
+ ],
+ "acc_eval": 0.232421875,
+ "loss_eval": 4151.03466796875,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 3766.637939453125,
+ 680946.4375,
+ 702914.3125,
+ 850315.25,
+ 892276.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012596967862918973,
+ 0.0007629106985405087,
+ 0.0007628659950569272,
+ 0.0007628875900991261,
+ 0.0007628927705809474
+ ],
+ "gamma_dfa": 0.034322043880820274,
+ "gamma_dfa_per_layer": [
+ 0.2786872386932373,
+ -0.04257660359144211,
+ -0.046638332307338715,
+ -0.052184127271175385
+ ],
+ "acc_eval": 0.1396484375,
+ "loss_eval": 3629.718017578125,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 3968.325927734375,
+ 788450.875,
+ 812297.0625,
+ 972239.1875,
+ 1018608.3125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001368838595226407,
+ 0.0007680156268179417,
+ 0.0007679847767576575,
+ 0.0007678329711779952,
+ 0.0007678261026740074
+ ],
+ "gamma_dfa": -0.004100106656551361,
+ "gamma_dfa_per_layer": [
+ 0.2793079614639282,
+ -0.07087238132953644,
+ -0.09966391324996948,
+ -0.12517209351062775
+ ],
+ "acc_eval": 0.0908203125,
+ "loss_eval": 4779.9248046875,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 4129.07666015625,
+ 894723.3125,
+ 920476.5,
+ 1091407.125,
+ 1142044.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012168982066214085,
+ 0.0007647873135283589,
+ 0.0007647885358892381,
+ 0.0007647658349014819,
+ 0.0007648474420420825
+ ],
+ "gamma_dfa": 0.008089051581919193,
+ "gamma_dfa_per_layer": [
+ 0.24180662631988525,
+ -0.05241226777434349,
+ -0.08961856365203857,
+ -0.06741958856582642
+ ],
+ "acc_eval": 0.2158203125,
+ "loss_eval": 4783.03515625,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 4306.06396484375,
+ 1029326.875,
+ 1057140.5,
+ 1242169.625,
+ 1298018.875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011723857605829835,
+ 0.0007771517848595977,
+ 0.000777057372033596,
+ 0.0007771223317831755,
+ 0.0007771406089887023
+ ],
+ "gamma_dfa": 0.039280178025364876,
+ "gamma_dfa_per_layer": [
+ 0.3913160562515259,
+ -0.04802073538303375,
+ -0.09416519105434418,
+ -0.09200941771268845
+ ],
+ "acc_eval": 0.1298828125,
+ "loss_eval": 3595.0546875,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 4460.63916015625,
+ 1158344.75,
+ 1187641.625,
+ 1385118.375,
+ 1445341.375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001693590427748859,
+ 0.0007734080427326262,
+ 0.0007734334794804454,
+ 0.0007733569364063442,
+ 0.0007734467508271337
+ ],
+ "gamma_dfa": 0.023572785779833794,
+ "gamma_dfa_per_layer": [
+ 0.2822916507720947,
+ -0.054915353655815125,
+ -0.06488456577062607,
+ -0.06820058822631836
+ ],
+ "acc_eval": 0.1728515625,
+ "loss_eval": 4587.541015625,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 4647.95556640625,
+ 1300320.625,
+ 1331227.625,
+ 1539845.25,
+ 1603645.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012949237134307623,
+ 0.0007672033389098942,
+ 0.000767192745115608,
+ 0.0007670199265703559,
+ 0.0007670176564715803
+ ],
+ "gamma_dfa": 0.004104164429008961,
+ "gamma_dfa_per_layer": [
+ 0.2596903145313263,
+ -0.053032513707876205,
+ -0.0918058454990387,
+ -0.09843529760837555
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 3593.60400390625,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 4817.267578125,
+ 1453979.25,
+ 1486502.375,
+ 1706268.875,
+ 1774371.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014480708632618189,
+ 0.0007800625753588974,
+ 0.000779640453401953,
+ 0.0007796672289259732,
+ 0.000779696914833039
+ ],
+ "gamma_dfa": 0.02201501652598381,
+ "gamma_dfa_per_layer": [
+ 0.310447633266449,
+ -0.051143430173397064,
+ -0.08497071266174316,
+ -0.0862734243273735
+ ],
+ "acc_eval": 0.1708984375,
+ "loss_eval": 5472.59521484375,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 4990.40625,
+ 1611329.25,
+ 1646018.625,
+ 1880434.25,
+ 1953768.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018194144358858466,
+ 0.000765332777518779,
+ 0.0007653048378415406,
+ 0.0007655462250113487,
+ 0.0007656100788153708
+ ],
+ "gamma_dfa": 0.033283455297350883,
+ "gamma_dfa_per_layer": [
+ 0.3083266317844391,
+ -0.04947835952043533,
+ -0.06329820305109024,
+ -0.06241624802350998
+ ],
+ "acc_eval": 0.2021484375,
+ "loss_eval": 4069.216796875,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 5174.12255859375,
+ 1781529.0,
+ 1818275.25,
+ 2064802.5,
+ 2142905.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015505037736147642,
+ 0.0007980199297890067,
+ 0.0007979664951562881,
+ 0.0007982755196280777,
+ 0.000798304914496839
+ ],
+ "gamma_dfa": 0.019624613225460052,
+ "gamma_dfa_per_layer": [
+ 0.3409179449081421,
+ -0.05889412760734558,
+ -0.10494701564311981,
+ -0.09857834875583649
+ ],
+ "acc_eval": 0.099609375,
+ "loss_eval": 8309.7119140625,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 5347.279296875,
+ 1968104.0,
+ 2006811.625,
+ 2265948.5,
+ 2349278.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001387596596032381,
+ 0.0007817883160896599,
+ 0.0007816275465302169,
+ 0.000781797047238797,
+ 0.0007817737059667706
+ ],
+ "gamma_dfa": 0.000422419048845768,
+ "gamma_dfa_per_layer": [
+ 0.25772032141685486,
+ -0.06083279475569725,
+ -0.09708747267723083,
+ -0.0981103777885437
+ ],
+ "acc_eval": 0.1689453125,
+ "loss_eval": 4254.474609375,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 5501.59130859375,
+ 2140827.0,
+ 2181494.0,
+ 2452387.75,
+ 2540377.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001305495505221188,
+ 0.0007833651034161448,
+ 0.0007831369293853641,
+ 0.0007831998518668115,
+ 0.0007831742987036705
+ ],
+ "gamma_dfa": 0.019166686572134495,
+ "gamma_dfa_per_layer": [
+ 0.3015354871749878,
+ -0.04834163561463356,
+ -0.08644455671310425,
+ -0.090082548558712
+ ],
+ "acc_eval": 0.2060546875,
+ "loss_eval": 7909.48291015625,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 5605.65625,
+ 2338654.5,
+ 2381249.75,
+ 2662644.5,
+ 2754823.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001968128141015768,
+ 0.0008015396306291223,
+ 0.0008015292696654797,
+ 0.0008016829378902912,
+ 0.0008016840438358486
+ ],
+ "gamma_dfa": 0.01810804195702076,
+ "gamma_dfa_per_layer": [
+ 0.352972149848938,
+ -0.05855761468410492,
+ -0.11013064533472061,
+ -0.11185172200202942
+ ],
+ "acc_eval": 0.091796875,
+ "loss_eval": 9552.5458984375,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 5776.4921875,
+ 2524649.5,
+ 2569209.25,
+ 2862403.25,
+ 2959360.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001521907513961196,
+ 0.0007685177261009812,
+ 0.0007685192977078259,
+ 0.0007685712771490216,
+ 0.0007685913005843759
+ ],
+ "gamma_dfa": 0.006301743909716606,
+ "gamma_dfa_per_layer": [
+ 0.3194616436958313,
+ -0.07331519573926926,
+ -0.09753184020519257,
+ -0.12340763211250305
+ ],
+ "acc_eval": 0.123046875,
+ "loss_eval": 9288.3515625,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 5893.2958984375,
+ 2719236.25,
+ 2766489.0,
+ 3076192.25,
+ 3179584.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001874743727967143,
+ 0.0007690778584219515,
+ 0.0007690794300287962,
+ 0.000769136706367135,
+ 0.000769163656514138
+ ],
+ "gamma_dfa": -0.008455535396933556,
+ "gamma_dfa_per_layer": [
+ 0.27458086609840393,
+ -0.07574597001075745,
+ -0.10251512378454208,
+ -0.13014191389083862
+ ],
+ "acc_eval": 0.1015625,
+ "loss_eval": 9500.7265625,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 6037.26904296875,
+ 2917167.0,
+ 2966218.0,
+ 3287947.75,
+ 3395999.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015074120601639152,
+ 0.0007870618137530982,
+ 0.0007870634435676038,
+ 0.00078706128988415,
+ 0.0007870564586482942
+ ],
+ "gamma_dfa": 0.003465494140982628,
+ "gamma_dfa_per_layer": [
+ 0.23106470704078674,
+ -0.04510585218667984,
+ -0.1033426821231842,
+ -0.06875419616699219
+ ],
+ "acc_eval": 0.1484375,
+ "loss_eval": 13665.34375,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 6165.3271484375,
+ 3150321.25,
+ 3201845.5,
+ 3537869.5,
+ 3651609.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0038438383489847183,
+ 0.0007633256609551609,
+ 0.0007633093046024442,
+ 0.0007634069188497961,
+ 0.0007634120993316174
+ ],
+ "gamma_dfa": 0.05023553688079119,
+ "gamma_dfa_per_layer": [
+ 0.36768630146980286,
+ -0.05948590859770775,
+ -0.06263985484838486,
+ -0.0446183905005455
+ ],
+ "acc_eval": 0.130859375,
+ "loss_eval": 15518.396484375,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 6322.185546875,
+ 3356179.75,
+ 3409150.0,
+ 3756998.75,
+ 3874858.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017886407440528274,
+ 0.0007953053573146462,
+ 0.000795268511865288,
+ 0.0007953139720484614,
+ 0.0007953820750117302
+ ],
+ "gamma_dfa": -0.004728740081191063,
+ "gamma_dfa_per_layer": [
+ 0.26050812005996704,
+ -0.07150034606456757,
+ -0.10889407992362976,
+ -0.09902865439653397
+ ],
+ "acc_eval": 0.1474609375,
+ "loss_eval": 13731.47265625,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 6455.05615234375,
+ 3581075.75,
+ 3636212.25,
+ 3997916.75,
+ 4121800.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014103130670264363,
+ 0.0008020435925573111,
+ 0.0008020424866117537,
+ 0.0008023462723940611,
+ 0.0008024003473110497
+ ],
+ "gamma_dfa": 0.03236876800656319,
+ "gamma_dfa_per_layer": [
+ 0.3784361481666565,
+ -0.05973149091005325,
+ -0.09747618436813354,
+ -0.09175340086221695
+ ],
+ "acc_eval": 0.1396484375,
+ "loss_eval": 8173.1318359375,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 6596.92529296875,
+ 3790696.25,
+ 3847633.75,
+ 4219067.0,
+ 4346740.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001376444473862648,
+ 0.0007939717615954578,
+ 0.0007933968445286155,
+ 0.0007933415472507477,
+ 0.0007934658788144588
+ ],
+ "gamma_dfa": 0.026161080226302147,
+ "gamma_dfa_per_layer": [
+ 0.35278040170669556,
+ -0.07518108189105988,
+ -0.09520787000656128,
+ -0.07774712890386581
+ ],
+ "acc_eval": 0.158203125,
+ "loss_eval": 10093.57421875,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 6752.326171875,
+ 4013893.75,
+ 4072463.0,
+ 4456049.5,
+ 4588960.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016587942373007536,
+ 0.000801959540694952,
+ 0.0008019180968403816,
+ 0.0008022981346584857,
+ 0.0008023587288334966
+ ],
+ "gamma_dfa": 0.0014634709805250168,
+ "gamma_dfa_per_layer": [
+ 0.26356324553489685,
+ -0.05649265646934509,
+ -0.09903856366872787,
+ -0.10217814147472382
+ ],
+ "acc_eval": 0.16796875,
+ "loss_eval": 11805.994140625,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 6883.87158203125,
+ 4249640.0,
+ 4310267.0,
+ 4705052.0,
+ 4842379.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017551308264955878,
+ 0.0007804373744875193,
+ 0.0007804358028806746,
+ 0.0007804319611750543,
+ 0.0007804720080457628
+ ],
+ "gamma_dfa": -0.00971926562488079,
+ "gamma_dfa_per_layer": [
+ 0.23957225680351257,
+ -0.06951768696308136,
+ -0.09375166893005371,
+ -0.11517996340990067
+ ],
+ "acc_eval": 0.16015625,
+ "loss_eval": 19465.8828125,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 7004.37841796875,
+ 4461495.0,
+ 4523850.0,
+ 4930553.5,
+ 5072236.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015129564562812448,
+ 0.0007847726810723543,
+ 0.0007845073123462498,
+ 0.000784386123996228,
+ 0.0007843819330446422
+ ],
+ "gamma_dfa": 0.0085066519677639,
+ "gamma_dfa_per_layer": [
+ 0.2637098431587219,
+ -0.05605460703372955,
+ -0.08905251324176788,
+ -0.08457611501216888
+ ],
+ "acc_eval": 0.2021484375,
+ "loss_eval": 7892.26611328125,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 7112.80078125,
+ 4708139.0,
+ 4772392.0,
+ 5193498.0,
+ 5341091.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015166979283094406,
+ 0.0007669071783311665,
+ 0.0007669082842767239,
+ 0.0007670924533158541,
+ 0.0007671677158214152
+ ],
+ "gamma_dfa": 0.015125783160328865,
+ "gamma_dfa_per_layer": [
+ 0.2562488615512848,
+ -0.046804703772068024,
+ -0.08796676248311996,
+ -0.06097426265478134
+ ],
+ "acc_eval": 0.2333984375,
+ "loss_eval": 8893.0791015625,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 7200.81201171875,
+ 4906775.0,
+ 4972128.5,
+ 5401281.5,
+ 5552169.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015469590434804559,
+ 0.0007871663547120988,
+ 0.0007869182154536247,
+ 0.0007867610547691584,
+ 0.0007867159438319504
+ ],
+ "gamma_dfa": 0.016506953164935112,
+ "gamma_dfa_per_layer": [
+ 0.29171258211135864,
+ -0.05020506680011749,
+ -0.09062528610229492,
+ -0.08485441654920578
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 10566.345703125,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 7296.0625,
+ 5134799.0,
+ 5202023.5,
+ 5643737.5,
+ 5799758.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018195129232481122,
+ 0.0007844618521630764,
+ 0.0007844566716812551,
+ 0.000784536823630333,
+ 0.000784553587436676
+ ],
+ "gamma_dfa": 0.019483929499983788,
+ "gamma_dfa_per_layer": [
+ 0.29106640815734863,
+ -0.05478575825691223,
+ -0.07833737879991531,
+ -0.08000755310058594
+ ],
+ "acc_eval": 0.1650390625,
+ "loss_eval": 9639.78125,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 7403.17138671875,
+ 5361356.5,
+ 5429682.0,
+ 5879784.5,
+ 6039432.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002603700151666999,
+ 0.000755469489376992,
+ 0.0007554262992925942,
+ 0.0007555284537374973,
+ 0.0007555308402515948
+ ],
+ "gamma_dfa": 0.05388479772955179,
+ "gamma_dfa_per_layer": [
+ 0.3746236264705658,
+ -0.060121551156044006,
+ -0.06174459308385849,
+ -0.03721829131245613
+ ],
+ "acc_eval": 0.1494140625,
+ "loss_eval": 12397.41015625,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 7488.30126953125,
+ 5582023.0,
+ 5651748.5,
+ 6110668.5,
+ 6273320.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00202713580802083,
+ 0.0007801816100254655,
+ 0.000780182599555701,
+ 0.0007801790488883853,
+ 0.0007801697356626391
+ ],
+ "gamma_dfa": 0.01045304723083973,
+ "gamma_dfa_per_layer": [
+ 0.25068047642707825,
+ -0.06100655347108841,
+ -0.0828605443239212,
+ -0.06500118970870972
+ ],
+ "acc_eval": 0.2138671875,
+ "loss_eval": 18765.955078125,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 7561.47265625,
+ 5795100.5,
+ 5866105.0,
+ 6334896.0,
+ 6501444.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017575331730768085,
+ 0.0007978819194249809,
+ 0.0007978450739756227,
+ 0.000798230292275548,
+ 0.0007982761017046869
+ ],
+ "gamma_dfa": 0.011411387473344803,
+ "gamma_dfa_per_layer": [
+ 0.29157841205596924,
+ -0.05369853973388672,
+ -0.09859319031238556,
+ -0.09364113211631775
+ ],
+ "acc_eval": 0.1875,
+ "loss_eval": 10589.0087890625,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 7636.35595703125,
+ 6016687.0,
+ 6089686.0,
+ 6570658.5,
+ 6741688.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001416882500052452,
+ 0.0007854877039790154,
+ 0.0007851187838241458,
+ 0.0007847094675526023,
+ 0.0007846617372706532
+ ],
+ "gamma_dfa": 0.004635758697986603,
+ "gamma_dfa_per_layer": [
+ 0.2832094430923462,
+ -0.06018421798944473,
+ -0.10714054107666016,
+ -0.09734164923429489
+ ],
+ "acc_eval": 0.1884765625,
+ "loss_eval": 11045.0107421875,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 7700.8466796875,
+ 6215443.5,
+ 6289647.5,
+ 6780492.0,
+ 6955139.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017022350803017616,
+ 0.0007623002748005092,
+ 0.000762303126975894,
+ 0.000762506271712482,
+ 0.0007625941070728004
+ ],
+ "gamma_dfa": 0.026831449940800667,
+ "gamma_dfa_per_layer": [
+ 0.339847594499588,
+ -0.0706903263926506,
+ -0.0816052109003067,
+ -0.08022625744342804
+ ],
+ "acc_eval": 0.154296875,
+ "loss_eval": 9215.373046875,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 7773.85986328125,
+ 6413204.5,
+ 6488502.5,
+ 6988337.0,
+ 7166683.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013730988139286637,
+ 0.0007787180948071182,
+ 0.0007787116337567568,
+ 0.0007787745562382042,
+ 0.0007787866634316742
+ ],
+ "gamma_dfa": 0.013194277882575989,
+ "gamma_dfa_per_layer": [
+ 0.30715805292129517,
+ -0.0632064938545227,
+ -0.09261326491832733,
+ -0.09856118261814117
+ ],
+ "acc_eval": 0.2236328125,
+ "loss_eval": 6176.3076171875,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 7820.23388671875,
+ 6598801.0,
+ 6675650.0,
+ 7184845.0,
+ 7367520.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015506811905652285,
+ 0.000799653644207865,
+ 0.0007990750018507242,
+ 0.0007989082369022071,
+ 0.0007991326274350286
+ ],
+ "gamma_dfa": 0.00773581862449646,
+ "gamma_dfa_per_layer": [
+ 0.28355157375335693,
+ -0.054453425109386444,
+ -0.11499008536338806,
+ -0.08316478878259659
+ ],
+ "acc_eval": 0.205078125,
+ "loss_eval": 7889.31005859375,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 7864.2060546875,
+ 6797904.5,
+ 6876033.0,
+ 7392718.0,
+ 7578431.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020978215616196394,
+ 0.0007834822754375637,
+ 0.0007832171395421028,
+ 0.0007829645182937384,
+ 0.0007829380920156837
+ ],
+ "gamma_dfa": 0.033629802986979485,
+ "gamma_dfa_per_layer": [
+ 0.34407293796539307,
+ -0.05567466467618942,
+ -0.08536086976528168,
+ -0.06851819157600403
+ ],
+ "acc_eval": 0.15625,
+ "loss_eval": 14391.9736328125,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 7871.78173828125,
+ 7003051.0,
+ 7083124.0,
+ 7611188.0,
+ 7801170.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012560655595734715,
+ 0.0007599582313559949,
+ 0.0007599598611705005,
+ 0.0007601079414598644,
+ 0.0007601887919008732
+ ],
+ "gamma_dfa": 0.004498079419136047,
+ "gamma_dfa_per_layer": [
+ 0.32327917218208313,
+ -0.07260935008525848,
+ -0.10525670647621155,
+ -0.1274207979440689
+ ],
+ "acc_eval": 0.1572265625,
+ "loss_eval": 7188.275390625,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 7934.14794921875,
+ 7210797.0,
+ 7292245.5,
+ 7829288.0,
+ 8023057.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001343236886896193,
+ 0.0007599524687975645,
+ 0.0007598291267640889,
+ 0.0007597675430588424,
+ 0.0007598883821628988
+ ],
+ "gamma_dfa": 0.02613817434757948,
+ "gamma_dfa_per_layer": [
+ 0.3003483712673187,
+ -0.0427340604364872,
+ -0.09165668487548828,
+ -0.06140492856502533
+ ],
+ "acc_eval": 0.259765625,
+ "loss_eval": 7055.94677734375,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 7964.50244140625,
+ 7416797.0,
+ 7500505.0,
+ 8048676.5,
+ 8247824.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015083092730492353,
+ 0.0007851184927858412,
+ 0.0007850866531953216,
+ 0.0007850754773244262,
+ 0.0007851301343180239
+ ],
+ "gamma_dfa": 0.027105171233415604,
+ "gamma_dfa_per_layer": [
+ 0.37000784277915955,
+ -0.05895276367664337,
+ -0.10036876797676086,
+ -0.1022656261920929
+ ],
+ "acc_eval": 0.166015625,
+ "loss_eval": 7052.08203125,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 8006.1318359375,
+ 7588913.0,
+ 7673353.5,
+ 8229041.0,
+ 8431689.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014928504824638367,
+ 0.0007839660393074155,
+ 0.000783930707257241,
+ 0.0007839277386665344,
+ 0.0007839910103939474
+ ],
+ "gamma_dfa": 0.018935419619083405,
+ "gamma_dfa_per_layer": [
+ 0.3158775568008423,
+ -0.051478639245033264,
+ -0.09881415218114853,
+ -0.08984308689832687
+ ],
+ "acc_eval": 0.2119140625,
+ "loss_eval": 6266.041015625,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 8030.2109375,
+ 7754257.5,
+ 7839832.5,
+ 8400781.0,
+ 8605522.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012633835431188345,
+ 0.0007809567032381892,
+ 0.0007807457586750388,
+ 0.0007805972127243876,
+ 0.0007805809145793319
+ ],
+ "gamma_dfa": 0.009956683963537216,
+ "gamma_dfa_per_layer": [
+ 0.30735114216804504,
+ -0.06991781294345856,
+ -0.09387198090553284,
+ -0.10373461246490479
+ ],
+ "acc_eval": 0.1806640625,
+ "loss_eval": 8467.8125,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 8048.080078125,
+ 7913574.5,
+ 8000306.0,
+ 8567918.0,
+ 8775169.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001400441862642765,
+ 0.0007796542486175895,
+ 0.0007795418496243656,
+ 0.0007795065175741911,
+ 0.0007797059370204806
+ ],
+ "gamma_dfa": 0.008816102519631386,
+ "gamma_dfa_per_layer": [
+ 0.28880423307418823,
+ -0.05614739656448364,
+ -0.11088694632053375,
+ -0.0865054801106453
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 9558.021484375,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 8067.34375,
+ 8070731.5,
+ 8158800.0,
+ 8733572.0,
+ 8943043.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014346289681270719,
+ 0.000756031135097146,
+ 0.0007560329977422953,
+ 0.0007561623933725059,
+ 0.0007562324753962457
+ ],
+ "gamma_dfa": 0.009170351549983025,
+ "gamma_dfa_per_layer": [
+ 0.3515056073665619,
+ -0.0781104564666748,
+ -0.10490105301141739,
+ -0.1318126916885376
+ ],
+ "acc_eval": 0.1103515625,
+ "loss_eval": 11967.486328125,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 8073.40283203125,
+ 8227977.0,
+ 8317204.5,
+ 8898513.0,
+ 9110756.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015745362034067512,
+ 0.0007811843534000218,
+ 0.000781158625613898,
+ 0.0007811560644768178,
+ 0.0007812076364643872
+ ],
+ "gamma_dfa": 0.011113166809082031,
+ "gamma_dfa_per_layer": [
+ 0.30191734433174133,
+ -0.05505914241075516,
+ -0.10382715612649918,
+ -0.09857837855815887
+ ],
+ "acc_eval": 0.177734375,
+ "loss_eval": 7797.017578125,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 8071.63623046875,
+ 8375112.0,
+ 8465576.0,
+ 9052592.0,
+ 9267093.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002133303554728627,
+ 0.0007824470521882176,
+ 0.0007822668994776905,
+ 0.0007822004845365882,
+ 0.0007824745844118297
+ ],
+ "gamma_dfa": 0.03663862869143486,
+ "gamma_dfa_per_layer": [
+ 0.34291785955429077,
+ -0.036236945539712906,
+ -0.10749906301498413,
+ -0.052627336233854294
+ ],
+ "acc_eval": 0.1396484375,
+ "loss_eval": 11433.0302734375,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 8084.59130859375,
+ 8523176.0,
+ 8614498.0,
+ 9207429.0,
+ 9424164.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001537870615720749,
+ 0.0007688916521146894,
+ 0.0007688923506066203,
+ 0.0007689034100621939,
+ 0.0007689160411246121
+ ],
+ "gamma_dfa": 0.020611698739230633,
+ "gamma_dfa_per_layer": [
+ 0.3258458971977234,
+ -0.053132835775613785,
+ -0.10754033923149109,
+ -0.08272592723369598
+ ],
+ "acc_eval": 0.1787109375,
+ "loss_eval": 6151.634765625,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 8098.82373046875,
+ 8648680.0,
+ 8741121.0,
+ 9338018.0,
+ 9556207.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014389777788892388,
+ 0.0007975181215442717,
+ 0.0007967942510731518,
+ 0.0007966712000779808,
+ 0.0007968792924657464
+ ],
+ "gamma_dfa": 0.009284427389502525,
+ "gamma_dfa_per_layer": [
+ 0.29391974210739136,
+ -0.058484748005867004,
+ -0.11177978664636612,
+ -0.08651749789714813
+ ],
+ "acc_eval": 0.18359375,
+ "loss_eval": 5277.328125,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 8113.7255859375,
+ 8773553.0,
+ 8866719.0,
+ 9469018.0,
+ 9689706.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00145814404822886,
+ 0.0007955037872307003,
+ 0.0007954062311910093,
+ 0.0007954093161970377,
+ 0.0007956796325743198
+ ],
+ "gamma_dfa": 0.01389121450483799,
+ "gamma_dfa_per_layer": [
+ 0.28217679262161255,
+ -0.058154717087745667,
+ -0.08273636549711227,
+ -0.08572085201740265
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 10207.12109375,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 8063.9951171875,
+ 8889169.0,
+ 8984089.0,
+ 9593494.0,
+ 9817277.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011409161379560828,
+ 0.0007544065010733902,
+ 0.0007542934035882354,
+ 0.000754217617213726,
+ 0.0007543462561443448
+ ],
+ "gamma_dfa": 0.018794666975736618,
+ "gamma_dfa_per_layer": [
+ 0.2941493093967438,
+ -0.0533231720328331,
+ -0.09251905977725983,
+ -0.07312840968370438
+ ],
+ "acc_eval": 0.2626953125,
+ "loss_eval": 4281.3994140625,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 8021.80126953125,
+ 9019768.0,
+ 9115790.0,
+ 9730846.0,
+ 9956825.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012580875772982836,
+ 0.0007680498529225588,
+ 0.0007680428680032492,
+ 0.0007680479320697486,
+ 0.0007680551498197019
+ ],
+ "gamma_dfa": 0.027317012660205364,
+ "gamma_dfa_per_layer": [
+ 0.3265392780303955,
+ -0.04611017927527428,
+ -0.09342358261346817,
+ -0.0777374655008316
+ ],
+ "acc_eval": 0.2275390625,
+ "loss_eval": 4907.6142578125,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 7995.38916015625,
+ 9118244.0,
+ 9214531.0,
+ 9832139.0,
+ 10058956.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012337823864072561,
+ 0.0007691435748711228,
+ 0.000768946367315948,
+ 0.000768885191064328,
+ 0.0007689236663281918
+ ],
+ "gamma_dfa": 0.012230871245265007,
+ "gamma_dfa_per_layer": [
+ 0.2935040593147278,
+ -0.06186644732952118,
+ -0.09978199750185013,
+ -0.08293212950229645
+ ],
+ "acc_eval": 0.2001953125,
+ "loss_eval": 7199.5888671875,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 7966.3759765625,
+ 9213122.0,
+ 9310022.0,
+ 9931662.0,
+ 10160365.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011302486527711153,
+ 0.0007655700901523232,
+ 0.0007655754452571273,
+ 0.0007655742228962481,
+ 0.0007655934314243495
+ ],
+ "gamma_dfa": 0.01679898425936699,
+ "gamma_dfa_per_layer": [
+ 0.3025580048561096,
+ -0.05692540109157562,
+ -0.10290184617042542,
+ -0.07553482055664062
+ ],
+ "acc_eval": 0.2490234375,
+ "loss_eval": 2667.806640625,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 7937.92041015625,
+ 9292608.0,
+ 9390243.0,
+ 10015125.0,
+ 10244868.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011147550540044904,
+ 0.0007753095123916864,
+ 0.0007750216755084693,
+ 0.000774735352024436,
+ 0.0007747214986011386
+ ],
+ "gamma_dfa": 0.027967805042862892,
+ "gamma_dfa_per_layer": [
+ 0.3572651743888855,
+ -0.05705829709768295,
+ -0.09071685373783112,
+ -0.09761880338191986
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 3299.91259765625,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 7904.56689453125,
+ 9393010.0,
+ 9491687.0,
+ 10122118.0,
+ 10354408.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00107352074701339,
+ 0.0007645431905984879,
+ 0.0007645484292879701,
+ 0.0007645472651347518,
+ 0.0007645685109309852
+ ],
+ "gamma_dfa": 0.02625838667154312,
+ "gamma_dfa_per_layer": [
+ 0.3598015606403351,
+ -0.06442467868328094,
+ -0.09077714383602142,
+ -0.09956619143486023
+ ],
+ "acc_eval": 0.2119140625,
+ "loss_eval": 2758.64599609375,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 7855.07861328125,
+ 9500690.0,
+ 9600497.0,
+ 10235757.0,
+ 10469660.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001235201139934361,
+ 0.0007838172605261207,
+ 0.000783789437264204,
+ 0.0007840599282644689,
+ 0.00078408676199615
+ ],
+ "gamma_dfa": 0.02602401003241539,
+ "gamma_dfa_per_layer": [
+ 0.35960710048675537,
+ -0.06299363076686859,
+ -0.10128454864025116,
+ -0.09123288094997406
+ ],
+ "acc_eval": 0.1689453125,
+ "loss_eval": 4279.3154296875,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 7826.134765625,
+ 9581674.0,
+ 9682195.0,
+ 10320423.0,
+ 10555402.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010469084372743964,
+ 0.0007737708510830998,
+ 0.0007735842373222113,
+ 0.0007734137470833957,
+ 0.0007734144455753267
+ ],
+ "gamma_dfa": 0.024147922173142433,
+ "gamma_dfa_per_layer": [
+ 0.37674999237060547,
+ -0.07557321339845657,
+ -0.09047992527484894,
+ -0.11410516500473022
+ ],
+ "acc_eval": 0.1669921875,
+ "loss_eval": 3201.240966796875,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 7779.2138671875,
+ 9660604.0,
+ 9761859.0,
+ 10404086.0,
+ 10640750.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010143390391021967,
+ 0.0007633482455275953,
+ 0.0007633481291122735,
+ 0.0007633698405697942,
+ 0.0007633839850313962
+ ],
+ "gamma_dfa": 0.019840596243739128,
+ "gamma_dfa_per_layer": [
+ 0.30444687604904175,
+ -0.049144186079502106,
+ -0.09650193899869919,
+ -0.07943836599588394
+ ],
+ "acc_eval": 0.2763671875,
+ "loss_eval": 1991.417236328125,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 7760.08642578125,
+ 9716882.0,
+ 9818513.0,
+ 10462903.0,
+ 10700433.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00105896289460361,
+ 0.0007729134522378445,
+ 0.0007727605989202857,
+ 0.0007726037292741239,
+ 0.000772611063439399
+ ],
+ "gamma_dfa": 0.026730000041425228,
+ "gamma_dfa_per_layer": [
+ 0.34768593311309814,
+ -0.056363869458436966,
+ -0.09562714397907257,
+ -0.0887749195098877
+ ],
+ "acc_eval": 0.2177734375,
+ "loss_eval": 2112.26025390625,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 7743.93798828125,
+ 9786243.0,
+ 9888395.0,
+ 10535762.0,
+ 10774483.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010133162140846252,
+ 0.0007726953481324017,
+ 0.0007724745664745569,
+ 0.0007722667651250958,
+ 0.0007722647860646248
+ ],
+ "gamma_dfa": 0.019241390749812126,
+ "gamma_dfa_per_layer": [
+ 0.3473237156867981,
+ -0.06556949764490128,
+ -0.10282130539417267,
+ -0.10196734964847565
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 2962.46826171875,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 7708.34033203125,
+ 9842047.0,
+ 9944650.0,
+ 10594529.0,
+ 10834219.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000999346375465393,
+ 0.0007619770476594567,
+ 0.0007619837997481227,
+ 0.0007619837415404618,
+ 0.0007620092947036028
+ ],
+ "gamma_dfa": 0.019368495792150497,
+ "gamma_dfa_per_layer": [
+ 0.3106932044029236,
+ -0.057876452803611755,
+ -0.09636038541793823,
+ -0.0789823830127716
+ ],
+ "acc_eval": 0.2607421875,
+ "loss_eval": 1792.6400146484375,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 7673.24560546875,
+ 9901470.0,
+ 10004649.0,
+ 10656950.0,
+ 10898699.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009565355721861124,
+ 0.0007485878886654973,
+ 0.0007484929519705474,
+ 0.000748424616176635,
+ 0.0007485424866899848
+ ],
+ "gamma_dfa": 0.01748405210673809,
+ "gamma_dfa_per_layer": [
+ 0.2931858003139496,
+ -0.05277211219072342,
+ -0.09270339459180832,
+ -0.07777408510446548
+ ],
+ "acc_eval": 0.29296875,
+ "loss_eval": 974.1173095703125,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 7628.22412109375,
+ 9951868.0,
+ 10055369.0,
+ 10709207.0,
+ 10951317.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000980330049060285,
+ 0.0007466387469321489,
+ 0.0007466417155228555,
+ 0.0007467885152436793,
+ 0.0007468488765880466
+ ],
+ "gamma_dfa": 0.019473757594823837,
+ "gamma_dfa_per_layer": [
+ 0.29309791326522827,
+ -0.05341349542140961,
+ -0.08986704051494598,
+ -0.07192234694957733
+ ],
+ "acc_eval": 0.27734375,
+ "loss_eval": 1743.6519775390625,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 7586.08837890625,
+ 9992418.0,
+ 10096238.0,
+ 10751557.0,
+ 10993641.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009816273814067245,
+ 0.0007609970052726567,
+ 0.000761001487262547,
+ 0.0007610011962242424,
+ 0.0007610262255184352
+ ],
+ "gamma_dfa": 0.017493372783064842,
+ "gamma_dfa_per_layer": [
+ 0.307644248008728,
+ -0.054675400257110596,
+ -0.09402725845575333,
+ -0.08896809816360474
+ ],
+ "acc_eval": 0.2783203125,
+ "loss_eval": 986.1089477539062,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 7546.07666015625,
+ 10019561.0,
+ 10123471.0,
+ 10779392.0,
+ 11021634.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010106659028679132,
+ 0.0007606986328028142,
+ 0.0007606985163874924,
+ 0.0007607255247421563,
+ 0.0007607414736412466
+ ],
+ "gamma_dfa": 0.0189383989199996,
+ "gamma_dfa_per_layer": [
+ 0.3057447671890259,
+ -0.05296015366911888,
+ -0.09528908133506775,
+ -0.08174193650484085
+ ],
+ "acc_eval": 0.2412109375,
+ "loss_eval": 1453.539306640625,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 7507.373046875,
+ 10034866.0,
+ 10138899.0,
+ 10794880.0,
+ 11037002.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009441400761716068,
+ 0.0007457168539986014,
+ 0.0007457205792888999,
+ 0.0007458969485014677,
+ 0.0007459585904143751
+ ],
+ "gamma_dfa": 0.016358308494091034,
+ "gamma_dfa_per_layer": [
+ 0.29192131757736206,
+ -0.054730333387851715,
+ -0.08949868381023407,
+ -0.08225906640291214
+ ],
+ "acc_eval": 0.2939453125,
+ "loss_eval": 889.3756103515625,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 7475.10595703125,
+ 10059038.0,
+ 10163330.0,
+ 10820810.0,
+ 11063516.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009275015909224749,
+ 0.0007406340446323156,
+ 0.0007405761862173676,
+ 0.0007405940559692681,
+ 0.0007405842188745737
+ ],
+ "gamma_dfa": 0.019343840889632702,
+ "gamma_dfa_per_layer": [
+ 0.2714617848396301,
+ -0.049602191895246506,
+ -0.07989576458930969,
+ -0.06458846479654312
+ ],
+ "acc_eval": 0.322265625,
+ "loss_eval": 778.108642578125,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 7444.8466796875,
+ 10064810.0,
+ 10169219.0,
+ 10827134.0,
+ 11070129.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009403944713994861,
+ 0.000745263765566051,
+ 0.0007452677236869931,
+ 0.0007454471196979284,
+ 0.0007455073646269739
+ ],
+ "gamma_dfa": 0.01310044713318348,
+ "gamma_dfa_per_layer": [
+ 0.28572195768356323,
+ -0.054389551281929016,
+ -0.09277918189764023,
+ -0.08615143597126007
+ ],
+ "acc_eval": 0.26953125,
+ "loss_eval": 932.53662109375,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 7414.4970703125,
+ 10075394.0,
+ 10179775.0,
+ 10837778.0,
+ 11080979.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009539846796542406,
+ 0.0007622878183610737,
+ 0.0007622832781635225,
+ 0.0007622758857905865,
+ 0.0007622810662724078
+ ],
+ "gamma_dfa": 0.02442830428481102,
+ "gamma_dfa_per_layer": [
+ 0.34633398056030273,
+ -0.059510812163352966,
+ -0.09629844129085541,
+ -0.09281150996685028
+ ],
+ "acc_eval": 0.228515625,
+ "loss_eval": 1020.4122924804688,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 7385.740234375,
+ 10098198.0,
+ 10202575.0,
+ 10860396.0,
+ 11103300.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009258585050702095,
+ 0.0007462432840839028,
+ 0.0007461663917638361,
+ 0.000746095203794539,
+ 0.0007462148205377162
+ ],
+ "gamma_dfa": 0.021881024353206158,
+ "gamma_dfa_per_layer": [
+ 0.3117921054363251,
+ -0.0562119297683239,
+ -0.0811537504196167,
+ -0.08690232783555984
+ ],
+ "acc_eval": 0.2783203125,
+ "loss_eval": 812.965576171875,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 7372.93115234375,
+ 10112263.0,
+ 10216603.0,
+ 10874068.0,
+ 11116538.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009158457978628576,
+ 0.000744756544008851,
+ 0.0007447608513757586,
+ 0.0007449553813785315,
+ 0.0007450156263075769
+ ],
+ "gamma_dfa": 0.018241400830447674,
+ "gamma_dfa_per_layer": [
+ 0.27702248096466064,
+ -0.048618000000715256,
+ -0.0829005166888237,
+ -0.072538360953331
+ ],
+ "acc_eval": 0.330078125,
+ "loss_eval": 675.6625366210938,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 7363.2099609375,
+ 10119183.0,
+ 10223550.0,
+ 10881119.0,
+ 11123569.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009229940478689969,
+ 0.0007447171374224126,
+ 0.000744720280636102,
+ 0.0007448522374033928,
+ 0.000744906603358686
+ ],
+ "gamma_dfa": 0.016729017719626427,
+ "gamma_dfa_per_layer": [
+ 0.27939361333847046,
+ -0.048901431262493134,
+ -0.08870212733745575,
+ -0.07487398386001587
+ ],
+ "acc_eval": 0.3251953125,
+ "loss_eval": 708.3804931640625,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 7355.3544921875,
+ 10123197.0,
+ 10227558.0,
+ 10885026.0,
+ 11127411.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009278868092224002,
+ 0.0007445889641530812,
+ 0.0007445933879353106,
+ 0.0007447681855410337,
+ 0.0007448261021636426
+ ],
+ "gamma_dfa": 0.014646172523498535,
+ "gamma_dfa_per_layer": [
+ 0.28425437211990356,
+ -0.053754955530166626,
+ -0.08852015435695648,
+ -0.08339457213878632
+ ],
+ "acc_eval": 0.310546875,
+ "loss_eval": 688.0819091796875,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 7349.30078125,
+ 10126695.0,
+ 10231071.0,
+ 10888593.0,
+ 11130985.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000914200150873512,
+ 0.0007393965497612953,
+ 0.000739329494535923,
+ 0.0007393491105176508,
+ 0.0007393329287879169
+ ],
+ "gamma_dfa": 0.01913625281304121,
+ "gamma_dfa_per_layer": [
+ 0.26301705837249756,
+ -0.04846196621656418,
+ -0.07772514969110489,
+ -0.06028493121266365
+ ],
+ "acc_eval": 0.3203125,
+ "loss_eval": 697.3836669921875,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 7345.333984375,
+ 10127832.0,
+ 10232199.0,
+ 10889673.0,
+ 11132020.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009217644692398608,
+ 0.0007456630119122565,
+ 0.0007455685408785939,
+ 0.0007454968290403485,
+ 0.0007456148159690201
+ ],
+ "gamma_dfa": 0.017519758082926273,
+ "gamma_dfa_per_layer": [
+ 0.29056763648986816,
+ -0.05349243804812431,
+ -0.08799343556165695,
+ -0.0790027305483818
+ ],
+ "acc_eval": 0.30859375,
+ "loss_eval": 661.5548095703125,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 7343.10888671875,
+ 10128861.0,
+ 10233227.0,
+ 10890713.0,
+ 11133060.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009042566525749862,
+ 0.0007393184932880104,
+ 0.0007392505649477243,
+ 0.0007392706465907395,
+ 0.0007392524858005345
+ ],
+ "gamma_dfa": 0.018206479027867317,
+ "gamma_dfa_per_layer": [
+ 0.2680240869522095,
+ -0.047486238181591034,
+ -0.08014586567878723,
+ -0.06756606698036194
+ ],
+ "acc_eval": 0.3388671875,
+ "loss_eval": 636.5595703125,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 7342.0625,
+ 10129300.0,
+ 10233666.0,
+ 10891137.0,
+ 11133475.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009002314181998372,
+ 0.0007393373525701463,
+ 0.0007392485276795924,
+ 0.0007392755360342562,
+ 0.0007392438710667193
+ ],
+ "gamma_dfa": 0.01726893801242113,
+ "gamma_dfa_per_layer": [
+ 0.2736765742301941,
+ -0.05038469657301903,
+ -0.0817006528377533,
+ -0.07251547276973724
+ ],
+ "acc_eval": 0.3330078125,
+ "loss_eval": 611.882080078125,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 7341.77294921875,
+ 10129401.0,
+ 10233766.0,
+ 10891235.0,
+ 11133570.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009032402304001153,
+ 0.0007393273408524692,
+ 0.0007392435800284147,
+ 0.0007392680854536593,
+ 0.0007392411935143173
+ ],
+ "gamma_dfa": 0.01641188934445381,
+ "gamma_dfa_per_layer": [
+ 0.2728629410266876,
+ -0.05080822855234146,
+ -0.08297968655824661,
+ -0.0734274685382843
+ ],
+ "acc_eval": 0.33203125,
+ "loss_eval": 625.6834106445312,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file
diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s456.json b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json
new file mode 100644
index 0000000..f490ffc
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json
@@ -0,0 +1,4766 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_no_outln_v1",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 456,
+ "depth": 4,
+ "d_hidden": 256
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "architecture": "ResidualMLP_NoOutLN",
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.696551322937012,
+ 8.737784385681152,
+ 8.813130378723145,
+ 8.844642639160156,
+ 8.889528274536133
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005607507191598415,
+ 0.0005558764678426087,
+ 0.0005541853606700897,
+ 0.0005498801474459469,
+ 0.0005458085797727108
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.091796875,
+ "loss_eval": 2.3707523345947266,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 40.06809616088867,
+ 37.16851043701172,
+ 35.97419738769531,
+ 34.98802185058594,
+ 34.09989547729492
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00013246900925878435,
+ 0.00013836311700288206,
+ 0.00014998784172348678,
+ 0.00017555677914060652,
+ 0.0002279145992361009
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4365234375,
+ "loss_eval": 1.5941123962402344,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 51.32597732543945,
+ 46.865997314453125,
+ 44.336944580078125,
+ 42.399295806884766,
+ 41.083709716796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010603138071019202,
+ 0.00011028712469851598,
+ 0.00011670063395285979,
+ 0.00013331198715604842,
+ 0.00016258291725534946
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4736328125,
+ "loss_eval": 1.4793150424957275,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 62.084197998046875,
+ 56.17497253417969,
+ 52.24001693725586,
+ 48.81613540649414,
+ 45.96797561645508
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.958917507901788e-05,
+ 0.00010542560630710796,
+ 0.00011132164945593104,
+ 0.00012339121894910932,
+ 0.00014191119407769293
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.48046875,
+ "loss_eval": 1.4157963991165161,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 70.11115264892578,
+ 62.7204704284668,
+ 57.0128059387207,
+ 52.67961883544922,
+ 49.0619010925293
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.119982860283926e-05,
+ 9.68000604189001e-05,
+ 0.0001028164042509161,
+ 0.0001113277321564965,
+ 0.00012708066788036376
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.529296875,
+ "loss_eval": 1.3824131488800049,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 77.96520233154297,
+ 68.33187866210938,
+ 62.02028274536133,
+ 56.785953521728516,
+ 52.50190734863281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.251978190150112e-05,
+ 9.91317501757294e-05,
+ 0.00010523655510041863,
+ 0.00011500742402859032,
+ 0.00012610112025868148
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.49609375,
+ "loss_eval": 1.4219003915786743,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 84.35594940185547,
+ 73.65497589111328,
+ 65.76171875,
+ 59.78555679321289,
+ 54.72732925415039
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.53061064844951e-05,
+ 9.119947208091617e-05,
+ 9.546471119392663e-05,
+ 0.00010272912186337635,
+ 0.00011094262299593538
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5107421875,
+ "loss_eval": 1.3764042854309082,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 90.34719848632812,
+ 78.86559295654297,
+ 69.58448028564453,
+ 62.62751388549805,
+ 56.49700164794922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.279601024696603e-05,
+ 8.869311568560079e-05,
+ 9.525373752694577e-05,
+ 0.00010276824468746781,
+ 0.00011047293082810938
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.521484375,
+ "loss_eval": 1.3063517808914185,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 94.70899200439453,
+ 82.14017486572266,
+ 72.3757553100586,
+ 63.97325134277344,
+ 57.261043548583984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.42147201183252e-05,
+ 8.977072138804942e-05,
+ 9.571140253683552e-05,
+ 0.00010196219227509573,
+ 0.00010500354983378202
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.521484375,
+ "loss_eval": 1.3536221981048584,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 101.69925689697266,
+ 87.86920928955078,
+ 77.13504791259766,
+ 68.15769958496094,
+ 60.63106918334961
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.040699322009459e-05,
+ 8.682452607899904e-05,
+ 9.194648009724915e-05,
+ 9.875267278403044e-05,
+ 0.00010358950385125354
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.517578125,
+ "loss_eval": 1.3398748636245728,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 106.84738159179688,
+ 92.9166259765625,
+ 81.7030029296875,
+ 71.8150863647461,
+ 63.29521179199219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.807361544109881e-05,
+ 8.290779078379273e-05,
+ 8.751150744501501e-05,
+ 9.41800099099055e-05,
+ 9.622493234928697e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5595703125,
+ "loss_eval": 1.3021488189697266,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 110.62977600097656,
+ 96.08146667480469,
+ 83.02938842773438,
+ 71.82244873046875,
+ 62.47097396850586
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.582613034173846e-05,
+ 8.177754352800548e-05,
+ 8.888287266017869e-05,
+ 9.501135355094448e-05,
+ 9.754132042871788e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.53125,
+ "loss_eval": 1.2963578701019287,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 115.87433624267578,
+ 99.99412536621094,
+ 86.81661987304688,
+ 75.194580078125,
+ 65.24598693847656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.453945727320388e-05,
+ 7.999759691301733e-05,
+ 8.587146294303238e-05,
+ 9.281275561079383e-05,
+ 9.684430551715195e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.537109375,
+ "loss_eval": 1.300926685333252,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 115.8588638305664,
+ 100.0324478149414,
+ 87.23123931884766,
+ 75.2608871459961,
+ 64.53407287597656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.783657201798633e-05,
+ 8.2304140960332e-05,
+ 8.792509470367804e-05,
+ 9.308305016020313e-05,
+ 9.498461440671235e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5302734375,
+ "loss_eval": 1.2952370643615723,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 121.24994659423828,
+ 103.9144515991211,
+ 88.99864959716797,
+ 75.50836944580078,
+ 64.28103637695312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.956428453326225e-05,
+ 8.667269139550626e-05,
+ 9.291838068747893e-05,
+ 9.890568617265671e-05,
+ 0.00010031831334345043
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.537109375,
+ "loss_eval": 1.3034818172454834,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 124.64612579345703,
+ 107.64379119873047,
+ 92.03299713134766,
+ 77.67626190185547,
+ 66.19109344482422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.466476381523535e-05,
+ 8.086472371360287e-05,
+ 8.857141801854596e-05,
+ 9.320858225692064e-05,
+ 9.685206168796867e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.521484375,
+ "loss_eval": 1.2701925039291382,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 128.4908905029297,
+ 110.93827819824219,
+ 95.34327697753906,
+ 80.90787506103516,
+ 68.56732940673828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.461471977876499e-05,
+ 8.18013577372767e-05,
+ 8.659388549858704e-05,
+ 9.226851398125291e-05,
+ 9.443429007660598e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5537109375,
+ "loss_eval": 1.2619553804397583,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 130.65846252441406,
+ 112.31464385986328,
+ 95.85350036621094,
+ 79.80601501464844,
+ 67.30303192138672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.368716615019366e-05,
+ 8.01649657660164e-05,
+ 8.653382974443957e-05,
+ 9.32966941036284e-05,
+ 9.312365727964789e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5576171875,
+ "loss_eval": 1.2436624765396118,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 133.13165283203125,
+ 114.61791229248047,
+ 97.15895080566406,
+ 81.40515899658203,
+ 69.13287353515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.137899228837341e-05,
+ 7.771244418108836e-05,
+ 8.332561264978722e-05,
+ 8.920324762584642e-05,
+ 8.9491848484613e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.239585518836975,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 136.59140014648438,
+ 117.42953491210938,
+ 99.51315307617188,
+ 83.76544189453125,
+ 69.16895294189453
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.198385719675571e-05,
+ 7.928090053610504e-05,
+ 8.52016091812402e-05,
+ 9.1185538622085e-05,
+ 9.257275087293237e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5673828125,
+ "loss_eval": 1.2780827283859253,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 139.33346557617188,
+ 119.61570739746094,
+ 102.05357360839844,
+ 85.16582489013672,
+ 70.09222412109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.267932232934982e-05,
+ 7.949839346110821e-05,
+ 8.610116492491215e-05,
+ 9.125673386733979e-05,
+ 9.256677003577352e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5419921875,
+ "loss_eval": 1.2823748588562012,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 141.82034301757812,
+ 122.27132415771484,
+ 103.36873626708984,
+ 86.49518585205078,
+ 71.40383911132812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.251821807585657e-05,
+ 7.807672955095768e-05,
+ 8.464990969514474e-05,
+ 8.788360719336197e-05,
+ 8.839634392643347e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.55859375,
+ "loss_eval": 1.2162373065948486,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 144.1250762939453,
+ 123.32146453857422,
+ 105.33419036865234,
+ 87.95057678222656,
+ 71.54405975341797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.141266542021185e-05,
+ 7.827960507711396e-05,
+ 8.527522732038051e-05,
+ 9.162349306279793e-05,
+ 8.910013275453821e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5712890625,
+ "loss_eval": 1.2267348766326904,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 145.35816955566406,
+ 123.92304229736328,
+ 106.45323944091797,
+ 89.38124084472656,
+ 72.80756378173828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.914530968060717e-05,
+ 7.74021100369282e-05,
+ 8.25833558337763e-05,
+ 8.843685645842925e-05,
+ 8.765731763560325e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615234375,
+ "loss_eval": 1.2464958429336548,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 146.9630126953125,
+ 126.59661102294922,
+ 108.23934936523438,
+ 90.85575103759766,
+ 72.80107879638672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.045341044431552e-05,
+ 7.726218609604985e-05,
+ 8.23774971649982e-05,
+ 8.931937190936878e-05,
+ 9.00102750165388e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5556640625,
+ "loss_eval": 1.226228952407837,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 150.7821044921875,
+ 129.61668395996094,
+ 108.98286437988281,
+ 89.68734741210938,
+ 72.85277557373047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.34334607841447e-05,
+ 7.900002674432471e-05,
+ 8.469617750961334e-05,
+ 8.900847751647234e-05,
+ 8.846351556712762e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.572265625,
+ "loss_eval": 1.2140324115753174,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 151.44703674316406,
+ 129.4413604736328,
+ 110.14541625976562,
+ 91.28382110595703,
+ 74.19001770019531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.830286292824894e-05,
+ 7.440579793183133e-05,
+ 8.040962711675093e-05,
+ 8.615498518338427e-05,
+ 8.749076368985698e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5771484375,
+ "loss_eval": 1.2101829051971436,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 153.631591796875,
+ 132.0617218017578,
+ 110.9275894165039,
+ 92.176513671875,
+ 73.5614242553711
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.137414650060236e-05,
+ 7.97546817921102e-05,
+ 8.503787830704823e-05,
+ 9.110210521612316e-05,
+ 9.112519910559058e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.1954376697540283,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 155.2130584716797,
+ 133.7564697265625,
+ 113.44039916992188,
+ 93.51616668701172,
+ 74.26422882080078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.436865416821092e-05,
+ 8.266629447462037e-05,
+ 8.722272468730807e-05,
+ 9.24940686672926e-05,
+ 9.228193084709346e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.568359375,
+ "loss_eval": 1.2368288040161133,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 156.52346801757812,
+ 134.0899200439453,
+ 113.28357696533203,
+ 93.11508178710938,
+ 74.41522216796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.232115603983402e-05,
+ 7.883219950599596e-05,
+ 8.385341061512008e-05,
+ 8.885351417120546e-05,
+ 8.985922613646835e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5849609375,
+ "loss_eval": 1.1935406923294067,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 157.1343536376953,
+ 136.0911102294922,
+ 115.831298828125,
+ 94.6191177368164,
+ 74.93243408203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.815487722633407e-05,
+ 7.527582783950493e-05,
+ 8.152059308486059e-05,
+ 8.597332634963095e-05,
+ 8.487412560498342e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1716928482055664,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 158.87771606445312,
+ 136.84617614746094,
+ 115.38484191894531,
+ 95.1522445678711,
+ 75.46046447753906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.11698376107961e-05,
+ 7.946270488901064e-05,
+ 8.58406419865787e-05,
+ 8.943407010519877e-05,
+ 8.97061254363507e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5908203125,
+ "loss_eval": 1.1900701522827148,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 158.57237243652344,
+ 135.3989715576172,
+ 115.39788818359375,
+ 94.26459503173828,
+ 74.65320587158203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.135280611691996e-05,
+ 7.875803567003459e-05,
+ 8.35385944810696e-05,
+ 9.056212002178654e-05,
+ 8.802927186479792e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.58984375,
+ "loss_eval": 1.1936118602752686,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 161.12164306640625,
+ 138.0847930908203,
+ 116.51541137695312,
+ 96.06510925292969,
+ 75.79708862304688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.089033169904724e-05,
+ 7.788193033775315e-05,
+ 8.262616029242054e-05,
+ 8.66727132233791e-05,
+ 8.98441721801646e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1777372360229492,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 162.0608673095703,
+ 138.521728515625,
+ 117.39189147949219,
+ 96.19066619873047,
+ 75.76524353027344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.102260860847309e-05,
+ 7.727317279204726e-05,
+ 8.381292718695477e-05,
+ 8.586590411141515e-05,
+ 8.668057853356004e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1749277114868164,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 161.66477966308594,
+ 138.45208740234375,
+ 118.22246551513672,
+ 96.99449920654297,
+ 76.40058135986328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.717143696732819e-05,
+ 7.219286635518074e-05,
+ 7.78083413024433e-05,
+ 8.173672540578991e-05,
+ 8.14773520687595e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.183088779449463,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 163.6893310546875,
+ 140.37518310546875,
+ 119.34339904785156,
+ 96.78111267089844,
+ 75.42987823486328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.809990736655891e-05,
+ 7.472001743735746e-05,
+ 7.982164243003353e-05,
+ 8.6645879491698e-05,
+ 8.662666368763894e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.1695549488067627,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 164.063232421875,
+ 140.68441772460938,
+ 118.45069122314453,
+ 96.70316314697266,
+ 75.4270248413086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.114750769687817e-05,
+ 7.883143553044647e-05,
+ 8.33458179840818e-05,
+ 8.941504347603768e-05,
+ 8.57952400110662e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.1776624917984009,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 163.89480590820312,
+ 140.18966674804688,
+ 119.30622863769531,
+ 97.97473907470703,
+ 76.34546661376953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.944040069356561e-05,
+ 7.674084190512076e-05,
+ 8.196813723770902e-05,
+ 8.950124902185053e-05,
+ 8.920513209886849e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1852729320526123,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 165.47622680664062,
+ 141.58221435546875,
+ 119.55635070800781,
+ 98.0240707397461,
+ 76.13150787353516
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.238827674882486e-05,
+ 7.85816737334244e-05,
+ 8.403261745115742e-05,
+ 8.998374687507749e-05,
+ 8.897150837583467e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5869140625,
+ "loss_eval": 1.1676307916641235,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 164.69053649902344,
+ 142.07537841796875,
+ 121.09794616699219,
+ 99.6556396484375,
+ 77.98886108398438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.123505201889202e-05,
+ 7.861913036322221e-05,
+ 8.443401020485908e-05,
+ 8.940586121752858e-05,
+ 8.976398385129869e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1959164142608643,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 164.97906494140625,
+ 141.9008026123047,
+ 120.19933319091797,
+ 98.47044372558594,
+ 76.0770263671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.325963088078424e-05,
+ 8.044692367548123e-05,
+ 8.460321987513453e-05,
+ 9.052005771081895e-05,
+ 8.883728878572583e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1650420427322388,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 167.11508178710938,
+ 144.4076690673828,
+ 121.90902709960938,
+ 99.70268249511719,
+ 77.1493911743164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.938715523574501e-05,
+ 7.598697993671522e-05,
+ 8.122843428282067e-05,
+ 8.419268124271184e-05,
+ 8.758077456150204e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1334974765777588,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 167.23953247070312,
+ 143.8128662109375,
+ 121.41165924072266,
+ 99.37804412841797,
+ 76.86026763916016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.253287185449153e-05,
+ 7.92228602222167e-05,
+ 8.514960791217163e-05,
+ 9.06435088836588e-05,
+ 8.896931103663519e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1443839073181152,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 167.02175903320312,
+ 143.56179809570312,
+ 121.07357025146484,
+ 98.59805297851562,
+ 76.59933471679688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.202434790087864e-05,
+ 7.884378283051774e-05,
+ 8.405950211454183e-05,
+ 8.979378617368639e-05,
+ 8.789195271674544e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.1233543157577515,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 168.8506622314453,
+ 144.7351531982422,
+ 122.07427978515625,
+ 100.25342559814453,
+ 77.3443832397461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.906851194798946e-05,
+ 7.469953561667353e-05,
+ 7.91402708273381e-05,
+ 8.30625431262888e-05,
+ 8.482224802719429e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1078553199768066,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 167.80520629882812,
+ 145.0210418701172,
+ 123.11544036865234,
+ 101.08995056152344,
+ 77.6504898071289
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.715168274240568e-05,
+ 7.365776400547475e-05,
+ 7.808832015143707e-05,
+ 8.405041444348171e-05,
+ 8.283500210382044e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1213364601135254,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 168.5064697265625,
+ 144.57977294921875,
+ 122.67310333251953,
+ 100.03209686279297,
+ 76.30200958251953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.193082274170592e-05,
+ 7.761332381051034e-05,
+ 8.224599878303707e-05,
+ 8.772317232796922e-05,
+ 8.76585254445672e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.1593999862670898,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 168.2687225341797,
+ 145.1931610107422,
+ 123.04153442382812,
+ 100.33060455322266,
+ 77.3511734008789
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.396154978778213e-05,
+ 8.14273880678229e-05,
+ 8.724145300220698e-05,
+ 9.166308882413432e-05,
+ 9.03390027815476e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1506351232528687,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 169.19711303710938,
+ 145.7348175048828,
+ 122.21668243408203,
+ 100.78398895263672,
+ 77.85338592529297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.148115400923416e-05,
+ 7.858182652853429e-05,
+ 8.472947956761345e-05,
+ 8.831475861370564e-05,
+ 9.002227307064459e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1426208019256592,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 169.87611389160156,
+ 144.65980529785156,
+ 122.2470932006836,
+ 99.39762115478516,
+ 76.66820526123047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.574502524221316e-05,
+ 8.358684863196686e-05,
+ 8.949989569373429e-05,
+ 9.581056656315923e-05,
+ 9.291989408666268e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.146412968635559,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 167.4952850341797,
+ 143.16302490234375,
+ 119.86161804199219,
+ 97.8775863647461,
+ 75.75617980957031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.487049151677638e-05,
+ 8.140889985952526e-05,
+ 8.958375110523775e-05,
+ 9.491044329479337e-05,
+ 9.230020805262029e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6064453125,
+ "loss_eval": 1.1555390357971191,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 169.03530883789062,
+ 144.57913208007812,
+ 122.20657348632812,
+ 100.42291259765625,
+ 77.34142303466797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.283290324267e-05,
+ 8.043479465413839e-05,
+ 8.612027886556461e-05,
+ 9.16399949346669e-05,
+ 9.119778405874968e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.145568609237671,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 168.97242736816406,
+ 144.64987182617188,
+ 121.88980865478516,
+ 99.5838394165039,
+ 76.98419952392578
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.706385804340243e-05,
+ 8.52798912092112e-05,
+ 9.141799091594294e-05,
+ 9.48576707742177e-05,
+ 9.280487574869767e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.173735499382019,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 169.5861053466797,
+ 145.18853759765625,
+ 123.36368560791016,
+ 100.5948257446289,
+ 77.515380859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.197257218649611e-05,
+ 7.774284313200042e-05,
+ 8.511826308676973e-05,
+ 9.136695007327944e-05,
+ 8.776389586273581e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.125669240951538,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 168.54624938964844,
+ 144.20028686523438,
+ 120.96566009521484,
+ 98.61659240722656,
+ 75.90725708007812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.784854824421927e-05,
+ 8.512740896549076e-05,
+ 9.021186269819736e-05,
+ 9.572209819452837e-05,
+ 9.406798199051991e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.143272042274475,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 167.1956024169922,
+ 144.33364868164062,
+ 121.39191436767578,
+ 99.15605926513672,
+ 76.89862060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.683308649575338e-05,
+ 8.338083716807887e-05,
+ 9.210927237290889e-05,
+ 9.760970715433359e-05,
+ 9.435461106477305e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1492671966552734,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 168.5964813232422,
+ 144.6849365234375,
+ 122.38106536865234,
+ 99.73613739013672,
+ 77.72384643554688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.762440509395674e-05,
+ 8.45814065542072e-05,
+ 9.048492211150005e-05,
+ 9.445888281334192e-05,
+ 9.163413778878748e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1285452842712402,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 169.4349365234375,
+ 145.3781280517578,
+ 122.81243896484375,
+ 100.45063781738281,
+ 77.73384094238281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.32980333850719e-05,
+ 8.07973847258836e-05,
+ 8.676065772306174e-05,
+ 8.88932918314822e-05,
+ 8.98713551578112e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.1177959442138672,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 167.85089111328125,
+ 143.60365295410156,
+ 120.23004913330078,
+ 98.14772033691406,
+ 76.00984191894531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.664797885809094e-05,
+ 8.470165630569682e-05,
+ 9.283467807108536e-05,
+ 9.794873039936647e-05,
+ 9.169583063339815e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.1301027536392212,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 167.4250946044922,
+ 144.43685913085938,
+ 120.5447769165039,
+ 98.6132583618164,
+ 76.67144775390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.264616579050198e-05,
+ 8.033386984607205e-05,
+ 8.730305125936866e-05,
+ 9.157789463642985e-05,
+ 9.014589886646718e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.1262563467025757,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 167.57273864746094,
+ 143.9201202392578,
+ 120.18034362792969,
+ 99.7088851928711,
+ 77.43472290039062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.527784327976406e-05,
+ 8.20689310785383e-05,
+ 8.86347406776622e-05,
+ 9.488592331763357e-05,
+ 9.351663175038993e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1255381107330322,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 168.32432556152344,
+ 143.3669891357422,
+ 120.5047378540039,
+ 98.29914093017578,
+ 76.91972351074219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.1095946370624e-05,
+ 9.126035001827404e-05,
+ 9.773251076694578e-05,
+ 0.00010036173625849187,
+ 9.892736852634698e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.625,
+ "loss_eval": 1.121397614479065,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 167.19789123535156,
+ 143.76556396484375,
+ 120.66227722167969,
+ 98.42743682861328,
+ 76.89801788330078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.633089262526482e-05,
+ 8.335815800819546e-05,
+ 9.061676246346906e-05,
+ 9.574641444487497e-05,
+ 9.495441918261349e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1192781925201416,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 166.93948364257812,
+ 142.26893615722656,
+ 119.55793762207031,
+ 97.94837951660156,
+ 76.42357635498047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.782453758409247e-05,
+ 8.425768464803696e-05,
+ 9.212247096002102e-05,
+ 9.447304182685912e-05,
+ 9.302303078584373e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1216533184051514,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 166.6027069091797,
+ 143.06201171875,
+ 120.18063354492188,
+ 98.2688217163086,
+ 76.29009246826172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.051560871535912e-05,
+ 8.871743193594739e-05,
+ 9.67002852121368e-05,
+ 0.00010364756599301472,
+ 9.896839765133336e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.1287095546722412,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 167.1055908203125,
+ 142.63758850097656,
+ 119.64879608154297,
+ 97.64229583740234,
+ 76.44933319091797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.66752491472289e-05,
+ 8.481083932565525e-05,
+ 9.087422949960455e-05,
+ 9.747539297677577e-05,
+ 9.831935312831774e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1142747402191162,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 165.7790985107422,
+ 141.932861328125,
+ 119.308349609375,
+ 97.3916244506836,
+ 76.28073120117188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.054008503677323e-05,
+ 8.828196587273851e-05,
+ 9.400352428201586e-05,
+ 0.0001006148086162284,
+ 9.63730999501422e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.1091513633728027,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 166.0056915283203,
+ 142.36737060546875,
+ 119.14185333251953,
+ 97.59127044677734,
+ 76.91047668457031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.921652286313474e-05,
+ 8.842039096634835e-05,
+ 9.518962178844959e-05,
+ 9.989101090468466e-05,
+ 9.532425610814244e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.109208106994629,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 165.06881713867188,
+ 141.9323272705078,
+ 119.31546783447266,
+ 97.39105987548828,
+ 76.88532257080078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.891654968261719e-05,
+ 8.609334327047691e-05,
+ 9.276948549086228e-05,
+ 9.923002653522417e-05,
+ 9.674452303443104e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.102659821510315,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 165.70677185058594,
+ 141.7493896484375,
+ 119.19147491455078,
+ 97.61845397949219,
+ 76.11932373046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.021068788366392e-05,
+ 8.757255272939801e-05,
+ 9.637014591135085e-05,
+ 0.00010106353875016794,
+ 9.785306610865518e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1182312965393066,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 164.398193359375,
+ 141.26121520996094,
+ 118.28160095214844,
+ 96.55244445800781,
+ 75.79473876953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.341020293300971e-05,
+ 9.248757123714313e-05,
+ 9.663405944593251e-05,
+ 0.00010157335054827854,
+ 9.801337728276849e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1038966178894043,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 164.95956420898438,
+ 141.71456909179688,
+ 118.70948028564453,
+ 96.87312316894531,
+ 76.1374740600586
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.227327634813264e-05,
+ 9.05249617062509e-05,
+ 9.777413652045652e-05,
+ 0.00010368443327024579,
+ 9.96799353742972e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1255979537963867,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 164.7284393310547,
+ 140.8751678466797,
+ 118.047607421875,
+ 96.35321044921875,
+ 75.17439270019531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.813700358383358e-05,
+ 8.510561019647866e-05,
+ 9.316992509411648e-05,
+ 9.944752673618495e-05,
+ 9.348603634862229e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6298828125,
+ "loss_eval": 1.1074620485305786,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 164.93450927734375,
+ 140.53248596191406,
+ 117.69375610351562,
+ 96.16271209716797,
+ 75.15106201171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.089678158285096e-05,
+ 9.048588981386274e-05,
+ 9.746959403855726e-05,
+ 0.00010185279097640887,
+ 9.633745503379032e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.118239164352417,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 164.21043395996094,
+ 139.88815307617188,
+ 117.45735931396484,
+ 95.94420623779297,
+ 75.4442138671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.050485485000536e-05,
+ 8.884233102435246e-05,
+ 9.638822666602209e-05,
+ 9.927270002663136e-05,
+ 9.542587213218212e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.1022429466247559,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 163.64498901367188,
+ 139.56788635253906,
+ 117.33267974853516,
+ 95.80303192138672,
+ 75.07954406738281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.35943064885214e-05,
+ 9.346263686893508e-05,
+ 0.0001004879450192675,
+ 0.00010487801773706451,
+ 0.0001030422281473875
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.101865530014038,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 163.15895080566406,
+ 139.2528533935547,
+ 116.07748413085938,
+ 94.62651824951172,
+ 74.8349380493164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.33335579955019e-05,
+ 9.210313146468252e-05,
+ 9.823974687606096e-05,
+ 0.00010392737749498338,
+ 9.883133316179737e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.107062816619873,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 162.9849090576172,
+ 138.823974609375,
+ 116.6355972290039,
+ 95.05895233154297,
+ 74.80722045898438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.333245204994455e-05,
+ 9.167871758108959e-05,
+ 9.739672532305121e-05,
+ 0.00010222326818620786,
+ 9.918824798660353e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6328125,
+ "loss_eval": 1.1088743209838867,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 162.9673614501953,
+ 138.89553833007812,
+ 116.67662811279297,
+ 94.80388641357422,
+ 74.41240692138672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.250313112512231e-05,
+ 9.097345173358917e-05,
+ 9.694542677607387e-05,
+ 0.00010250341438222677,
+ 9.611865971237421e-05
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6318359375,
+ "loss_eval": 1.1069759130477905,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 163.01101684570312,
+ 138.9472198486328,
+ 116.52082824707031,
+ 94.81626892089844,
+ 74.34078216552734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.468546730000526e-05,
+ 9.535141725791618e-05,
+ 9.998930181609467e-05,
+ 0.00010477996693225577,
+ 0.00010350123920943588
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6455078125,
+ "loss_eval": 1.11004638671875,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 162.48593139648438,
+ 138.60171508789062,
+ 116.15435028076172,
+ 94.63046264648438,
+ 74.77122497558594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.888062438927591e-05,
+ 9.835455421125516e-05,
+ 0.00010451052366988733,
+ 0.00010972235031658784,
+ 0.00010192779154749587
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.63671875,
+ "loss_eval": 1.1166486740112305,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 162.33985900878906,
+ 138.57908630371094,
+ 115.86516571044922,
+ 94.62572479248047,
+ 74.61656951904297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.704938227310777e-05,
+ 9.788614988792688e-05,
+ 0.00010670957271941006,
+ 0.00011224307672819123,
+ 0.00010563644173089415
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.1027870178222656,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 162.28363037109375,
+ 137.98855590820312,
+ 115.68619537353516,
+ 94.57305145263672,
+ 74.67822265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.545320451958105e-05,
+ 9.513215627521276e-05,
+ 0.00010359021689509973,
+ 0.00010905940871452913,
+ 0.00010360238957218826
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6416015625,
+ "loss_eval": 1.1074315309524536,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 161.65008544921875,
+ 138.2888946533203,
+ 115.37015533447266,
+ 94.0649185180664,
+ 74.40010070800781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.725856605451554e-05,
+ 9.554363350616768e-05,
+ 0.00010503961675567552,
+ 0.00011096282105427235,
+ 0.00010341637971578166
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.104964017868042,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 162.56822204589844,
+ 138.35604858398438,
+ 115.56212615966797,
+ 93.74854278564453,
+ 74.29190826416016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.511068881489336e-05,
+ 9.339748066850007e-05,
+ 0.00010132823081221431,
+ 0.00010685007873689756,
+ 0.00010203333658864722
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.110845923423767,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 161.8057861328125,
+ 137.9845733642578,
+ 115.51632690429688,
+ 94.12870788574219,
+ 74.2806167602539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.701891783857718e-05,
+ 9.453850361751392e-05,
+ 0.00010162424587178975,
+ 0.00010690372437238693,
+ 0.0001028447222779505
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.640625,
+ "loss_eval": 1.108534574508667,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 161.5404815673828,
+ 137.67727661132812,
+ 115.56287384033203,
+ 94.2837142944336,
+ 74.19786834716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.555947715649381e-05,
+ 9.61149125942029e-05,
+ 0.00010081662185257301,
+ 0.00010581265814835206,
+ 0.00010205370926996693
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.642578125,
+ "loss_eval": 1.1068053245544434,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 161.6155242919922,
+ 137.77752685546875,
+ 115.26612854003906,
+ 93.79004669189453,
+ 74.01652526855469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.888345473678783e-05,
+ 9.766507719177753e-05,
+ 0.00010646588634699583,
+ 0.0001093660102924332,
+ 0.0001023485092446208
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.640625,
+ "loss_eval": 1.112060308456421,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 161.4155731201172,
+ 137.4070281982422,
+ 114.93219757080078,
+ 93.83850860595703,
+ 74.04694366455078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.62668312038295e-05,
+ 9.635779133532196e-05,
+ 0.00010364993795519695,
+ 0.00010628051677485928,
+ 0.00010416742588859051
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.1054459810256958,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 161.10385131835938,
+ 137.37892150878906,
+ 114.876953125,
+ 93.37522888183594,
+ 73.81317901611328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.967578469309956e-05,
+ 9.864033199846745e-05,
+ 0.00010763857426354662,
+ 0.00011277131852693856,
+ 0.0001057170593412593
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.634765625,
+ "loss_eval": 1.1104364395141602,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 160.9930419921875,
+ 137.13717651367188,
+ 114.8873062133789,
+ 93.33486938476562,
+ 74.0313949584961
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.793028973741457e-05,
+ 9.762586705619469e-05,
+ 0.00010612032929202542,
+ 0.00010882189963012934,
+ 0.00010218457464361563
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 1.107926607131958,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 161.131103515625,
+ 136.96864318847656,
+ 114.8429183959961,
+ 93.4638442993164,
+ 74.06806945800781
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.899801468942314e-05,
+ 9.761646651895717e-05,
+ 0.00010549664148129523,
+ 0.00011210257798666134,
+ 0.000105380589957349
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1014349460601807,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 160.92770385742188,
+ 137.00291442871094,
+ 114.67124938964844,
+ 93.55059051513672,
+ 73.94056701660156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.758921467233449e-05,
+ 9.86124505288899e-05,
+ 0.0001072377126547508,
+ 0.00011291914415778592,
+ 0.00010492445289855823
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1031121015548706,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 160.88087463378906,
+ 136.80621337890625,
+ 114.49836730957031,
+ 93.34219360351562,
+ 73.85013580322266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.935505320550874e-05,
+ 9.829271584749222e-05,
+ 0.00010722390288719907,
+ 0.00011369076673872769,
+ 0.0001048692429321818
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.64453125,
+ "loss_eval": 1.105837106704712,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 160.87530517578125,
+ 136.97203063964844,
+ 114.57328033447266,
+ 93.34746551513672,
+ 73.79950714111328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.837936184136197e-05,
+ 9.732619946589693e-05,
+ 0.00010843550262507051,
+ 0.00011282044579274952,
+ 0.00010489222768228501
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6435546875,
+ "loss_eval": 1.1061646938323975,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 160.83152770996094,
+ 136.82012939453125,
+ 114.41039276123047,
+ 93.26609802246094,
+ 73.75130462646484
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.924134453991428e-05,
+ 9.699882502900437e-05,
+ 0.00010844215285032988,
+ 0.00011508698662510142,
+ 0.00010382343316450715
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1083133220672607,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 160.8388214111328,
+ 136.79220581054688,
+ 114.45349884033203,
+ 93.23229217529297,
+ 73.71869659423828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.902873378247023e-05,
+ 9.731733007356524e-05,
+ 0.0001077003325917758,
+ 0.00011335347517160699,
+ 0.00010528459824854508
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1074192523956299,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 160.82676696777344,
+ 136.7546844482422,
+ 114.41687774658203,
+ 93.24365234375,
+ 73.72588348388672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.967860048869625e-05,
+ 9.900779696181417e-05,
+ 0.00010877639579121023,
+ 0.00011359385825926438,
+ 0.0001041799841914326
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1075721979141235,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 160.8055419921875,
+ 136.8428955078125,
+ 114.41191864013672,
+ 93.23294067382812,
+ 73.72472381591797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.870402962202206e-05,
+ 9.879077697405592e-05,
+ 0.00010879703768296167,
+ 0.00011367550177965313,
+ 0.00010426441440358758
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.107743263244629,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 160.795166015625,
+ 136.82778930664062,
+ 114.41122436523438,
+ 93.22368621826172,
+ 73.72713470458984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.868239092407748e-05,
+ 9.911284723784775e-05,
+ 0.00010880655463552102,
+ 0.00011359110794728622,
+ 0.00010424658830743283
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.646484375,
+ "loss_eval": 1.1077194213867188,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.696551322937012,
+ 8.737784385681152,
+ 8.813130378723145,
+ 8.844642639160156,
+ 8.889528274536133
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005607507191598415,
+ 0.0005558764678426087,
+ 0.0005541853606700897,
+ 0.0005498801474459469,
+ 0.0005458085797727108
+ ],
+ "gamma_dfa": 0.002593531389720738,
+ "gamma_dfa_per_layer": [
+ 0.011040969751775265,
+ 0.0018278355710208416,
+ -0.019951725378632545,
+ 0.01745704561471939
+ ],
+ "acc_eval": 0.091796875,
+ "loss_eval": 2.3707523345947266,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 543.6214599609375,
+ 970.167724609375,
+ 1128.5582275390625,
+ 1385.4898681640625,
+ 1506.6824951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006441785371862352,
+ 0.0006426527979783714,
+ 0.0006424304447136819,
+ 0.000642389350105077,
+ 0.0006423307931981981
+ ],
+ "gamma_dfa": 0.013619338162243366,
+ "gamma_dfa_per_layer": [
+ 0.044537801295518875,
+ 0.008280456066131592,
+ -0.026753954589366913,
+ 0.02841304987668991
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 7.057413101196289,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 877.8099365234375,
+ 2093.12060546875,
+ 2686.85400390625,
+ 3536.0849609375,
+ 3998.738037109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007192303892225027,
+ 0.000718857510946691,
+ 0.0007187117007561028,
+ 0.0007188154268078506,
+ 0.0007185889990068972
+ ],
+ "gamma_dfa": -0.0027784015983343124,
+ "gamma_dfa_per_layer": [
+ 0.04956255108118057,
+ -0.024007968604564667,
+ -0.02988382987678051,
+ -0.006784358993172646
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 11.82400131225586,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1082.57763671875,
+ 3122.52001953125,
+ 4171.595703125,
+ 5502.81494140625,
+ 6367.2392578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007569500594399869,
+ 0.0007553253090009093,
+ 0.0007550596492365003,
+ 0.0007549565634690225,
+ 0.0007544843829236925
+ ],
+ "gamma_dfa": -0.004858810920268297,
+ "gamma_dfa_per_layer": [
+ 0.06696394830942154,
+ -0.024477044120430946,
+ -0.04227307811379433,
+ -0.019649069756269455
+ ],
+ "acc_eval": 0.18359375,
+ "loss_eval": 24.264713287353516,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1244.07275390625,
+ 4114.89111328125,
+ 5548.310546875,
+ 7262.12744140625,
+ 8410.1474609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007311897934414446,
+ 0.0007286664913408458,
+ 0.0007287323824129999,
+ 0.0007287483895197511,
+ 0.0007287858170457184
+ ],
+ "gamma_dfa": -0.003940413473173976,
+ "gamma_dfa_per_layer": [
+ 0.06546925008296967,
+ -0.03793267905712128,
+ -0.03520221635699272,
+ -0.008096008561551571
+ ],
+ "acc_eval": 0.197265625,
+ "loss_eval": 21.850379943847656,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1357.7320556640625,
+ 5130.4609375,
+ 7149.40380859375,
+ 9744.58984375,
+ 11396.052734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000750180275645107,
+ 0.0007480062777176499,
+ 0.0007475404418073595,
+ 0.0007476753671653569,
+ 0.0007474455051124096
+ ],
+ "gamma_dfa": -6.745467544533312e-06,
+ "gamma_dfa_per_layer": [
+ 0.08006488531827927,
+ -0.0292807687073946,
+ -0.04997118189930916,
+ -0.0008399165817536414
+ ],
+ "acc_eval": 0.2314453125,
+ "loss_eval": 30.650737762451172,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1438.5594482421875,
+ 5736.68994140625,
+ 8271.92578125,
+ 11658.373046875,
+ 13768.2861328125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000744938850402832,
+ 0.0007369474042207003,
+ 0.0007347911596298218,
+ 0.0007346841157414019,
+ 0.000734883826225996
+ ],
+ "gamma_dfa": -0.0024929028004407883,
+ "gamma_dfa_per_layer": [
+ 0.08933529257774353,
+ -0.03695790469646454,
+ -0.04257381707429886,
+ -0.019775182008743286
+ ],
+ "acc_eval": 0.23046875,
+ "loss_eval": 42.61720275878906,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 1512.00244140625,
+ 6517.73779296875,
+ 9229.724609375,
+ 13440.5166015625,
+ 16669.212890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007609400781802833,
+ 0.0007555288611911237,
+ 0.0007558621582575142,
+ 0.0007557112840004265,
+ 0.0007554451585747302
+ ],
+ "gamma_dfa": -0.007545993197709322,
+ "gamma_dfa_per_layer": [
+ 0.08795229345560074,
+ -0.03476891666650772,
+ -0.06410981714725494,
+ -0.01925753243267536
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 50.873321533203125,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 1582.1080322265625,
+ 7188.6318359375,
+ 9899.5947265625,
+ 15346.5009765625,
+ 19886.591796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007456639432348311,
+ 0.0007417471497319639,
+ 0.0007396289147436619,
+ 0.0007396984728984535,
+ 0.0007395402644760907
+ ],
+ "gamma_dfa": -0.009718619287014008,
+ "gamma_dfa_per_layer": [
+ 0.09109380096197128,
+ -0.042414966970682144,
+ -0.04605134204030037,
+ -0.0415019690990448
+ ],
+ "acc_eval": 0.189453125,
+ "loss_eval": 54.14390182495117,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 1618.51708984375,
+ 7916.01416015625,
+ 10608.3408203125,
+ 17416.95703125,
+ 24058.658203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007598118390887976,
+ 0.0007534913602285087,
+ 0.0007532819290645421,
+ 0.0007532560266554356,
+ 0.0007529302965849638
+ ],
+ "gamma_dfa": 0.0011779842898249626,
+ "gamma_dfa_per_layer": [
+ 0.10601411014795303,
+ -0.0355507917702198,
+ -0.04322661831974983,
+ -0.022524762898683548
+ ],
+ "acc_eval": 0.169921875,
+ "loss_eval": 79.9201889038086,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 1708.6558837890625,
+ 8872.5908203125,
+ 11589.568359375,
+ 19666.24609375,
+ 28447.203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000754358887206763,
+ 0.0007440761546604335,
+ 0.0007443547365255654,
+ 0.0007444044458679855,
+ 0.0007447295938618481
+ ],
+ "gamma_dfa": -0.006681790575385094,
+ "gamma_dfa_per_layer": [
+ 0.12310357391834259,
+ -0.054726000875234604,
+ -0.061426255851984024,
+ -0.03367847949266434
+ ],
+ "acc_eval": 0.189453125,
+ "loss_eval": 117.76714324951172,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 1757.5994873046875,
+ 10265.8017578125,
+ 13090.66796875,
+ 22099.814453125,
+ 34584.30078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000756443478167057,
+ 0.0007464477675966918,
+ 0.000743720680475235,
+ 0.0007434834260493517,
+ 0.0007420994224958122
+ ],
+ "gamma_dfa": -0.01398628018796444,
+ "gamma_dfa_per_layer": [
+ 0.12564796209335327,
+ -0.05404478684067726,
+ -0.07238315045833588,
+ -0.05516514554619789
+ ],
+ "acc_eval": 0.189453125,
+ "loss_eval": 103.90010070800781,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 1799.9754638671875,
+ 11735.4208984375,
+ 14739.4091796875,
+ 24244.48828125,
+ 40467.53125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007648739847354591,
+ 0.0007477994076907635,
+ 0.0007476488244719803,
+ 0.0007475496386177838,
+ 0.0007478601182810962
+ ],
+ "gamma_dfa": -0.005489904433488846,
+ "gamma_dfa_per_layer": [
+ 0.1469549834728241,
+ -0.04884009808301926,
+ -0.05759190022945404,
+ -0.06248260289430618
+ ],
+ "acc_eval": 0.2041015625,
+ "loss_eval": 124.61287689208984,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 1851.51123046875,
+ 13681.8662109375,
+ 17609.712890625,
+ 27533.84375,
+ 52049.0703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007830688264220953,
+ 0.0007742528687231243,
+ 0.0007744400063529611,
+ 0.0007723497110418975,
+ 0.0007720965659245849
+ ],
+ "gamma_dfa": -0.0014207642525434494,
+ "gamma_dfa_per_layer": [
+ 0.18515333533287048,
+ -0.04434240236878395,
+ -0.09712066501379013,
+ -0.0493733249604702
+ ],
+ "acc_eval": 0.142578125,
+ "loss_eval": 212.8883056640625,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 1899.2525634765625,
+ 16269.4736328125,
+ 21580.724609375,
+ 31947.771484375,
+ 66851.5703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000794055697042495,
+ 0.0007606232538819313,
+ 0.0007601877441629767,
+ 0.0007598533411510289,
+ 0.000759296934120357
+ ],
+ "gamma_dfa": 0.012796862982213497,
+ "gamma_dfa_per_layer": [
+ 0.206809401512146,
+ -0.04797299578785896,
+ -0.0716182291507721,
+ -0.03603072464466095
+ ],
+ "acc_eval": 0.1591796875,
+ "loss_eval": 268.9534912109375,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 1988.337890625,
+ 20679.96484375,
+ 27719.126953125,
+ 37757.640625,
+ 86759.0234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007827074150554836,
+ 0.0007373052649199963,
+ 0.0007380677270703018,
+ 0.000736265501473099,
+ 0.0007371739484369755
+ ],
+ "gamma_dfa": 0.003913283348083496,
+ "gamma_dfa_per_layer": [
+ 0.18332748115062714,
+ -0.05311701446771622,
+ -0.06076449155807495,
+ -0.053792841732501984
+ ],
+ "acc_eval": 0.2548828125,
+ "loss_eval": 367.0162048339844,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2074.877685546875,
+ 25397.2421875,
+ 35934.484375,
+ 45723.14453125,
+ 111497.4296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008315286249853671,
+ 0.0007900919299572706,
+ 0.0007844009087421,
+ 0.0007838390883989632,
+ 0.0007860813639126718
+ ],
+ "gamma_dfa": -0.002616437152028084,
+ "gamma_dfa_per_layer": [
+ 0.21044191718101501,
+ -0.05741831660270691,
+ -0.1141648143529892,
+ -0.049324534833431244
+ ],
+ "acc_eval": 0.1220703125,
+ "loss_eval": 449.4093322753906,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2160.0703125,
+ 30060.396484375,
+ 43998.6953125,
+ 54128.03515625,
+ 137197.4375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007943993550725281,
+ 0.0007568124565295875,
+ 0.0007565468549728394,
+ 0.0007549119181931019,
+ 0.0007542246603406966
+ ],
+ "gamma_dfa": 0.005578489974141121,
+ "gamma_dfa_per_layer": [
+ 0.21836650371551514,
+ -0.057003527879714966,
+ -0.08258379250764847,
+ -0.05646522343158722
+ ],
+ "acc_eval": 0.2099609375,
+ "loss_eval": 505.51385498046875,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 2261.926025390625,
+ 35914.08203125,
+ 53701.83203125,
+ 65022.0234375,
+ 174995.234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008322449866682291,
+ 0.0007640637923032045,
+ 0.0007639409159310162,
+ 0.000764198659453541,
+ 0.0007642150158062577
+ ],
+ "gamma_dfa": 0.017949961125850677,
+ "gamma_dfa_per_layer": [
+ 0.23718158900737762,
+ -0.05374513193964958,
+ -0.062201935797929764,
+ -0.04943467676639557
+ ],
+ "acc_eval": 0.2109375,
+ "loss_eval": 610.7471923828125,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 2326.78271484375,
+ 42755.171875,
+ 66353.453125,
+ 77731.328125,
+ 221615.828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008451915346086025,
+ 0.0007553622708655894,
+ 0.0007553161703981459,
+ 0.0007546090637333691,
+ 0.0007550025475211442
+ ],
+ "gamma_dfa": 0.029257358983159065,
+ "gamma_dfa_per_layer": [
+ 0.26171058416366577,
+ -0.04214981198310852,
+ -0.06413372606039047,
+ -0.03839761018753052
+ ],
+ "acc_eval": 0.19921875,
+ "loss_eval": 652.3941650390625,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 2443.6630859375,
+ 48300.12109375,
+ 77390.1015625,
+ 91484.09375,
+ 270700.96875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009103405755013227,
+ 0.0007761572487652302,
+ 0.0007760545704513788,
+ 0.0007730794604867697,
+ 0.0007728201453574002
+ ],
+ "gamma_dfa": 0.017114468850195408,
+ "gamma_dfa_per_layer": [
+ 0.26115190982818604,
+ -0.050561077892780304,
+ -0.08694136142730713,
+ -0.05519159510731697
+ ],
+ "acc_eval": 0.1669921875,
+ "loss_eval": 1354.747314453125,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 2499.429931640625,
+ 57379.33203125,
+ 93242.0859375,
+ 111601.9921875,
+ 332709.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010016581509262323,
+ 0.0007549687870778143,
+ 0.0007551733287982643,
+ 0.0007543734973296523,
+ 0.0007547553977929056
+ ],
+ "gamma_dfa": 0.047867871820926666,
+ "gamma_dfa_per_layer": [
+ 0.3270750641822815,
+ -0.037589848041534424,
+ -0.06097441166639328,
+ -0.037039317190647125
+ ],
+ "acc_eval": 0.2041015625,
+ "loss_eval": 1818.91650390625,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 2615.140625,
+ 75715.7109375,
+ 109683.390625,
+ 132553.84375,
+ 406621.46875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008831259910948575,
+ 0.0007625823491252959,
+ 0.0007627239683642983,
+ 0.0007604075944982469,
+ 0.0007611791370436549
+ ],
+ "gamma_dfa": 0.022762255743145943,
+ "gamma_dfa_per_layer": [
+ 0.27839380502700806,
+ -0.05395745486021042,
+ -0.07682197540998459,
+ -0.05656535178422928
+ ],
+ "acc_eval": 0.2119140625,
+ "loss_eval": 1167.954833984375,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 2742.37353515625,
+ 97227.28125,
+ 131140.8125,
+ 155048.3125,
+ 481929.84375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001124670379795134,
+ 0.0007696108077652752,
+ 0.0007702686125412583,
+ 0.0007697975379414856,
+ 0.0007697619148530066
+ ],
+ "gamma_dfa": 0.03202100656926632,
+ "gamma_dfa_per_layer": [
+ 0.300557404756546,
+ -0.04680653661489487,
+ -0.052118271589279175,
+ -0.0735485702753067
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 2470.89453125,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 2858.224609375,
+ 126260.15625,
+ 160387.703125,
+ 186178.890625,
+ 564007.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001086456119082868,
+ 0.0007698858971707523,
+ 0.0007706494652666152,
+ 0.0007701858412474394,
+ 0.0007703170995227993
+ ],
+ "gamma_dfa": 0.03411092050373554,
+ "gamma_dfa_per_layer": [
+ 0.3229827582836151,
+ -0.03976103663444519,
+ -0.05624774843454361,
+ -0.09053029119968414
+ ],
+ "acc_eval": 0.2080078125,
+ "loss_eval": 1589.14599609375,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3010.89697265625,
+ 156964.375,
+ 194623.5,
+ 223223.875,
+ 662826.6875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010667620226740837,
+ 0.0007900846539996564,
+ 0.0007894287118688226,
+ 0.0007884356309659779,
+ 0.0007912488654255867
+ ],
+ "gamma_dfa": 0.03901553526520729,
+ "gamma_dfa_per_layer": [
+ 0.34151530265808105,
+ -0.04678330570459366,
+ -0.06850147247314453,
+ -0.0701683834195137
+ ],
+ "acc_eval": 0.19921875,
+ "loss_eval": 1886.69091796875,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 3121.8056640625,
+ 191038.40625,
+ 232148.296875,
+ 265744.1875,
+ 761219.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011186219053342938,
+ 0.0007986227865330875,
+ 0.0007986134733073413,
+ 0.0007980577065609396,
+ 0.0007973008905537426
+ ],
+ "gamma_dfa": 0.027425863780081272,
+ "gamma_dfa_per_layer": [
+ 0.35862213373184204,
+ -0.061674464493989944,
+ -0.0841888040304184,
+ -0.10305541008710861
+ ],
+ "acc_eval": 0.185546875,
+ "loss_eval": 1700.765869140625,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 3283.62646484375,
+ 232390.3125,
+ 279218.25,
+ 315312.8125,
+ 875470.4375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001439103507436812,
+ 0.0007854723371565342,
+ 0.0007857424207031727,
+ 0.0007855244330130517,
+ 0.0007853199495002627
+ ],
+ "gamma_dfa": 0.03129031043499708,
+ "gamma_dfa_per_layer": [
+ 0.33073610067367554,
+ -0.058702368289232254,
+ -0.06629009544849396,
+ -0.080582395195961
+ ],
+ "acc_eval": 0.201171875,
+ "loss_eval": 3809.69873046875,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 3407.8984375,
+ 272082.28125,
+ 324674.25,
+ 365055.125,
+ 983575.625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001244095852598548,
+ 0.0008176793926395476,
+ 0.0008168797940015793,
+ 0.000815192295704037,
+ 0.0008157575502991676
+ ],
+ "gamma_dfa": 0.02919871360063553,
+ "gamma_dfa_per_layer": [
+ 0.3321998715400696,
+ -0.048228584229946136,
+ -0.057734884321689606,
+ -0.10944154858589172
+ ],
+ "acc_eval": 0.1650390625,
+ "loss_eval": 5145.80615234375,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 3570.579833984375,
+ 325919.34375,
+ 383859.84375,
+ 429527.59375,
+ 1121656.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013903328217566013,
+ 0.0008181754965335131,
+ 0.0008133396040648222,
+ 0.0008111604838632047,
+ 0.0008120551356114447
+ ],
+ "gamma_dfa": 0.04902177257463336,
+ "gamma_dfa_per_layer": [
+ 0.33004581928253174,
+ -0.017712868750095367,
+ -0.016218842938542366,
+ -0.10002701729536057
+ ],
+ "acc_eval": 0.1220703125,
+ "loss_eval": 4755.40869140625,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 3675.836181640625,
+ 381066.84375,
+ 446664.84375,
+ 495540.4375,
+ 1244910.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013685236917808652,
+ 0.0007945130346342921,
+ 0.0007943777018226683,
+ 0.0007925048121251166,
+ 0.0007924467790871859
+ ],
+ "gamma_dfa": 0.01623274479061365,
+ "gamma_dfa_per_layer": [
+ 0.27984413504600525,
+ -0.06000320240855217,
+ -0.06209240108728409,
+ -0.09281755238771439
+ ],
+ "acc_eval": 0.1962890625,
+ "loss_eval": 3555.3525390625,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 3779.81103515625,
+ 443408.34375,
+ 515845.65625,
+ 568047.125,
+ 1396404.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001294015790335834,
+ 0.0007740295841358602,
+ 0.0007753889658488333,
+ 0.0007745815673843026,
+ 0.000773973239120096
+ ],
+ "gamma_dfa": 0.048758171033114195,
+ "gamma_dfa_per_layer": [
+ 0.3447470963001251,
+ -0.05413726717233658,
+ -0.0899808406829834,
+ -0.005596304312348366
+ ],
+ "acc_eval": 0.1103515625,
+ "loss_eval": 8851.5302734375,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 3920.750732421875,
+ 517289.40625,
+ 595296.5625,
+ 655510.1875,
+ 1569922.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001448597526177764,
+ 0.0008134506642818451,
+ 0.0008149920613504946,
+ 0.0008116801618598402,
+ 0.0008117944234982133
+ ],
+ "gamma_dfa": 0.016455436125397682,
+ "gamma_dfa_per_layer": [
+ 0.28803595900535583,
+ -0.048596471548080444,
+ -0.07654894888401031,
+ -0.09706879407167435
+ ],
+ "acc_eval": 0.1767578125,
+ "loss_eval": 4626.505859375,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 4035.357666015625,
+ 605458.75,
+ 691596.8125,
+ 758344.75,
+ 1762235.125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013269236078485847,
+ 0.0007732360390946269,
+ 0.0007741436711512506,
+ 0.000773612700868398,
+ 0.0007734647369943559
+ ],
+ "gamma_dfa": 0.029436825774610043,
+ "gamma_dfa_per_layer": [
+ 0.2940990924835205,
+ -0.04052134230732918,
+ -0.05536778271198273,
+ -0.08046266436576843
+ ],
+ "acc_eval": 0.2578125,
+ "loss_eval": 2423.88037109375,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 4180.47998046875,
+ 680883.875,
+ 781089.375,
+ 856024.9375,
+ 1949442.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015648282133042812,
+ 0.0007914449088275433,
+ 0.0007915649330243468,
+ 0.0007914216257631779,
+ 0.0007914576563052833
+ ],
+ "gamma_dfa": 0.019646714441478252,
+ "gamma_dfa_per_layer": [
+ 0.2821764647960663,
+ -0.0451091043651104,
+ -0.08556324988603592,
+ -0.07291725277900696
+ ],
+ "acc_eval": 0.2314453125,
+ "loss_eval": 3942.80810546875,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 4309.49462890625,
+ 763385.4375,
+ 877493.9375,
+ 964321.4375,
+ 2131046.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001357953529804945,
+ 0.0008006176794879138,
+ 0.000801383052021265,
+ 0.0008009205921553075,
+ 0.0008007651194930077
+ ],
+ "gamma_dfa": 0.012816952541470528,
+ "gamma_dfa_per_layer": [
+ 0.3179120421409607,
+ -0.07943161576986313,
+ -0.08064424991607666,
+ -0.1065683662891388
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 4230.3056640625,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 4492.82568359375,
+ 851087.875,
+ 976163.875,
+ 1072469.125,
+ 2314147.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001730966498143971,
+ 0.000772459723521024,
+ 0.0007729437202215195,
+ 0.0007728235796093941,
+ 0.0007726353942416608
+ ],
+ "gamma_dfa": 0.03693788964301348,
+ "gamma_dfa_per_layer": [
+ 0.29988259077072144,
+ -0.0496492013335228,
+ -0.08479931950569153,
+ -0.0176825113594532
+ ],
+ "acc_eval": 0.1484375,
+ "loss_eval": 8231.34765625,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 4624.63720703125,
+ 951948.25,
+ 1092683.875,
+ 1196542.75,
+ 2542183.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002538386033847928,
+ 0.0007714434177614748,
+ 0.0007710265927016735,
+ 0.0007713963277637959,
+ 0.0007713483064435422
+ ],
+ "gamma_dfa": 0.04740711580961943,
+ "gamma_dfa_per_layer": [
+ 0.33979880809783936,
+ -0.04041346162557602,
+ -0.07300114631652832,
+ -0.03675573691725731
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 8949.130859375,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 4807.11767578125,
+ 1054507.625,
+ 1214753.0,
+ 1323814.0,
+ 2764538.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0027727719862014055,
+ 0.000796200183685869,
+ 0.0007976335473358631,
+ 0.0007973454194143414,
+ 0.0007971985614858568
+ ],
+ "gamma_dfa": 0.08554775826632977,
+ "gamma_dfa_per_layer": [
+ 0.5049943923950195,
+ -0.037710923701524734,
+ -0.07092456519603729,
+ -0.05416787043213844
+ ],
+ "acc_eval": 0.1162109375,
+ "loss_eval": 12713.4443359375,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 4955.41943359375,
+ 1174053.875,
+ 1354818.125,
+ 1476400.375,
+ 3014463.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020058690570294857,
+ 0.0008079316467046738,
+ 0.0008077211095951498,
+ 0.0008079909021034837,
+ 0.000808066048193723
+ ],
+ "gamma_dfa": -0.01097937673330307,
+ "gamma_dfa_per_layer": [
+ 0.23371317982673645,
+ -0.07769355922937393,
+ -0.08009498566389084,
+ -0.11984214186668396
+ ],
+ "acc_eval": 0.169921875,
+ "loss_eval": 5398.2822265625,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 5098.02978515625,
+ 1282560.25,
+ 1488493.125,
+ 1621443.25,
+ 3242451.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017661951715126634,
+ 0.0007956374902278185,
+ 0.0007964695687405765,
+ 0.0007961427327245474,
+ 0.0007956251502037048
+ ],
+ "gamma_dfa": 0.022673148661851883,
+ "gamma_dfa_per_layer": [
+ 0.3096145689487457,
+ -0.05532063543796539,
+ -0.08393190801143646,
+ -0.07966943085193634
+ ],
+ "acc_eval": 0.185546875,
+ "loss_eval": 4639.80908203125,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 5239.9326171875,
+ 1391390.625,
+ 1615340.375,
+ 1765558.375,
+ 3480115.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020867532584816217,
+ 0.0007667955360375345,
+ 0.0007673996733501554,
+ 0.0007673778454773128,
+ 0.0007672442006878555
+ ],
+ "gamma_dfa": 0.0395392719656229,
+ "gamma_dfa_per_layer": [
+ 0.33367329835891724,
+ -0.043648943305015564,
+ -0.055444151163101196,
+ -0.07642311602830887
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 9990.30859375,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 5359.44677734375,
+ 1521280.0,
+ 1767789.625,
+ 1930907.75,
+ 3750866.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017118212999776006,
+ 0.0007934573804959655,
+ 0.0007942463853396475,
+ 0.000793949409853667,
+ 0.0007934118038974702
+ ],
+ "gamma_dfa": 0.03361810464411974,
+ "gamma_dfa_per_layer": [
+ 0.3103788495063782,
+ -0.03702692314982414,
+ -0.055835530161857605,
+ -0.08304397761821747
+ ],
+ "acc_eval": 0.216796875,
+ "loss_eval": 9768.205078125,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 5546.62451171875,
+ 1660698.625,
+ 1925789.375,
+ 2096456.25,
+ 4028953.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017267497023567557,
+ 0.000821329711470753,
+ 0.0008239842718467116,
+ 0.0008229895029217005,
+ 0.0008229521918110549
+ ],
+ "gamma_dfa": 0.029660841450095177,
+ "gamma_dfa_per_layer": [
+ 0.35288333892822266,
+ -0.043948374688625336,
+ -0.0895853042602539,
+ -0.10070629417896271
+ ],
+ "acc_eval": 0.1884765625,
+ "loss_eval": 8935.0380859375,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 5664.30810546875,
+ 1784317.875,
+ 2078188.375,
+ 2264432.75,
+ 4288914.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0022900900803506374,
+ 0.0007636325899511576,
+ 0.0007642185082659125,
+ 0.0007641956908628345,
+ 0.0007639650139026344
+ ],
+ "gamma_dfa": 0.06175872636958957,
+ "gamma_dfa_per_layer": [
+ 0.4067830443382263,
+ -0.03052734024822712,
+ -0.06545087695121765,
+ -0.06376992166042328
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 8287.39453125,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 5794.2666015625,
+ 1915382.125,
+ 2237977.75,
+ 2434797.75,
+ 4568056.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001793600502423942,
+ 0.0008144167950376868,
+ 0.0008172079687938094,
+ 0.0008157116826623678,
+ 0.0008155000978149474
+ ],
+ "gamma_dfa": 0.034024693071842194,
+ "gamma_dfa_per_layer": [
+ 0.35199591517448425,
+ -0.03579515218734741,
+ -0.09812411665916443,
+ -0.08197787404060364
+ ],
+ "acc_eval": 0.1806640625,
+ "loss_eval": 8560.4384765625,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 5928.12158203125,
+ 2057562.625,
+ 2403872.5,
+ 2624509.5,
+ 4865204.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001855076989158988,
+ 0.0007629086030647159,
+ 0.0007635788642801344,
+ 0.0007633934146724641,
+ 0.0007630206528119743
+ ],
+ "gamma_dfa": 0.023082666099071503,
+ "gamma_dfa_per_layer": [
+ 0.27648454904556274,
+ -0.05024096742272377,
+ -0.0845799595117569,
+ -0.049332957714796066
+ ],
+ "acc_eval": 0.197265625,
+ "loss_eval": 10714.77734375,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 6079.8232421875,
+ 2190046.5,
+ 2564464.5,
+ 2797927.0,
+ 5132383.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015576905570924282,
+ 0.0007896191673353314,
+ 0.0007904896046966314,
+ 0.0007902018842287362,
+ 0.0007895485614426434
+ ],
+ "gamma_dfa": 0.03866780921816826,
+ "gamma_dfa_per_layer": [
+ 0.37201371788978577,
+ -0.049719154834747314,
+ -0.07755836844444275,
+ -0.09006495773792267
+ ],
+ "acc_eval": 0.19140625,
+ "loss_eval": 7322.5205078125,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 6184.03369140625,
+ 2339567.0,
+ 2744136.25,
+ 2990721.25,
+ 5426845.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020522314589470625,
+ 0.0007883926737122238,
+ 0.0007893759175203741,
+ 0.0007890417473390698,
+ 0.0007883401704020798
+ ],
+ "gamma_dfa": 0.021758251823484898,
+ "gamma_dfa_per_layer": [
+ 0.2855323553085327,
+ -0.04375234618782997,
+ -0.07049872726202011,
+ -0.08424827456474304
+ ],
+ "acc_eval": 0.2080078125,
+ "loss_eval": 13975.05859375,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 6295.5458984375,
+ 2477445.75,
+ 2917469.0,
+ 3179694.0,
+ 5727252.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002105356426909566,
+ 0.0008074102224782109,
+ 0.0008063287241384387,
+ 0.000806407246273011,
+ 0.0008067074231803417
+ ],
+ "gamma_dfa": 0.0267162024974823,
+ "gamma_dfa_per_layer": [
+ 0.30986034870147705,
+ -0.05209521949291229,
+ -0.09783680737018585,
+ -0.05306351184844971
+ ],
+ "acc_eval": 0.1435546875,
+ "loss_eval": 9590.544921875,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 6367.55029296875,
+ 2638468.75,
+ 3095811.75,
+ 3362978.75,
+ 6030941.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015475827967748046,
+ 0.0008064319263212383,
+ 0.0008070095209404826,
+ 0.0008065010770224035,
+ 0.0008065410074777901
+ ],
+ "gamma_dfa": 0.00636688619852066,
+ "gamma_dfa_per_layer": [
+ 0.29843205213546753,
+ -0.03980886936187744,
+ -0.06682014465332031,
+ -0.16633549332618713
+ ],
+ "acc_eval": 0.11328125,
+ "loss_eval": 12254.064453125,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 6482.18798828125,
+ 2769282.5,
+ 3257572.75,
+ 3548043.5,
+ 6284645.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0022430147510021925,
+ 0.0008079760009422898,
+ 0.000807179429102689,
+ 0.0008071344927884638,
+ 0.0008072732598520815
+ ],
+ "gamma_dfa": 0.04464401211589575,
+ "gamma_dfa_per_layer": [
+ 0.3536185026168823,
+ -0.02255946770310402,
+ -0.07369404286146164,
+ -0.07878894358873367
+ ],
+ "acc_eval": 0.181640625,
+ "loss_eval": 10079.115234375,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 6566.8623046875,
+ 2899506.0,
+ 3420720.5,
+ 3728966.75,
+ 6555012.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001695870072580874,
+ 0.000820032088086009,
+ 0.0008200806332752109,
+ 0.0008201819728128612,
+ 0.0008201953023672104
+ ],
+ "gamma_dfa": 0.034856872633099556,
+ "gamma_dfa_per_layer": [
+ 0.3895777463912964,
+ -0.057720690965652466,
+ -0.08937396109104156,
+ -0.10305560380220413
+ ],
+ "acc_eval": 0.1181640625,
+ "loss_eval": 10401.4013671875,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 6618.705078125,
+ 3056073.5,
+ 3608076.25,
+ 3938206.0,
+ 6870646.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014620226575061679,
+ 0.000811390345916152,
+ 0.0008111409260891378,
+ 0.000811099074780941,
+ 0.000811324454843998
+ ],
+ "gamma_dfa": 0.002492595463991165,
+ "gamma_dfa_per_layer": [
+ 0.2934489846229553,
+ -0.07660828530788422,
+ -0.0814061164855957,
+ -0.12546420097351074
+ ],
+ "acc_eval": 0.16796875,
+ "loss_eval": 11906.7060546875,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 6674.03759765625,
+ 3201735.0,
+ 3787927.75,
+ 4133561.75,
+ 7173546.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015491953818127513,
+ 0.0007825249340385199,
+ 0.0007832346600480378,
+ 0.0007830507238395512,
+ 0.0007823925698176026
+ ],
+ "gamma_dfa": 0.054443607572466135,
+ "gamma_dfa_per_layer": [
+ 0.38785266876220703,
+ -0.022086789831519127,
+ -0.062120988965034485,
+ -0.08587045967578888
+ ],
+ "acc_eval": 0.2373046875,
+ "loss_eval": 9465.3525390625,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 6740.52392578125,
+ 3338670.5,
+ 3953341.75,
+ 4315309.5,
+ 7447204.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015645271632820368,
+ 0.0007820724858902395,
+ 0.0007820809260010719,
+ 0.0007819690508767962,
+ 0.0007819557213224471
+ ],
+ "gamma_dfa": 0.027317455038428307,
+ "gamma_dfa_per_layer": [
+ 0.3320838212966919,
+ -0.06272841989994049,
+ -0.06253603100776672,
+ -0.09754955023527145
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 9605.2587890625,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 6826.42578125,
+ 3488233.5,
+ 4125392.0,
+ 4514242.0,
+ 7747655.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018625661032274365,
+ 0.0008403572137467563,
+ 0.0008396300836466253,
+ 0.0008392629097215831,
+ 0.000840048654936254
+ ],
+ "gamma_dfa": 0.018042685464024544,
+ "gamma_dfa_per_layer": [
+ 0.34575170278549194,
+ -0.061284519731998444,
+ -0.08629278838634491,
+ -0.12600365281105042
+ ],
+ "acc_eval": 0.1494140625,
+ "loss_eval": 13453.193359375,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 6878.60009765625,
+ 3647417.5,
+ 4303500.5,
+ 4707215.0,
+ 8039602.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001495232223533094,
+ 0.0008112883078865707,
+ 0.0008119228295981884,
+ 0.0008115706732496619,
+ 0.0008112648501992226
+ ],
+ "gamma_dfa": 0.025581182446330786,
+ "gamma_dfa_per_layer": [
+ 0.301077663898468,
+ -0.015085713937878609,
+ -0.07233025878667831,
+ -0.11133696138858795
+ ],
+ "acc_eval": 0.1513671875,
+ "loss_eval": 10446.5498046875,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 6956.30126953125,
+ 3782040.0,
+ 4474453.5,
+ 4889139.0,
+ 8311892.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001576881273649633,
+ 0.0008043631678447127,
+ 0.0008050674805417657,
+ 0.0008046348229981959,
+ 0.0008046681759878993
+ ],
+ "gamma_dfa": 0.005857756361365318,
+ "gamma_dfa_per_layer": [
+ 0.28321602940559387,
+ -0.03702875226736069,
+ -0.06707675755023956,
+ -0.15567949414253235
+ ],
+ "acc_eval": 0.1484375,
+ "loss_eval": 6591.0849609375,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 7021.955078125,
+ 3911149.5,
+ 4636672.0,
+ 5064123.0,
+ 8571758.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002099651610478759,
+ 0.0008183405152522027,
+ 0.0008207465871237218,
+ 0.0008196401176974177,
+ 0.000819449604023248
+ ],
+ "gamma_dfa": 0.006074780598282814,
+ "gamma_dfa_per_layer": [
+ 0.2577749490737915,
+ -0.05066239833831787,
+ -0.06501314789056778,
+ -0.1178002804517746
+ ],
+ "acc_eval": 0.2109375,
+ "loss_eval": 7962.04443359375,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 7101.7373046875,
+ 4061103.5,
+ 4820611.0,
+ 5257086.0,
+ 8861818.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018932655220851302,
+ 0.0008025900460779667,
+ 0.0008032865589484572,
+ 0.000802954426035285,
+ 0.0008029173477552831
+ ],
+ "gamma_dfa": 0.020984639413654804,
+ "gamma_dfa_per_layer": [
+ 0.3329803943634033,
+ -0.03559138998389244,
+ -0.06842450797557831,
+ -0.14502593874931335
+ ],
+ "acc_eval": 0.1650390625,
+ "loss_eval": 8638.353515625,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 7120.71240234375,
+ 4194965.0,
+ 4982087.0,
+ 5430094.5,
+ 9121286.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015255591133609414,
+ 0.0007772985845804214,
+ 0.0007780406740494072,
+ 0.0007778139552101493,
+ 0.000777201319579035
+ ],
+ "gamma_dfa": 0.0210345396772027,
+ "gamma_dfa_per_layer": [
+ 0.3191820979118347,
+ -0.05588069185614586,
+ -0.0712573379278183,
+ -0.10790590941905975
+ ],
+ "acc_eval": 0.22265625,
+ "loss_eval": 8870.3212890625,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 7166.24462890625,
+ 4326872.0,
+ 5144769.0,
+ 5605003.0,
+ 9390572.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0019027154194191098,
+ 0.000822498113848269,
+ 0.0008225358324125409,
+ 0.0008226112113334239,
+ 0.0008225055644288659
+ ],
+ "gamma_dfa": 0.01758619397878647,
+ "gamma_dfa_per_layer": [
+ 0.29208946228027344,
+ -0.046764522790908813,
+ -0.10779638588428497,
+ -0.06718377768993378
+ ],
+ "acc_eval": 0.154296875,
+ "loss_eval": 18607.9921875,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 7173.86865234375,
+ 4454190.5,
+ 5300661.5,
+ 5764316.0,
+ 9633685.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017527258023619652,
+ 0.0008042250410653651,
+ 0.0008040837710723281,
+ 0.0008041510009206831,
+ 0.0008041784167289734
+ ],
+ "gamma_dfa": 0.04197401413694024,
+ "gamma_dfa_per_layer": [
+ 0.31714165210723877,
+ -0.025468191131949425,
+ -0.05378583073616028,
+ -0.0699915736913681
+ ],
+ "acc_eval": 0.1826171875,
+ "loss_eval": 10768.23046875,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 7200.1064453125,
+ 4569527.5,
+ 5448454.0,
+ 5924151.0,
+ 9865530.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016467028763145208,
+ 0.0007759482250548899,
+ 0.0007759520667605102,
+ 0.0007758319843560457,
+ 0.0007757880375720561
+ ],
+ "gamma_dfa": 0.019114631228148937,
+ "gamma_dfa_per_layer": [
+ 0.3342781364917755,
+ -0.05670151486992836,
+ -0.0891423374414444,
+ -0.111975759267807
+ ],
+ "acc_eval": 0.1865234375,
+ "loss_eval": 9049.12109375,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 7198.30419921875,
+ 4679779.5,
+ 5583911.5,
+ 6073903.5,
+ 10075961.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015529918018728495,
+ 0.0008276477456092834,
+ 0.0008274043793790042,
+ 0.0008273764979094267,
+ 0.00082727539120242
+ ],
+ "gamma_dfa": 0.012379471212625504,
+ "gamma_dfa_per_layer": [
+ 0.33610183000564575,
+ -0.0668979212641716,
+ -0.09369023889303207,
+ -0.12599578499794006
+ ],
+ "acc_eval": 0.1533203125,
+ "loss_eval": 9929.3125,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 7191.220703125,
+ 4787683.5,
+ 5730170.5,
+ 6223255.0,
+ 10287596.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002624395303428173,
+ 0.0008026033756323159,
+ 0.0008024688577279449,
+ 0.0008025110582821071,
+ 0.000802531314548105
+ ],
+ "gamma_dfa": 0.041071049869060516,
+ "gamma_dfa_per_layer": [
+ 0.3911614418029785,
+ -0.03441564738750458,
+ -0.07384517788887024,
+ -0.11861641705036163
+ ],
+ "acc_eval": 0.1669921875,
+ "loss_eval": 9811.68359375,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 7184.458984375,
+ 4895536.0,
+ 5864442.5,
+ 6369317.5,
+ 10509902.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016685851151123643,
+ 0.0007737133419141173,
+ 0.0007737109554000199,
+ 0.0007736092084087431,
+ 0.0007735762046650052
+ ],
+ "gamma_dfa": 0.03856207150965929,
+ "gamma_dfa_per_layer": [
+ 0.3347627520561218,
+ -0.05478603392839432,
+ -0.09395486861467361,
+ -0.03177356347441673
+ ],
+ "acc_eval": 0.15625,
+ "loss_eval": 7798.90283203125,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 7166.86083984375,
+ 4995598.0,
+ 5984263.5,
+ 6498221.0,
+ 10708319.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013723000884056091,
+ 0.0008002148242667317,
+ 0.0007998319924809039,
+ 0.0007997409556992352,
+ 0.0008000954985618591
+ ],
+ "gamma_dfa": 0.024815326556563377,
+ "gamma_dfa_per_layer": [
+ 0.3238403797149658,
+ -0.05496574938297272,
+ -0.0969959944486618,
+ -0.07261732965707779
+ ],
+ "acc_eval": 0.1552734375,
+ "loss_eval": 6333.236328125,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 7156.17236328125,
+ 5093715.5,
+ 6108802.5,
+ 6629623.5,
+ 10896864.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001458030310459435,
+ 0.0007727351039648056,
+ 0.0007727306219749153,
+ 0.0007726310286670923,
+ 0.0007726071053184569
+ ],
+ "gamma_dfa": 0.018785862252116203,
+ "gamma_dfa_per_layer": [
+ 0.31862637400627136,
+ -0.06633786112070084,
+ -0.07025538384914398,
+ -0.10688968002796173
+ ],
+ "acc_eval": 0.2060546875,
+ "loss_eval": 5966.35400390625,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 7127.96875,
+ 5203388.5,
+ 6229672.5,
+ 6756540.5,
+ 11105730.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018821367993950844,
+ 0.000799131637904793,
+ 0.0007999413646757603,
+ 0.0007995158084668219,
+ 0.0007994744228199124
+ ],
+ "gamma_dfa": 0.033654400147497654,
+ "gamma_dfa_per_layer": [
+ 0.3480244278907776,
+ -0.0470522977411747,
+ -0.08066973835229874,
+ -0.08568479120731354
+ ],
+ "acc_eval": 0.21484375,
+ "loss_eval": 8679.373046875,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 7127.84326171875,
+ 5291613.5,
+ 6343081.5,
+ 6873492.5,
+ 11283083.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013305873144418001,
+ 0.0008001387468539178,
+ 0.0007999925292097032,
+ 0.0008000367670319974,
+ 0.0008000454981811345
+ ],
+ "gamma_dfa": 0.026681816205382347,
+ "gamma_dfa_per_layer": [
+ 0.33079925179481506,
+ -0.04635504633188248,
+ -0.060725681483745575,
+ -0.11699125915765762
+ ],
+ "acc_eval": 0.2001953125,
+ "loss_eval": 7321.45654296875,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 7118.43115234375,
+ 5399320.5,
+ 6461637.5,
+ 6995765.0,
+ 11479911.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0027539313305169344,
+ 0.0007441912894137204,
+ 0.000744749209843576,
+ 0.0007447105017490685,
+ 0.0007443142239935696
+ ],
+ "gamma_dfa": 0.0691906102001667,
+ "gamma_dfa_per_layer": [
+ 0.4505346715450287,
+ -0.03461931645870209,
+ -0.07136575877666473,
+ -0.06778715550899506
+ ],
+ "acc_eval": 0.16015625,
+ "loss_eval": 10899.68359375,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 7104.958984375,
+ 5484605.5,
+ 6570873.0,
+ 7105816.5,
+ 11646348.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011745812371373177,
+ 0.000797195709310472,
+ 0.0007963370881043375,
+ 0.0007962601375766098,
+ 0.0007965530967339873
+ ],
+ "gamma_dfa": 0.016523053869605064,
+ "gamma_dfa_per_layer": [
+ 0.3157949447631836,
+ -0.05805324763059616,
+ -0.0915503203868866,
+ -0.10009916126728058
+ ],
+ "acc_eval": 0.185546875,
+ "loss_eval": 4549.11328125,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 7046.66552734375,
+ 5575192.0,
+ 6682143.0,
+ 7216392.5,
+ 11814821.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014973932411521673,
+ 0.0007987518329173326,
+ 0.000798598921392113,
+ 0.0007986334967426956,
+ 0.00079863186692819
+ ],
+ "gamma_dfa": 0.006323261186480522,
+ "gamma_dfa_per_layer": [
+ 0.3186365067958832,
+ -0.07689585536718369,
+ -0.08955803513526917,
+ -0.12688957154750824
+ ],
+ "acc_eval": 0.1845703125,
+ "loss_eval": 5873.4677734375,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 6997.1630859375,
+ 5656117.0,
+ 6779526.0,
+ 7314913.5,
+ 11969090.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014266286743804812,
+ 0.0007692458457313478,
+ 0.0007703236187808216,
+ 0.0007699450361542404,
+ 0.0007692069630138576
+ ],
+ "gamma_dfa": 0.04031236469745636,
+ "gamma_dfa_per_layer": [
+ 0.3853839635848999,
+ -0.054634347558021545,
+ -0.08128909766674042,
+ -0.0882110595703125
+ ],
+ "acc_eval": 0.1953125,
+ "loss_eval": 4200.4296875,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 6970.02099609375,
+ 5731178.0,
+ 6870747.5,
+ 7405309.0,
+ 12120166.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013568063732236624,
+ 0.0007682641153223813,
+ 0.000768258236348629,
+ 0.0007681549177505076,
+ 0.0007681125425733626
+ ],
+ "gamma_dfa": 0.04615131672471762,
+ "gamma_dfa_per_layer": [
+ 0.3717971444129944,
+ -0.05474664270877838,
+ -0.05301285162568092,
+ -0.07943238317966461
+ ],
+ "acc_eval": 0.1943359375,
+ "loss_eval": 3897.47607421875,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 6942.25,
+ 5793439.5,
+ 6946580.5,
+ 7481325.5,
+ 12242140.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011983924778178334,
+ 0.0007509839488193393,
+ 0.0007508245762437582,
+ 0.0007505225948989391,
+ 0.0007505776011385024
+ ],
+ "gamma_dfa": 0.03128352388739586,
+ "gamma_dfa_per_layer": [
+ 0.31842517852783203,
+ -0.03316807746887207,
+ -0.06335921585559845,
+ -0.09676378965377808
+ ],
+ "acc_eval": 0.2685546875,
+ "loss_eval": 3095.559814453125,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 6881.80810546875,
+ 5850806.5,
+ 7011394.5,
+ 7546550.5,
+ 12350002.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011590005597099662,
+ 0.0007501945947296917,
+ 0.0007500603678636253,
+ 0.0007497719489037991,
+ 0.0007498189806938171
+ ],
+ "gamma_dfa": 0.01806825865060091,
+ "gamma_dfa_per_layer": [
+ 0.313739538192749,
+ -0.047393035143613815,
+ -0.07615944743156433,
+ -0.11791402101516724
+ ],
+ "acc_eval": 0.205078125,
+ "loss_eval": 3942.599853515625,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 6837.1533203125,
+ 5897771.5,
+ 7073526.0,
+ 7607611.5,
+ 12444407.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001163899782113731,
+ 0.0007416060543619096,
+ 0.0007419964531436563,
+ 0.0007419841131195426,
+ 0.0007417319575324655
+ ],
+ "gamma_dfa": 0.03044590726494789,
+ "gamma_dfa_per_layer": [
+ 0.30829477310180664,
+ -0.03881052881479263,
+ -0.07340054214000702,
+ -0.07430007308721542
+ ],
+ "acc_eval": 0.2939453125,
+ "loss_eval": 2950.356689453125,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 6806.5322265625,
+ 5963679.5,
+ 7147126.0,
+ 7679290.5,
+ 12557362.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012401024578139186,
+ 0.0007945983088575304,
+ 0.0007953918538987637,
+ 0.0007950742146931589,
+ 0.0007950655417516828
+ ],
+ "gamma_dfa": -0.007623729296028614,
+ "gamma_dfa_per_layer": [
+ 0.24250081181526184,
+ -0.04293825104832649,
+ -0.07043637335300446,
+ -0.15962110459804535
+ ],
+ "acc_eval": 0.14453125,
+ "loss_eval": 3910.8994140625,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 6782.47607421875,
+ 5997089.0,
+ 7185317.5,
+ 7719894.5,
+ 12633342.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012797614326700568,
+ 0.0007944905664771795,
+ 0.0007951240986585617,
+ 0.0007947491831146181,
+ 0.0007947032572701573
+ ],
+ "gamma_dfa": 0.03983990382403135,
+ "gamma_dfa_per_layer": [
+ 0.35600101947784424,
+ -0.023466136306524277,
+ -0.07362768054008484,
+ -0.09954758733510971
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 3587.8212890625,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 6723.70654296875,
+ 6042461.0,
+ 7238613.0,
+ 7771656.5,
+ 12718382.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012927292846143246,
+ 0.000765398726798594,
+ 0.0007653928478248417,
+ 0.0007653140346519649,
+ 0.0007652752683497965
+ ],
+ "gamma_dfa": 0.03482971154153347,
+ "gamma_dfa_per_layer": [
+ 0.34003761410713196,
+ -0.05069781839847565,
+ -0.05738937109708786,
+ -0.09263157844543457
+ ],
+ "acc_eval": 0.23046875,
+ "loss_eval": 2805.9716796875,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 6669.96435546875,
+ 6085424.0,
+ 7288909.5,
+ 7821635.0,
+ 12799732.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011438996298238635,
+ 0.000740286021027714,
+ 0.0007406995864585042,
+ 0.0007406825898215175,
+ 0.0007403898634947836
+ ],
+ "gamma_dfa": 0.03725961223244667,
+ "gamma_dfa_per_layer": [
+ 0.32540398836135864,
+ -0.04895278066396713,
+ -0.07243393361568451,
+ -0.05497882515192032
+ ],
+ "acc_eval": 0.2373046875,
+ "loss_eval": 2089.305908203125,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 6611.064453125,
+ 6121666.0,
+ 7328789.5,
+ 7859580.5,
+ 12864450.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010610584868118167,
+ 0.0007183317793533206,
+ 0.0007201047264970839,
+ 0.0007199530373327434,
+ 0.0007199217798188329
+ ],
+ "gamma_dfa": 0.03143393341451883,
+ "gamma_dfa_per_layer": [
+ 0.2940787076950073,
+ -0.035069357603788376,
+ -0.0604243278503418,
+ -0.07284928858280182
+ ],
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1459.638916015625,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 6564.220703125,
+ 6147971.0,
+ 7358806.5,
+ 7888597.5,
+ 12918884.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001103258109651506,
+ 0.0007199789397418499,
+ 0.0007205012370832264,
+ 0.0007201395928859711,
+ 0.000719686911907047
+ ],
+ "gamma_dfa": 0.02568601444363594,
+ "gamma_dfa_per_layer": [
+ 0.3047623038291931,
+ -0.05378233641386032,
+ -0.07432089745998383,
+ -0.0739150121808052
+ ],
+ "acc_eval": 0.2607421875,
+ "loss_eval": 1398.54931640625,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 6523.052734375,
+ 6163991.5,
+ 7377848.0,
+ 7906464.0,
+ 12959929.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010483200894668698,
+ 0.0007394760614261031,
+ 0.0007398684392683208,
+ 0.0007398549350909889,
+ 0.0007395940483547747
+ ],
+ "gamma_dfa": 0.028113607317209244,
+ "gamma_dfa_per_layer": [
+ 0.2919086515903473,
+ -0.04769399017095566,
+ -0.06982402503490448,
+ -0.06193620711565018
+ ],
+ "acc_eval": 0.294921875,
+ "loss_eval": 1247.0958251953125,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 6480.38134765625,
+ 6177022.5,
+ 7396143.5,
+ 7924145.0,
+ 12992374.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011187344789505005,
+ 0.0007568535511381924,
+ 0.0007568564033135772,
+ 0.0007567762513644993,
+ 0.0007568445871584117
+ ],
+ "gamma_dfa": 0.029856184497475624,
+ "gamma_dfa_per_layer": [
+ 0.32282522320747375,
+ -0.05086465924978256,
+ -0.06785817444324493,
+ -0.08467765152454376
+ ],
+ "acc_eval": 0.267578125,
+ "loss_eval": 1623.752197265625,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 6430.5322265625,
+ 6198352.0,
+ 7419959.0,
+ 7946585.0,
+ 13023161.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010678176768124104,
+ 0.0007456489838659763,
+ 0.0007455460145138204,
+ 0.0007452794816344976,
+ 0.000745359982829541
+ ],
+ "gamma_dfa": 0.019207272678613663,
+ "gamma_dfa_per_layer": [
+ 0.28421786427497864,
+ -0.04965135455131531,
+ -0.07151313126087189,
+ -0.08622428774833679
+ ],
+ "acc_eval": 0.291015625,
+ "loss_eval": 1205.84716796875,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 6396.35009765625,
+ 6216262.0,
+ 7436144.0,
+ 7961794.0,
+ 13045224.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010295198298990726,
+ 0.0007388790836557746,
+ 0.0007392680854536593,
+ 0.000739254173822701,
+ 0.000738998525775969
+ ],
+ "gamma_dfa": 0.02955447882413864,
+ "gamma_dfa_per_layer": [
+ 0.2954120337963104,
+ -0.046598292887210846,
+ -0.069032222032547,
+ -0.061563603579998016
+ ],
+ "acc_eval": 0.298828125,
+ "loss_eval": 1123.675048828125,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 6366.1259765625,
+ 6230148.5,
+ 7451647.0,
+ 7975150.0,
+ 13064555.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010110137518495321,
+ 0.0007565211853943765,
+ 0.0007565242704004049,
+ 0.0007563806138932705,
+ 0.0007564250845462084
+ ],
+ "gamma_dfa": 0.011881772428750992,
+ "gamma_dfa_per_layer": [
+ 0.2693521976470947,
+ -0.04482053220272064,
+ -0.07126723229885101,
+ -0.1057373434305191
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 1118.5343017578125,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 6341.41796875,
+ 6233793.0,
+ 7457683.5,
+ 7981064.5,
+ 13074395.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010112811578437686,
+ 0.0007385196513496339,
+ 0.0007389356032945216,
+ 0.000738917791750282,
+ 0.0007386352517642081
+ ],
+ "gamma_dfa": 0.0292903920635581,
+ "gamma_dfa_per_layer": [
+ 0.28946253657341003,
+ -0.033900823444128036,
+ -0.06436440348625183,
+ -0.07403574138879776
+ ],
+ "acc_eval": 0.306640625,
+ "loss_eval": 1028.103515625,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 6319.90185546875,
+ 6241203.5,
+ 7463285.5,
+ 7986068.5,
+ 13084655.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010045261587947607,
+ 0.0007187838782556355,
+ 0.0007187584415078163,
+ 0.0007185733411461115,
+ 0.0007185345166362822
+ ],
+ "gamma_dfa": 0.02470484748482704,
+ "gamma_dfa_per_layer": [
+ 0.2734910249710083,
+ -0.0429413765668869,
+ -0.06623440980911255,
+ -0.06549584865570068
+ ],
+ "acc_eval": 0.3271484375,
+ "loss_eval": 879.8018798828125,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 6299.453125,
+ 6240490.0,
+ 7464953.0,
+ 7988364.0,
+ 13086769.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010041827335953712,
+ 0.0007186768343672156,
+ 0.0007186515722423792,
+ 0.0007184677524492145,
+ 0.0007184296264313161
+ ],
+ "gamma_dfa": 0.022233721800148487,
+ "gamma_dfa_per_layer": [
+ 0.2633175849914551,
+ -0.04053181782364845,
+ -0.06492872536182404,
+ -0.06892215460538864
+ ],
+ "acc_eval": 0.322265625,
+ "loss_eval": 871.9059448242188,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 6280.70068359375,
+ 6248322.5,
+ 7472246.5,
+ 7994814.0,
+ 13094255.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000998231815174222,
+ 0.0007185792201198637,
+ 0.0007185565191321075,
+ 0.0007183970883488655,
+ 0.0007183645502664149
+ ],
+ "gamma_dfa": 0.02329079993069172,
+ "gamma_dfa_per_layer": [
+ 0.27325427532196045,
+ -0.04209248721599579,
+ -0.0645713210105896,
+ -0.07342726737260818
+ ],
+ "acc_eval": 0.326171875,
+ "loss_eval": 876.770263671875,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 6259.79541015625,
+ 6251884.0,
+ 7473855.0,
+ 7995730.5,
+ 13095582.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001000022399239242,
+ 0.0007185632712207735,
+ 0.0007185383583419025,
+ 0.0007183536072261631,
+ 0.0007183143752627075
+ ],
+ "gamma_dfa": 0.01565107237547636,
+ "gamma_dfa_per_layer": [
+ 0.26019614934921265,
+ -0.042762644588947296,
+ -0.06100854650139809,
+ -0.09382066875696182
+ ],
+ "acc_eval": 0.31640625,
+ "loss_eval": 847.3887939453125,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 6250.6630859375,
+ 6252472.0,
+ 7474356.5,
+ 7996154.0,
+ 13096382.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009951539104804397,
+ 0.000718452560249716,
+ 0.0007184353889897466,
+ 0.0007182956906035542,
+ 0.0007182672270573676
+ ],
+ "gamma_dfa": 0.01607441157102585,
+ "gamma_dfa_per_layer": [
+ 0.2622864246368408,
+ -0.04606177657842636,
+ -0.06511188298463821,
+ -0.08681511878967285
+ ],
+ "acc_eval": 0.3125,
+ "loss_eval": 820.6640625,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 6245.84228515625,
+ 6252136.5,
+ 7473891.5,
+ 7995642.0,
+ 13095543.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009887836640700698,
+ 0.0007184472633525729,
+ 0.0007184235146269202,
+ 0.0007182589615695179,
+ 0.0007182253757491708
+ ],
+ "gamma_dfa": 0.01632563304156065,
+ "gamma_dfa_per_layer": [
+ 0.2587689757347107,
+ -0.041752640157938004,
+ -0.06282168626785278,
+ -0.08889211714267731
+ ],
+ "acc_eval": 0.3271484375,
+ "loss_eval": 794.9835815429688,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 6243.275390625,
+ 6252353.5,
+ 7474147.5,
+ 7995911.0,
+ 13095907.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010000880574807525,
+ 0.0007184495334513485,
+ 0.0007184281130321324,
+ 0.0007182535482570529,
+ 0.0007182166446000338
+ ],
+ "gamma_dfa": 0.01966456975787878,
+ "gamma_dfa_per_layer": [
+ 0.26670968532562256,
+ -0.04189712926745415,
+ -0.06575733423233032,
+ -0.08039694279432297
+ ],
+ "acc_eval": 0.3173828125,
+ "loss_eval": 809.9351196289062,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 6242.01708984375,
+ 6252447.5,
+ 7474218.0,
+ 7995986.5,
+ 13096086.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009963318007066846,
+ 0.000718410883564502,
+ 0.000718392024282366,
+ 0.0007182427798397839,
+ 0.0007182121044024825
+ ],
+ "gamma_dfa": 0.017472295090556145,
+ "gamma_dfa_per_layer": [
+ 0.26097655296325684,
+ -0.042458876967430115,
+ -0.06487732380628586,
+ -0.08375117182731628
+ ],
+ "acc_eval": 0.326171875,
+ "loss_eval": 790.8746337890625,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 6241.6884765625,
+ 6252462.0,
+ 7474227.5,
+ 7995996.0,
+ 13096118.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009859646670520306,
+ 0.0007156162173487246,
+ 0.0007178352097980678,
+ 0.0007174411439336836,
+ 0.0007168283336795866
+ ],
+ "gamma_dfa": 0.01725842524319887,
+ "gamma_dfa_per_layer": [
+ 0.25597745180130005,
+ -0.041728582233190536,
+ -0.06328003108501434,
+ -0.08193513751029968
+ ],
+ "acc_eval": 0.3359375,
+ "loss_eval": 790.8336181640625,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file