From aa73718eb6427d7da3b9cb416275802d90c4b2ed Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Sun, 14 Jun 2026 04:06:32 -0500 Subject: Add new experiment scripts, figures, and paper assets; untrack pyc/build artifacts Co-Authored-By: Claude Opus 4.8 (1M context) --- results/snapshot_no_outln_v1/run_s123.log | 51 + results/snapshot_no_outln_v1/run_s42.log | 51 + results/snapshot_no_outln_v1/run_s456.log | 51 + .../snapshot_fa_canonical_noln_s42.json | 1824 ++++++++ .../snapshot_no_outln_v1/snapshot_fa_noln_s42.json | 1824 ++++++++ .../snapshot_no_outln_v1/snapshot_noLN_s123.json | 4766 ++++++++++++++++++++ .../snapshot_no_outln_v1/snapshot_noLN_s42.json | 4766 ++++++++++++++++++++ .../snapshot_no_outln_v1/snapshot_noLN_s456.json | 4766 ++++++++++++++++++++ 8 files changed, 18099 insertions(+) create mode 100644 results/snapshot_no_outln_v1/run_s123.log create mode 100644 results/snapshot_no_outln_v1/run_s42.log create mode 100644 results/snapshot_no_outln_v1/run_s456.log create mode 100644 results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s123.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s456.json (limited to 'results/snapshot_no_outln_v1') diff --git a/results/snapshot_no_outln_v1/run_s123.log b/results/snapshot_no_outln_v1/run_s123.log new file mode 100644 index 0000000..a946d6d --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s123.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=123 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016 + [BP-noLN] Ep 1: ||h_L||=3.456e+01 ||g||=1.382e-04 acc=0.4355 + [BP-noLN] Ep 5: ||h_L||=5.193e+01 ||g||=9.721e-05 acc=0.5049 + [BP-noLN] Ep 10: ||h_L||=6.115e+01 ||g||=8.778e-05 acc=0.5430 + [BP-noLN] Ep 15: ||h_L||=6.668e+01 ||g||=8.387e-05 acc=0.5586 + [BP-noLN] Ep 20: ||h_L||=6.880e+01 ||g||=8.997e-05 acc=0.5176 + [BP-noLN] Ep 25: ||h_L||=7.092e+01 ||g||=8.184e-05 acc=0.5850 + [BP-noLN] Ep 30: ||h_L||=7.285e+01 ||g||=7.960e-05 acc=0.5693 + [BP-noLN] Ep 35: ||h_L||=7.522e+01 ||g||=8.247e-05 acc=0.5869 + [BP-noLN] Ep 40: ||h_L||=7.551e+01 ||g||=8.186e-05 acc=0.6201 + [BP-noLN] Ep 45: ||h_L||=7.421e+01 ||g||=8.565e-05 acc=0.5918 + [BP-noLN] Ep 50: ||h_L||=7.473e+01 ||g||=9.094e-05 acc=0.5840 + [BP-noLN] Ep 55: ||h_L||=7.556e+01 ||g||=8.896e-05 acc=0.6143 + [BP-noLN] Ep 60: ||h_L||=7.545e+01 ||g||=9.015e-05 acc=0.6396 + [BP-noLN] Ep 65: ||h_L||=7.509e+01 ||g||=9.009e-05 acc=0.6455 + [BP-noLN] Ep 70: ||h_L||=7.466e+01 ||g||=9.170e-05 acc=0.6230 + [BP-noLN] Ep 75: ||h_L||=7.410e+01 ||g||=1.030e-04 acc=0.6455 + [BP-noLN] Ep 80: ||h_L||=7.313e+01 ||g||=1.043e-04 acc=0.6309 + [BP-noLN] Ep 85: ||h_L||=7.275e+01 ||g||=1.035e-04 acc=0.6396 + [BP-noLN] Ep 90: ||h_L||=7.262e+01 ||g||=1.079e-04 acc=0.6445 + [BP-noLN] Ep 95: ||h_L||=7.256e+01 ||g||=1.087e-04 acc=0.6377 + [BP-noLN] Ep 100: ||h_L||=7.248e+01 ||g||=1.082e-04 acc=0.6396 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016 + [DFA-noLN] Ep 1: ||h_L||=1.231e+03 ||g||=6.461e-04 acc=0.2129 γ=0.0130 + [DFA-noLN] Ep 5: ||h_L||=1.290e+04 ||g||=7.423e-04 acc=0.2080 γ=-0.0053 + [DFA-noLN] Ep 10: ||h_L||=6.970e+04 ||g||=7.399e-04 acc=0.2031 γ=-0.0038 + [DFA-noLN] Ep 15: ||h_L||=2.144e+05 ||g||=7.383e-04 acc=0.1807 γ=0.0158 + [DFA-noLN] Ep 20: ||h_L||=5.289e+05 ||g||=7.379e-04 acc=0.2295 γ=0.0205 + [DFA-noLN] Ep 25: ||h_L||=1.047e+06 ||g||=7.582e-04 acc=0.1729 γ=-0.0056 + [DFA-noLN] Ep 30: ||h_L||=1.809e+06 ||g||=7.676e-04 acc=0.1934 γ=0.0171 + [DFA-noLN] Ep 35: ||h_L||=2.741e+06 ||g||=7.757e-04 acc=0.1504 γ=0.0181 + [DFA-noLN] Ep 40: ||h_L||=3.868e+06 ||g||=7.547e-04 acc=0.1377 γ=0.0036 + [DFA-noLN] Ep 45: ||h_L||=5.087e+06 ||g||=7.677e-04 acc=0.2246 γ=0.0148 + [DFA-noLN] Ep 50: ||h_L||=6.378e+06 ||g||=7.632e-04 acc=0.2002 γ=-0.0010 + [DFA-noLN] Ep 55: ||h_L||=7.652e+06 ||g||=7.547e-04 acc=0.0908 γ=0.0198 + [DFA-noLN] Ep 60: ||h_L||=8.786e+06 ||g||=7.196e-04 acc=0.1670 γ=0.0255 + [DFA-noLN] Ep 65: ||h_L||=9.795e+06 ||g||=7.598e-04 acc=0.1699 γ=0.0191 + [DFA-noLN] Ep 70: ||h_L||=1.063e+07 ||g||=7.313e-04 acc=0.2422 γ=0.0235 + [DFA-noLN] Ep 75: ||h_L||=1.127e+07 ||g||=7.316e-04 acc=0.2490 γ=0.0445 + [DFA-noLN] Ep 80: ||h_L||=1.173e+07 ||g||=7.425e-04 acc=0.1904 γ=0.0283 + [DFA-noLN] Ep 85: ||h_L||=1.203e+07 ||g||=7.233e-04 acc=0.2500 γ=0.0402 + [DFA-noLN] Ep 90: ||h_L||=1.216e+07 ||g||=7.064e-04 acc=0.3096 γ=0.0335 + [DFA-noLN] Ep 95: ||h_L||=1.218e+07 ||g||=7.087e-04 acc=0.2920 γ=0.0295 + [DFA-noLN] Ep 100: ||h_L||=1.218e+07 ||g||=7.086e-04 acc=0.3135 γ=0.0273 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s123.json diff --git a/results/snapshot_no_outln_v1/run_s42.log b/results/snapshot_no_outln_v1/run_s42.log new file mode 100644 index 0000000..81d2970 --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s42.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=42 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123 + [BP-noLN] Ep 1: ||h_L||=3.310e+01 ||g||=1.421e-04 acc=0.4229 + [BP-noLN] Ep 5: ||h_L||=5.238e+01 ||g||=9.984e-05 acc=0.5010 + [BP-noLN] Ep 10: ||h_L||=6.111e+01 ||g||=8.972e-05 acc=0.5518 + [BP-noLN] Ep 15: ||h_L||=6.640e+01 ||g||=8.892e-05 acc=0.5195 + [BP-noLN] Ep 20: ||h_L||=6.977e+01 ||g||=8.730e-05 acc=0.5488 + [BP-noLN] Ep 25: ||h_L||=7.080e+01 ||g||=8.598e-05 acc=0.5547 + [BP-noLN] Ep 30: ||h_L||=7.441e+01 ||g||=8.621e-05 acc=0.5723 + [BP-noLN] Ep 35: ||h_L||=7.537e+01 ||g||=7.991e-05 acc=0.6025 + [BP-noLN] Ep 40: ||h_L||=7.552e+01 ||g||=8.747e-05 acc=0.5859 + [BP-noLN] Ep 45: ||h_L||=7.571e+01 ||g||=8.227e-05 acc=0.5918 + [BP-noLN] Ep 50: ||h_L||=7.514e+01 ||g||=9.716e-05 acc=0.5811 + [BP-noLN] Ep 55: ||h_L||=7.693e+01 ||g||=9.600e-05 acc=0.6006 + [BP-noLN] Ep 60: ||h_L||=7.581e+01 ||g||=9.903e-05 acc=0.6113 + [BP-noLN] Ep 65: ||h_L||=7.549e+01 ||g||=1.009e-04 acc=0.6221 + [BP-noLN] Ep 70: ||h_L||=7.530e+01 ||g||=1.088e-04 acc=0.6074 + [BP-noLN] Ep 75: ||h_L||=7.454e+01 ||g||=1.082e-04 acc=0.6143 + [BP-noLN] Ep 80: ||h_L||=7.426e+01 ||g||=1.162e-04 acc=0.6123 + [BP-noLN] Ep 85: ||h_L||=7.353e+01 ||g||=1.161e-04 acc=0.6084 + [BP-noLN] Ep 90: ||h_L||=7.339e+01 ||g||=1.168e-04 acc=0.6123 + [BP-noLN] Ep 95: ||h_L||=7.308e+01 ||g||=1.164e-04 acc=0.6143 + [BP-noLN] Ep 100: ||h_L||=7.297e+01 ||g||=1.158e-04 acc=0.6162 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123 + [DFA-noLN] Ep 1: ||h_L||=1.560e+03 ||g||=6.859e-04 acc=0.1494 γ=0.0084 + [DFA-noLN] Ep 5: ||h_L||=1.050e+04 ||g||=7.522e-04 acc=0.1748 γ=-0.0063 + [DFA-noLN] Ep 10: ||h_L||=2.200e+04 ||g||=7.641e-04 acc=0.1445 γ=-0.0167 + [DFA-noLN] Ep 15: ||h_L||=1.004e+05 ||g||=7.608e-04 acc=0.1738 γ=-0.0118 + [DFA-noLN] Ep 20: ||h_L||=3.150e+05 ||g||=7.782e-04 acc=0.2070 γ=0.0027 + [DFA-noLN] Ep 25: ||h_L||=6.817e+05 ||g||=7.884e-04 acc=0.1572 γ=0.0340 + [DFA-noLN] Ep 30: ||h_L||=1.298e+06 ||g||=7.771e-04 acc=0.1299 γ=0.0393 + [DFA-noLN] Ep 35: ||h_L||=2.143e+06 ||g||=7.980e-04 acc=0.0996 γ=0.0196 + [DFA-noLN] Ep 40: ||h_L||=3.180e+06 ||g||=7.691e-04 acc=0.1016 γ=-0.0085 + [DFA-noLN] Ep 45: ||h_L||=4.347e+06 ||g||=7.934e-04 acc=0.1582 γ=0.0262 + [DFA-noLN] Ep 50: ||h_L||=5.552e+06 ||g||=7.869e-04 acc=0.2197 γ=0.0165 + [DFA-noLN] Ep 55: ||h_L||=6.742e+06 ||g||=7.851e-04 acc=0.1885 γ=0.0046 + [DFA-noLN] Ep 60: ||h_L||=7.801e+06 ||g||=7.600e-04 acc=0.1572 γ=0.0045 + [DFA-noLN] Ep 65: ||h_L||=8.775e+06 ||g||=7.795e-04 acc=0.2031 γ=0.0088 + [DFA-noLN] Ep 70: ||h_L||=9.556e+06 ||g||=7.968e-04 acc=0.1836 γ=0.0093 + [DFA-noLN] Ep 75: ||h_L||=1.016e+07 ||g||=7.656e-04 acc=0.2490 γ=0.0168 + [DFA-noLN] Ep 80: ||h_L||=1.064e+07 ||g||=7.633e-04 acc=0.2764 γ=0.0198 + [DFA-noLN] Ep 85: ||h_L||=1.095e+07 ||g||=7.466e-04 acc=0.2773 γ=0.0195 + [DFA-noLN] Ep 90: ||h_L||=1.107e+07 ||g||=7.453e-04 acc=0.2695 γ=0.0131 + [DFA-noLN] Ep 95: ||h_L||=1.113e+07 ||g||=7.446e-04 acc=0.3105 γ=0.0146 + [DFA-noLN] Ep 100: ||h_L||=1.113e+07 ||g||=7.392e-04 acc=0.3320 γ=0.0164 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s42.json diff --git a/results/snapshot_no_outln_v1/run_s456.log b/results/snapshot_no_outln_v1/run_s456.log new file mode 100644 index 0000000..a0a3bd0 --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s456.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=456 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [BP-noLN] Ep 1: ||h_L||=3.410e+01 ||g||=1.500e-04 acc=0.4365 + [BP-noLN] Ep 5: ||h_L||=5.250e+01 ||g||=1.052e-04 acc=0.4961 + [BP-noLN] Ep 10: ||h_L||=6.330e+01 ||g||=8.751e-05 acc=0.5596 + [BP-noLN] Ep 15: ||h_L||=6.619e+01 ||g||=8.857e-05 acc=0.5215 + [BP-noLN] Ep 20: ||h_L||=7.009e+01 ||g||=8.610e-05 acc=0.5420 + [BP-noLN] Ep 25: ||h_L||=7.285e+01 ||g||=8.470e-05 acc=0.5723 + [BP-noLN] Ep 30: ||h_L||=7.493e+01 ||g||=8.152e-05 acc=0.5938 + [BP-noLN] Ep 35: ||h_L||=7.640e+01 ||g||=7.781e-05 acc=0.6074 + [BP-noLN] Ep 40: ||h_L||=7.799e+01 ||g||=8.443e-05 acc=0.5938 + [BP-noLN] Ep 45: ||h_L||=7.734e+01 ||g||=7.914e-05 acc=0.6143 + [BP-noLN] Ep 50: ||h_L||=7.667e+01 ||g||=8.950e-05 acc=0.5996 + [BP-noLN] Ep 55: ||h_L||=7.591e+01 ||g||=9.021e-05 acc=0.6201 + [BP-noLN] Ep 60: ||h_L||=7.667e+01 ||g||=8.730e-05 acc=0.6338 + [BP-noLN] Ep 65: ||h_L||=7.629e+01 ||g||=9.670e-05 acc=0.6230 + [BP-noLN] Ep 70: ||h_L||=7.612e+01 ||g||=9.637e-05 acc=0.6260 + [BP-noLN] Ep 75: ||h_L||=7.544e+01 ||g||=9.639e-05 acc=0.6338 + [BP-noLN] Ep 80: ||h_L||=7.434e+01 ||g||=9.999e-05 acc=0.6455 + [BP-noLN] Ep 85: ||h_L||=7.429e+01 ||g||=1.013e-04 acc=0.6348 + [BP-noLN] Ep 90: ||h_L||=7.381e+01 ||g||=1.076e-04 acc=0.6348 + [BP-noLN] Ep 95: ||h_L||=7.380e+01 ||g||=1.084e-04 acc=0.6436 + [BP-noLN] Ep 100: ||h_L||=7.373e+01 ||g||=1.088e-04 acc=0.6465 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [DFA-noLN] Ep 1: ||h_L||=1.507e+03 ||g||=6.424e-04 acc=0.2246 γ=0.0136 + [DFA-noLN] Ep 5: ||h_L||=1.140e+04 ||g||=7.475e-04 acc=0.2314 γ=-0.0000 + [DFA-noLN] Ep 10: ||h_L||=2.845e+04 ||g||=7.444e-04 acc=0.1895 γ=-0.0067 + [DFA-noLN] Ep 15: ||h_L||=8.676e+04 ||g||=7.381e-04 acc=0.2549 γ=0.0039 + [DFA-noLN] Ep 20: ||h_L||=2.707e+05 ||g||=7.761e-04 acc=0.1670 γ=0.0171 + [DFA-noLN] Ep 25: ||h_L||=6.628e+05 ||g||=7.894e-04 acc=0.1992 γ=0.0390 + [DFA-noLN] Ep 30: ||h_L||=1.245e+06 ||g||=7.944e-04 acc=0.1963 γ=0.0162 + [DFA-noLN] Ep 35: ||h_L||=2.131e+06 ||g||=8.014e-04 acc=0.1904 γ=0.0128 + [DFA-noLN] Ep 40: ||h_L||=3.242e+06 ||g||=7.965e-04 acc=0.1855 γ=0.0227 + [DFA-noLN] Ep 45: ||h_L||=4.568e+06 ||g||=8.172e-04 acc=0.1807 γ=0.0340 + [DFA-noLN] Ep 50: ||h_L||=6.031e+06 ||g||=8.070e-04 acc=0.1133 γ=0.0064 + [DFA-noLN] Ep 55: ||h_L||=7.447e+06 ||g||=7.821e-04 acc=0.1924 γ=0.0273 + [DFA-noLN] Ep 60: ||h_L||=8.862e+06 ||g||=8.033e-04 acc=0.1650 γ=0.0210 + [DFA-noLN] Ep 65: ||h_L||=1.008e+07 ||g||=8.274e-04 acc=0.1533 γ=0.0124 + [DFA-noLN] Ep 70: ||h_L||=1.111e+07 ||g||=7.999e-04 acc=0.2148 γ=0.0337 + [DFA-noLN] Ep 75: ||h_L||=1.197e+07 ||g||=7.703e-04 acc=0.1953 γ=0.0403 + [DFA-noLN] Ep 80: ||h_L||=1.256e+07 ||g||=7.954e-04 acc=0.1445 γ=-0.0076 + [DFA-noLN] Ep 85: ||h_L||=1.292e+07 ||g||=7.205e-04 acc=0.2607 γ=0.0257 + [DFA-noLN] Ep 90: ||h_L||=1.306e+07 ||g||=7.565e-04 acc=0.2402 γ=0.0119 + [DFA-noLN] Ep 95: ||h_L||=1.310e+07 ||g||=7.185e-04 acc=0.3164 γ=0.0157 + [DFA-noLN] Ep 100: ||h_L||=1.310e+07 ||g||=7.178e-04 acc=0.3359 γ=0.0173 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s456.json diff --git a/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json new file mode 100644 index 0000000..7e5cb37 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json @@ -0,0 +1,1824 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "acc_eval": 0.1123046875, + "epoch": 0 + }, + { + "hidden_norms": [ + 736.34716796875, + 1637.1044921875, + 2033.1922607421875, + 2161.380859375, + 2126.18505859375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0006836718530394137, + 0.0006813183426856995, + 0.0006814387743361294, + 0.0006832550279796124, + 0.0006794488872401416 + ], + "acc_eval": 0.1953125, + "epoch": 1 + }, + { + "hidden_norms": [ + 1106.3868408203125, + 2963.552001953125, + 4087.33837890625, + 4421.4921875, + 4265.1083984375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007476353785023093, + 0.0007440777844749391, + 0.0007443943759426475, + 0.0007477496401406825, + 0.0007366884965449572 + ], + "acc_eval": 0.1044921875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1371.9425048828125, + 4214.05078125, + 6238.47265625, + 6697.2333984375, + 6399.22314453125 + ], + "bp_grad_norms_per_sample_med": [ + 0.000730870058760047, + 0.00072717375587672, + 0.0007270713686011732, + 0.0007290731882676482, + 0.0007233614451251924 + ], + "acc_eval": 0.1943359375, + "epoch": 3 + }, + { + "hidden_norms": [ + 1574.7962646484375, + 4805.0556640625, + 7044.64599609375, + 7593.78955078125, + 7215.32763671875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007098641362972558, + 0.0007034889422357082, + 0.0007031699060462415, + 0.0007120345253497362, + 0.000694308546371758 + ], + "acc_eval": 0.2451171875, + "epoch": 4 + }, + { + "hidden_norms": [ + 1726.088623046875, + 6184.34521484375, + 9521.791015625, + 10387.7236328125, + 9721.431640625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007400272879749537, + 0.0007343650795519352, + 0.0007334973197430372, + 0.0007343514007516205, + 0.0007319966680370271 + ], + "acc_eval": 0.212890625, + "epoch": 5 + }, + { + "hidden_norms": [ + 1902.689697265625, + 7697.52197265625, + 12328.0595703125, + 13597.1787109375, + 12504.158203125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007165716378949583, + 0.0007126733544282615, + 0.0007124089752323925, + 0.0007126083364710212, + 0.0007107863784767687 + ], + "acc_eval": 0.15625, + "epoch": 6 + }, + { + "hidden_norms": [ + 2069.750244140625, + 10379.2958984375, + 16444.7421875, + 18267.94921875, + 16595.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007099996437318623, + 0.0007088935235515237, + 0.0007090346189215779, + 0.000710709486156702, + 0.0007023006328381598 + ], + "acc_eval": 0.154296875, + "epoch": 7 + }, + { + "hidden_norms": [ + 2226.40673828125, + 12703.916015625, + 20184.30859375, + 22453.73828125, + 20183.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.00072157580871135, + 0.0007210742915049195, + 0.0007212630589492619, + 0.0007244180305860937, + 0.0007163899717852473 + ], + "acc_eval": 0.2236328125, + "epoch": 8 + }, + { + "hidden_norms": [ + 2289.455078125, + 15611.2138671875, + 24559.412109375, + 27336.787109375, + 24451.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007243232685141265, + 0.0007221215637400746, + 0.0007219284889288247, + 0.0007259267731569707, + 0.0007173537742346525 + ], + "acc_eval": 0.169921875, + "epoch": 9 + }, + { + "hidden_norms": [ + 2396.09814453125, + 19678.587890625, + 30417.08203125, + 34140.70703125, + 30261.052734375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007124242256395519, + 0.0007074667955748737, + 0.0007074963650666177, + 0.0007131542661227286, + 0.0007022957433946431 + ], + "acc_eval": 0.1904296875, + "epoch": 10 + }, + { + "hidden_norms": [ + 2467.864013671875, + 24019.642578125, + 41156.921875, + 46706.38671875, + 41256.71484375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007333463290706277, + 0.0007277126424014568, + 0.0007268521003425121, + 0.000731462670955807, + 0.0007225224399007857 + ], + "acc_eval": 0.169921875, + "epoch": 11 + }, + { + "hidden_norms": [ + 2518.561767578125, + 28957.451171875, + 55737.69140625, + 64112.609375, + 56246.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007202349370345473, + 0.0007073598098941147, + 0.0007049349951557815, + 0.0007059182389639318, + 0.0007044971571303904 + ], + "acc_eval": 0.1513671875, + "epoch": 12 + }, + { + "hidden_norms": [ + 2614.843994140625, + 34279.15625, + 74158.109375, + 86073.96875, + 75187.59375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007299556746147573, + 0.0007100331713445485, + 0.0007101728115230799, + 0.0007166104041971266, + 0.0007030466804280877 + ], + "acc_eval": 0.24609375, + "epoch": 13 + }, + { + "hidden_norms": [ + 2697.871337890625, + 41263.5390625, + 96222.8984375, + 112901.9765625, + 98551.3046875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007336065755225718, + 0.0007151410100050271, + 0.0007150733144953847, + 0.0007166287978179753, + 0.0007151660392992198 + ], + "acc_eval": 0.134765625, + "epoch": 14 + }, + { + "hidden_norms": [ + 2815.983154296875, + 53842.3828125, + 126185.5625, + 149526.796875, + 130144.4765625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007365003693848848, + 0.0007177364313974977, + 0.0007168670417740941, + 0.000717108603566885, + 0.0007130720769055188 + ], + "acc_eval": 0.150390625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2928.448974609375, + 65162.98046875, + 153909.296875, + 184005.875, + 159483.03125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007613440393470228, + 0.000720723532140255, + 0.000720796815585345, + 0.0007208258030004799, + 0.0007211563643068075 + ], + "acc_eval": 0.166015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 2970.975341796875, + 76176.9609375, + 179093.75, + 216167.875, + 186723.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007602480472996831, + 0.0007191941258497536, + 0.0007163456757552922, + 0.0007164765265770257, + 0.0007142137037590146 + ], + "acc_eval": 0.1796875, + "epoch": 17 + }, + { + "hidden_norms": [ + 3078.336181640625, + 91839.40625, + 215980.015625, + 263515.15625, + 227071.515625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007584959384985268, + 0.0007150565506890416, + 0.0007151922909542918, + 0.000715585716534406, + 0.0007152389152906835 + ], + "acc_eval": 0.1767578125, + "epoch": 18 + }, + { + "hidden_norms": [ + 3202.803466796875, + 104358.6875, + 248325.390625, + 305395.84375, + 262365.46875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007867171661928296, + 0.0007155268103815615, + 0.0007155817584134638, + 0.0007157608633860946, + 0.0007155768107622862 + ], + "acc_eval": 0.138671875, + "epoch": 19 + }, + { + "hidden_norms": [ + 3282.27490234375, + 117747.359375, + 284217.3125, + 351018.15625, + 300903.65625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007691550417803228, + 0.0007147297146730125, + 0.0007147309370338917, + 0.0007150261080823839, + 0.0007147534633986652 + ], + "acc_eval": 0.1923828125, + "epoch": 20 + }, + { + "hidden_norms": [ + 3394.945556640625, + 129443.9765625, + 317078.65625, + 393509.375, + 336658.40625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008442914695478976, + 0.0007179519161581993, + 0.0007190873729996383, + 0.000723545381333679, + 0.0007175213540904224 + ], + "acc_eval": 0.1376953125, + "epoch": 21 + }, + { + "hidden_norms": [ + 3484.2763671875, + 140426.171875, + 355086.84375, + 443148.09375, + 378501.53125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007702927687205374, + 0.0006826652679592371, + 0.0006794629734940827, + 0.0006826536264270544, + 0.0006794703076593578 + ], + "acc_eval": 0.19140625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3529.414306640625, + 153612.265625, + 393522.9375, + 493183.03125, + 421284.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008731107809580863, + 0.0007047304534353316, + 0.0007038630428723991, + 0.000708943116478622, + 0.000701444165315479 + ], + "acc_eval": 0.16796875, + "epoch": 23 + }, + { + "hidden_norms": [ + 3604.90283203125, + 165405.75, + 423586.46875, + 533219.375, + 454992.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008110221242532134, + 0.0006812610663473606, + 0.0006812110659666359, + 0.0006817537359893322, + 0.0006813214858993888 + ], + "acc_eval": 0.20703125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3761.85400390625, + 178944.296875, + 464984.875, + 587869.375, + 501438.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008038324886001647, + 0.0006578225293196738, + 0.0006502956384792924, + 0.000664222112391144, + 0.0006502254982478917 + ], + "acc_eval": 0.240234375, + "epoch": 25 + }, + { + "hidden_norms": [ + 3818.5869140625, + 193167.4375, + 505599.375, + 643764.4375, + 550033.3125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007956585614010692, + 0.0007038708426989615, + 0.0007025190279819071, + 0.0007078333292156458, + 0.0006988184759393334 + ], + "acc_eval": 0.185546875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3924.1787109375, + 207801.1875, + 548741.125, + 701043.0625, + 599520.4375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009222823427990079, + 0.000673642847687006, + 0.0006724554114043713, + 0.0006726986612193286, + 0.0006725445855408907 + ], + "acc_eval": 0.216796875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4061.806884765625, + 222595.921875, + 590807.5, + 755718.75, + 646775.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008092334610410035, + 0.0007093537133187056, + 0.0007078479393385351, + 0.0007069098646752536, + 0.0007029378321021795 + ], + "acc_eval": 0.2158203125, + "epoch": 28 + }, + { + "hidden_norms": [ + 4216.11083984375, + 237549.296875, + 636429.5625, + 816954.9375, + 699524.9375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008620031294412911, + 0.0007326522027142346, + 0.00072627910412848, + 0.000725903722923249, + 0.0007269763154909015 + ], + "acc_eval": 0.1533203125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4319.05029296875, + 251667.5, + 681409.75, + 874567.9375, + 748820.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008448463049717247, + 0.0007160686072893441, + 0.000714016379788518, + 0.0007141274982132018, + 0.0007095346227288246 + ], + "acc_eval": 0.1591796875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4387.8330078125, + 268470.375, + 733153.125, + 943456.375, + 808793.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009849616326391697, + 0.0007160623208619654, + 0.0007154300110414624, + 0.0007152247708290815, + 0.0007160453242249787 + ], + "acc_eval": 0.1884765625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4495.54638671875, + 291274.59375, + 806698.75, + 1039374.875, + 892062.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008646573405712843, + 0.000731874315533787, + 0.0007177238585427403, + 0.0007205329020507634, + 0.0007192457560449839 + ], + "acc_eval": 0.17578125, + "epoch": 32 + }, + { + "hidden_norms": [ + 4596.96337890625, + 305228.46875, + 848072.5625, + 1092268.625, + 937583.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009474663529545069, + 0.0007221641135402024, + 0.000721680698916316, + 0.0007284134044311941, + 0.0007212713244371116 + ], + "acc_eval": 0.171875, + "epoch": 33 + }, + { + "hidden_norms": [ + 4724.111328125, + 321366.5, + 891238.9375, + 1149886.25, + 987910.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009131877450272441, + 0.0007397676818072796, + 0.0007398735033348203, + 0.0007397927111014724, + 0.0007406016811728477 + ], + "acc_eval": 0.125, + "epoch": 34 + }, + { + "hidden_norms": [ + 4865.970703125, + 344027.15625, + 946722.0625, + 1219714.625, + 1049445.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001010064734145999, + 0.0007341124583035707, + 0.0007336883572861552, + 0.0007345521007664502, + 0.0007338698487728834 + ], + "acc_eval": 0.119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5003.3857421875, + 373410.21875, + 1026535.0625, + 1321456.25, + 1139824.625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010555180488154292, + 0.0007112861494533718, + 0.0007111895247362554, + 0.0007112334715202451, + 0.000711193191818893 + ], + "acc_eval": 0.1591796875, + "epoch": 36 + }, + { + "hidden_norms": [ + 5121.19287109375, + 405646.9375, + 1111111.125, + 1430716.625, + 1237074.375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010308363707736135, + 0.0007563655963167548, + 0.0007560031372122467, + 0.000755665882024914, + 0.0007561628590337932 + ], + "acc_eval": 0.134765625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5212.7294921875, + 434054.15625, + 1180238.125, + 1518019.875, + 1314350.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001035128254443407, + 0.0007314062095247209, + 0.0007304889149963856, + 0.0007291524088941514, + 0.0007313747191801667 + ], + "acc_eval": 0.140625, + "epoch": 38 + }, + { + "hidden_norms": [ + 5322.74951171875, + 462000.6875, + 1248006.75, + 1606243.125, + 1392563.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009023830061778426, + 0.000720554031431675, + 0.0007195135112851858, + 0.0007197313825599849, + 0.0007196948863565922 + ], + "acc_eval": 0.1708984375, + "epoch": 39 + }, + { + "hidden_norms": [ + 5453.89111328125, + 498941.0625, + 1343521.0, + 1731177.375, + 1504101.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010444134240970016, + 0.0007362678297795355, + 0.0007352089160121977, + 0.0007340405718423426, + 0.0007357052527368069 + ], + "acc_eval": 0.1328125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5515.6982421875, + 529817.75, + 1409505.625, + 1816151.0, + 1580539.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011280628386884928, + 0.0007231750059872866, + 0.0007211649208329618, + 0.000721275107935071, + 0.0007212632917799056 + ], + "acc_eval": 0.1611328125, + "epoch": 41 + }, + { + "hidden_norms": [ + 5617.26513671875, + 567492.4375, + 1498097.5, + 1931607.875, + 1684206.875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010544253746047616, + 0.0007354306289926171, + 0.0007348860381171107, + 0.0007349851075559855, + 0.0007350810337811708 + ], + "acc_eval": 0.1416015625, + "epoch": 42 + }, + { + "hidden_norms": [ + 5740.7978515625, + 596215.625, + 1561745.25, + 2014107.25, + 1758526.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010764201870188117, + 0.0007244387525133789, + 0.000723967794328928, + 0.000724096957128495, + 0.0007241644198074937 + ], + "acc_eval": 0.19921875, + "epoch": 43 + }, + { + "hidden_norms": [ + 5808.19677734375, + 630780.3125, + 1636034.875, + 2109305.75, + 1845552.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010526466649025679, + 0.0007206913433037698, + 0.0007207048474811018, + 0.0007211468764580786, + 0.0007207895396277308 + ], + "acc_eval": 0.173828125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5868.3583984375, + 673578.625, + 1729325.25, + 2227518.0, + 1953361.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009479392319917679, + 0.0007091389270499349, + 0.0007090644794516265, + 0.0007082624360918999, + 0.0007085782708600163 + ], + "acc_eval": 0.1923828125, + "epoch": 45 + }, + { + "hidden_norms": [ + 5953.82421875, + 720273.0, + 1840695.5, + 2372038.0, + 2084658.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0014002618845552206, + 0.0007315247785300016, + 0.0007256051758304238, + 0.0007254919619299471, + 0.000725599646102637 + ], + "acc_eval": 0.17578125, + "epoch": 46 + }, + { + "hidden_norms": [ + 6054.7861328125, + 758000.6875, + 1930354.375, + 2488163.75, + 2190582.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001109408913180232, + 0.0007018125616014004, + 0.0007016566814854741, + 0.000701890152413398, + 0.0007018494652584195 + ], + "acc_eval": 0.203125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6155.0859375, + 790443.0, + 2009565.875, + 2590829.25, + 2285268.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010253023356199265, + 0.0007347314967773855, + 0.0007304528844542801, + 0.0007322027231566608, + 0.0007312395609915257 + ], + "acc_eval": 0.154296875, + "epoch": 48 + }, + { + "hidden_norms": [ + 6216.64453125, + 830678.125, + 2088773.5, + 2691122.0, + 2376731.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010403504129499197, + 0.0006902964669279754, + 0.0006906419876031578, + 0.0006905900663696229, + 0.0006906461785547435 + ], + "acc_eval": 0.1591796875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6252.98486328125, + 867790.1875, + 2159729.75, + 2781409.5, + 2460902.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011370684951543808, + 0.0007390088285319507, + 0.0007305812323465943, + 0.0007310720975510776, + 0.0007304322207346559 + ], + "acc_eval": 0.15234375, + "epoch": 50 + }, + { + "hidden_norms": [ + 6294.51611328125, + 897267.5625, + 2218282.5, + 2858224.75, + 2530432.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0013790406519547105, + 0.0007320911972783506, + 0.0007304649334400892, + 0.0007293879170902073, + 0.0007303770980797708 + ], + "acc_eval": 0.1591796875, + "epoch": 51 + }, + { + "hidden_norms": [ + 6312.2314453125, + 935570.375, + 2299086.0, + 2963619.0, + 2627515.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000999285257421434, + 0.0007227054447866976, + 0.0007246703025884926, + 0.0007245387532748282, + 0.0007243558065965772 + ], + "acc_eval": 0.20703125, + "epoch": 52 + }, + { + "hidden_norms": [ + 6387.30322265625, + 977101.125, + 2387243.0, + 3077676.25, + 2733147.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001396833686158061, + 0.0007110408041626215, + 0.0007093287422321737, + 0.000708233390469104, + 0.0007085108081810176 + ], + "acc_eval": 0.1787109375, + "epoch": 53 + }, + { + "hidden_norms": [ + 6406.59033203125, + 1011753.1875, + 2450391.25, + 3158275.0, + 2807055.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0012408416951075196, + 0.0007304692408069968, + 0.000724659999832511, + 0.0007247650064527988, + 0.0007249858463183045 + ], + "acc_eval": 0.130859375, + "epoch": 54 + }, + { + "hidden_norms": [ + 6396.32080078125, + 1051044.375, + 2521085.5, + 3249326.75, + 2890642.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010854896390810609, + 0.0006957638543099165, + 0.0006896257400512695, + 0.0006964386557228863, + 0.0006897017010487616 + ], + "acc_eval": 0.234375, + "epoch": 55 + }, + { + "hidden_norms": [ + 6413.91357421875, + 1083474.5, + 2597945.5, + 3348271.5, + 2981405.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.00098806235473603, + 0.000719150179065764, + 0.0007170068565756083, + 0.0007178731029853225, + 0.0007173708290793002 + ], + "acc_eval": 0.205078125, + "epoch": 56 + }, + { + "hidden_norms": [ + 6406.4228515625, + 1124429.875, + 2675529.5, + 3447474.25, + 3073241.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001149638439528644, + 0.0007225789595395327, + 0.0007212197524495423, + 0.0007210947806015611, + 0.0007211659685708582 + ], + "acc_eval": 0.1494140625, + "epoch": 57 + }, + { + "hidden_norms": [ + 6443.423828125, + 1166184.375, + 2758561.25, + 3551879.75, + 3171214.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001115654013119638, + 0.000685695675201714, + 0.0006846366450190544, + 0.0006861463189125061, + 0.0006862673326395452 + ], + "acc_eval": 0.2490234375, + "epoch": 58 + }, + { + "hidden_norms": [ + 6477.5, + 1208826.0, + 2842194.75, + 3654862.0, + 3267617.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.000923235435038805, + 0.0006659153732471168, + 0.0006642267107963562, + 0.0006722065154463053, + 0.000664416525978595 + ], + "acc_eval": 0.2353515625, + "epoch": 59 + }, + { + "hidden_norms": [ + 6486.1689453125, + 1249377.0, + 2928293.75, + 3765881.75, + 3370835.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008846685523167253, + 0.0006866253679618239, + 0.000686973100528121, + 0.0006869880016893148, + 0.0006870955694466829 + ], + "acc_eval": 0.2373046875, + "epoch": 60 + }, + { + "hidden_norms": [ + 6499.3720703125, + 1291233.25, + 3012714.75, + 3873429.75, + 3471234.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009820004925131798, + 0.0007174524944275618, + 0.0007178467349149287, + 0.0007176626822911203, + 0.0007174718775786459 + ], + "acc_eval": 0.216796875, + "epoch": 61 + }, + { + "hidden_norms": [ + 6486.14404296875, + 1327247.75, + 3088322.75, + 3971415.75, + 3562299.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010241338750347495, + 0.0007171124452725053, + 0.0007174332858994603, + 0.0007172181503847241, + 0.0007169945747591555 + ], + "acc_eval": 0.18359375, + "epoch": 62 + }, + { + "hidden_norms": [ + 6455.17236328125, + 1355067.375, + 3142698.25, + 4041006.5, + 3627490.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009781530825421214, + 0.0007034538430161774, + 0.000703376077581197, + 0.0007118352805264294, + 0.0007080681971274316 + ], + "acc_eval": 0.189453125, + "epoch": 63 + }, + { + "hidden_norms": [ + 6454.62841796875, + 1384795.75, + 3199654.0, + 4114095.75, + 3696468.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009227422997355461, + 0.0007023688522167504, + 0.0007012909045442939, + 0.0007004260551184416, + 0.0007006779196672142 + ], + "acc_eval": 0.21484375, + "epoch": 64 + }, + { + "hidden_norms": [ + 6451.345703125, + 1420232.75, + 3260116.5, + 4190244.25, + 3768354.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008870494784787297, + 0.0007146014831960201, + 0.0007149986922740936, + 0.0007148014265112579, + 0.0007145918207243085 + ], + "acc_eval": 0.197265625, + "epoch": 65 + }, + { + "hidden_norms": [ + 6445.890625, + 1448264.875, + 3319505.0, + 4267505.0, + 3840047.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010003555798903108, + 0.0007171350298449397, + 0.0007168895681388676, + 0.0007169176824390888, + 0.0007170233875513077 + ], + "acc_eval": 0.1591796875, + "epoch": 66 + }, + { + "hidden_norms": [ + 6440.8212890625, + 1478082.75, + 3376291.25, + 4340727.0, + 3909334.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009646597318351269, + 0.0007130720769055188, + 0.0007134011830203235, + 0.0007131980964913964, + 0.0007129770237952471 + ], + "acc_eval": 0.171875, + "epoch": 67 + }, + { + "hidden_norms": [ + 6398.03955078125, + 1508487.5, + 3436526.25, + 4417271.5, + 3981251.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009445869363844395, + 0.0007122856914065778, + 0.0007126569980755448, + 0.0007124742260202765, + 0.0007122504175640643 + ], + "acc_eval": 0.189453125, + "epoch": 68 + }, + { + "hidden_norms": [ + 6389.02392578125, + 1530834.625, + 3480246.5, + 4471170.0, + 4032576.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009853171650320292, + 0.0006874292739666998, + 0.0006876476109027863, + 0.0006881517474539578, + 0.0006880395230837166 + ], + "acc_eval": 0.1904296875, + "epoch": 69 + }, + { + "hidden_norms": [ + 6338.54443359375, + 1561198.875, + 3541681.5, + 4548099.0, + 4105499.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009333671187050641, + 0.0006952910916879773, + 0.0006947650690563023, + 0.0006940987077541649, + 0.0006943742628209293 + ], + "acc_eval": 0.23046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 6280.18603515625, + 1585008.0, + 3589125.25, + 4608667.0, + 4162480.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009699579677544534, + 0.0007101434166543186, + 0.0007104446412995458, + 0.000710242718923837, + 0.0007100136135704815 + ], + "acc_eval": 0.146484375, + "epoch": 71 + }, + { + "hidden_norms": [ + 6252.455078125, + 1608187.875, + 3635014.75, + 4667478.5, + 4218253.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008955001248978078, + 0.0006863236776553094, + 0.0006864941096864641, + 0.000687020889017731, + 0.0006868807831779122 + ], + "acc_eval": 0.2431640625, + "epoch": 72 + }, + { + "hidden_norms": [ + 6201.6845703125, + 1619508.875, + 3661275.25, + 4700652.0, + 4249921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009069991065189242, + 0.0006539999740198255, + 0.0006531713879667222, + 0.0006594359292648733, + 0.000653320224955678 + ], + "acc_eval": 0.2216796875, + "epoch": 73 + }, + { + "hidden_norms": [ + 6182.8115234375, + 1632587.875, + 3679586.25, + 4722070.5, + 4271567.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009595821611583233, + 0.0007079984061419964, + 0.0007082773372530937, + 0.0007081056828610599, + 0.000707884959410876 + ], + "acc_eval": 0.193359375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6153.7392578125, + 1653576.875, + 3722935.0, + 4776921.0, + 4323508.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008598894928582013, + 0.0007073319284245372, + 0.0007075938628986478, + 0.0007074539898894727, + 0.0007072555599734187 + ], + "acc_eval": 0.201171875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6135.21240234375, + 1667474.375, + 3750912.75, + 4812450.5, + 4357575.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009454588289372623, + 0.0007068001432344317, + 0.0007069715647958219, + 0.0007067638216540217, + 0.0007065933896228671 + ], + "acc_eval": 0.2158203125, + "epoch": 76 + }, + { + "hidden_norms": [ + 6085.7109375, + 1679251.75, + 3774334.5, + 4840148.5, + 4384792.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008410231093876064, + 0.0006843701121397316, + 0.0006845371681265533, + 0.00068506138632074, + 0.0006849151104688644 + ], + "acc_eval": 0.2578125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6042.693359375, + 1685705.5, + 3787479.75, + 4856211.0, + 4400193.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008572259685024619, + 0.0006840305286459625, + 0.0006841861759312451, + 0.0006847094628028572, + 0.0006845552125014365 + ], + "acc_eval": 0.2568359375, + "epoch": 78 + }, + { + "hidden_norms": [ + 6003.5390625, + 1702685.5, + 3813174.5, + 4888481.0, + 4430612.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008342780056409538, + 0.0006777377566322684, + 0.0006779460818506777, + 0.0006789933540858328, + 0.0006781259435229003 + ], + "acc_eval": 0.2685546875, + "epoch": 79 + }, + { + "hidden_norms": [ + 5948.60107421875, + 1714243.125, + 3830846.5, + 4910337.5, + 4451921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008218465954996645, + 0.0006832804065197706, + 0.0006831764476373792, + 0.0006826326716691256, + 0.0006829035119153559 + ], + "acc_eval": 0.2529296875, + "epoch": 80 + }, + { + "hidden_norms": [ + 5881.8525390625, + 1718113.375, + 3838036.5, + 4920025.5, + 4461931.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007958809728734195, + 0.000677398347761482, + 0.0006775528891012073, + 0.0006775871734134853, + 0.0006777321686968207 + ], + "acc_eval": 0.2548828125, + "epoch": 81 + }, + { + "hidden_norms": [ + 5816.7880859375, + 1723461.25, + 3850904.75, + 4936806.0, + 4478473.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008361428044736385, + 0.0006769691244699061, + 0.0006771331536583602, + 0.0006771665066480637, + 0.0006773129571229219 + ], + "acc_eval": 0.251953125, + "epoch": 82 + }, + { + "hidden_norms": [ + 5760.41845703125, + 1732135.25, + 3859576.0, + 4947171.0, + 4488986.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008036325452849269, + 0.0006821549613960087, + 0.0006806753808632493, + 0.0006799713592045009, + 0.0006802318384870887 + ], + "acc_eval": 0.2490234375, + "epoch": 83 + }, + { + "hidden_norms": [ + 5710.22998046875, + 1740014.25, + 3871992.25, + 4962337.5, + 4503463.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008278922759927809, + 0.0006754198693670332, + 0.000675307004712522, + 0.0006768241291865706, + 0.0006769676692783833 + ], + "acc_eval": 0.26171875, + "epoch": 84 + }, + { + "hidden_norms": [ + 5685.73828125, + 1745863.25, + 3880256.75, + 4973639.5, + 4514457.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008255501161329448, + 0.0006466225022450089, + 0.0006466452032327652, + 0.0006467151688411832, + 0.0006467655766755342 + ], + "acc_eval": 0.283203125, + "epoch": 85 + }, + { + "hidden_norms": [ + 5637.498046875, + 1743128.375, + 3879796.5, + 4973009.0, + 4514424.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008148956694640219, + 0.0006465681362897158, + 0.0006463592289946973, + 0.0006491504609584808, + 0.0006464755861088634 + ], + "acc_eval": 0.2587890625, + "epoch": 86 + }, + { + "hidden_norms": [ + 5601.87744140625, + 1741859.375, + 3884447.75, + 4978445.5, + 4518886.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008254973217844963, + 0.0006783050484955311, + 0.0006774527719244361, + 0.0006768335006199777, + 0.0006770920008420944 + ], + "acc_eval": 0.298828125, + "epoch": 87 + }, + { + "hidden_norms": [ + 5587.505859375, + 1748285.875, + 3887730.5, + 4982144.0, + 4523151.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008113561780191958, + 0.0006764904828742146, + 0.000676542054861784, + 0.0006762324483133852, + 0.0006764894351363182 + ], + "acc_eval": 0.2734375, + "epoch": 88 + }, + { + "hidden_norms": [ + 5553.013671875, + 1748456.75, + 3890722.0, + 4986538.5, + 4527315.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007909060223028064, + 0.0006763285491615534, + 0.0006762049742974341, + 0.0006756742368452251, + 0.000675930583383888 + ], + "acc_eval": 0.2861328125, + "epoch": 89 + }, + { + "hidden_norms": [ + 5524.611328125, + 1748210.0, + 3893003.75, + 4989732.5, + 4530436.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000797618820797652, + 0.0006453269743360579, + 0.0006453663809224963, + 0.0006454290705733001, + 0.0006454723770730197 + ], + "acc_eval": 0.28515625, + "epoch": 90 + }, + { + "hidden_norms": [ + 5506.21923828125, + 1750958.0, + 3894639.5, + 4992073.0, + 4532399.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007834367570467293, + 0.0006762953125871718, + 0.0006754640489816666, + 0.0006748714949935675, + 0.0006751226610504091 + ], + "acc_eval": 0.2939453125, + "epoch": 91 + }, + { + "hidden_norms": [ + 5485.10791015625, + 1747546.25, + 3895030.0, + 4992480.5, + 4532805.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007779909064993262, + 0.0006450997898355126, + 0.0006451247027143836, + 0.0006455867551267147, + 0.0006452234229072928 + ], + "acc_eval": 0.2890625, + "epoch": 92 + }, + { + "hidden_norms": [ + 5464.07763671875, + 1749313.125, + 3894610.75, + 4991684.0, + 4532270.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008090221090242267, + 0.0006661301013082266, + 0.0006646219990216196, + 0.0006726695573888719, + 0.0006649038987234235 + ], + "acc_eval": 0.283203125, + "epoch": 93 + }, + { + "hidden_norms": [ + 5451.2841796875, + 1749389.0, + 3894315.25, + 4990837.5, + 4531011.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007907215040177107, + 0.0006448677740991116, + 0.0006448915228247643, + 0.0006451430963352323, + 0.0006449950742535293 + ], + "acc_eval": 0.2958984375, + "epoch": 94 + }, + { + "hidden_norms": [ + 5437.77099609375, + 1750653.125, + 3895251.75, + 4992303.0, + 4532441.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007774807745590806, + 0.000676269584801048, + 0.0006763145211152732, + 0.0006763775018043816, + 0.000676501716952771 + ], + "acc_eval": 0.2763671875, + "epoch": 95 + }, + { + "hidden_norms": [ + 5427.34619140625, + 1751408.875, + 3894547.75, + 4991554.5, + 4532145.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797307334840298, + 0.000664835621137172, + 0.0006642266525886953, + 0.000671364541631192, + 0.0006645115208812058 + ], + "acc_eval": 0.296875, + "epoch": 96 + }, + { + "hidden_norms": [ + 5420.30615234375, + 1751757.5, + 3894027.5, + 4991042.0, + 4531674.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797667058184743, + 0.0006446840125136077, + 0.0006447113119065762, + 0.0006447701598517597, + 0.0006448116037063301 + ], + "acc_eval": 0.2939453125, + "epoch": 97 + }, + { + "hidden_norms": [ + 5416.81396484375, + 1751629.625, + 3893959.25, + 4991021.5, + 4531639.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007706825854256749, + 0.0006446407060138881, + 0.0006406756583601236, + 0.0006447536870837212, + 0.0006393496878445148 + ], + "acc_eval": 0.306640625, + "epoch": 98 + }, + { + "hidden_norms": [ + 5415.3095703125, + 1751552.75, + 3893897.0, + 4990973.0, + 4531587.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007776900893077254, + 0.0006458400748670101, + 0.0006446869228966534, + 0.0006466003833338618, + 0.0006447876221500337 + ], + "acc_eval": 0.2978515625, + "epoch": 99 + }, + { + "hidden_norms": [ + 5414.92822265625, + 1751530.25, + 3893876.5, + 4990954.0, + 4531568.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007761479937471449, + 0.0006465426995418966, + 0.0006446881452575326, + 0.0006466349004767835, + 0.0006447875639423728 + ], + "acc_eval": 0.294921875, + "epoch": 100 + } + ], + "arch": "resmlp_noln", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json new file mode 100644 index 0000000..7e5cb37 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json @@ -0,0 +1,1824 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "acc_eval": 0.1123046875, + "epoch": 0 + }, + { + "hidden_norms": [ + 736.34716796875, + 1637.1044921875, + 2033.1922607421875, + 2161.380859375, + 2126.18505859375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0006836718530394137, + 0.0006813183426856995, + 0.0006814387743361294, + 0.0006832550279796124, + 0.0006794488872401416 + ], + "acc_eval": 0.1953125, + "epoch": 1 + }, + { + "hidden_norms": [ + 1106.3868408203125, + 2963.552001953125, + 4087.33837890625, + 4421.4921875, + 4265.1083984375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007476353785023093, + 0.0007440777844749391, + 0.0007443943759426475, + 0.0007477496401406825, + 0.0007366884965449572 + ], + "acc_eval": 0.1044921875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1371.9425048828125, + 4214.05078125, + 6238.47265625, + 6697.2333984375, + 6399.22314453125 + ], + "bp_grad_norms_per_sample_med": [ + 0.000730870058760047, + 0.00072717375587672, + 0.0007270713686011732, + 0.0007290731882676482, + 0.0007233614451251924 + ], + "acc_eval": 0.1943359375, + "epoch": 3 + }, + { + "hidden_norms": [ + 1574.7962646484375, + 4805.0556640625, + 7044.64599609375, + 7593.78955078125, + 7215.32763671875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007098641362972558, + 0.0007034889422357082, + 0.0007031699060462415, + 0.0007120345253497362, + 0.000694308546371758 + ], + "acc_eval": 0.2451171875, + "epoch": 4 + }, + { + "hidden_norms": [ + 1726.088623046875, + 6184.34521484375, + 9521.791015625, + 10387.7236328125, + 9721.431640625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007400272879749537, + 0.0007343650795519352, + 0.0007334973197430372, + 0.0007343514007516205, + 0.0007319966680370271 + ], + "acc_eval": 0.212890625, + "epoch": 5 + }, + { + "hidden_norms": [ + 1902.689697265625, + 7697.52197265625, + 12328.0595703125, + 13597.1787109375, + 12504.158203125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007165716378949583, + 0.0007126733544282615, + 0.0007124089752323925, + 0.0007126083364710212, + 0.0007107863784767687 + ], + "acc_eval": 0.15625, + "epoch": 6 + }, + { + "hidden_norms": [ + 2069.750244140625, + 10379.2958984375, + 16444.7421875, + 18267.94921875, + 16595.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007099996437318623, + 0.0007088935235515237, + 0.0007090346189215779, + 0.000710709486156702, + 0.0007023006328381598 + ], + "acc_eval": 0.154296875, + "epoch": 7 + }, + { + "hidden_norms": [ + 2226.40673828125, + 12703.916015625, + 20184.30859375, + 22453.73828125, + 20183.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.00072157580871135, + 0.0007210742915049195, + 0.0007212630589492619, + 0.0007244180305860937, + 0.0007163899717852473 + ], + "acc_eval": 0.2236328125, + "epoch": 8 + }, + { + "hidden_norms": [ + 2289.455078125, + 15611.2138671875, + 24559.412109375, + 27336.787109375, + 24451.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007243232685141265, + 0.0007221215637400746, + 0.0007219284889288247, + 0.0007259267731569707, + 0.0007173537742346525 + ], + "acc_eval": 0.169921875, + "epoch": 9 + }, + { + "hidden_norms": [ + 2396.09814453125, + 19678.587890625, + 30417.08203125, + 34140.70703125, + 30261.052734375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007124242256395519, + 0.0007074667955748737, + 0.0007074963650666177, + 0.0007131542661227286, + 0.0007022957433946431 + ], + "acc_eval": 0.1904296875, + "epoch": 10 + }, + { + "hidden_norms": [ + 2467.864013671875, + 24019.642578125, + 41156.921875, + 46706.38671875, + 41256.71484375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007333463290706277, + 0.0007277126424014568, + 0.0007268521003425121, + 0.000731462670955807, + 0.0007225224399007857 + ], + "acc_eval": 0.169921875, + "epoch": 11 + }, + { + "hidden_norms": [ + 2518.561767578125, + 28957.451171875, + 55737.69140625, + 64112.609375, + 56246.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007202349370345473, + 0.0007073598098941147, + 0.0007049349951557815, + 0.0007059182389639318, + 0.0007044971571303904 + ], + "acc_eval": 0.1513671875, + "epoch": 12 + }, + { + "hidden_norms": [ + 2614.843994140625, + 34279.15625, + 74158.109375, + 86073.96875, + 75187.59375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007299556746147573, + 0.0007100331713445485, + 0.0007101728115230799, + 0.0007166104041971266, + 0.0007030466804280877 + ], + "acc_eval": 0.24609375, + "epoch": 13 + }, + { + "hidden_norms": [ + 2697.871337890625, + 41263.5390625, + 96222.8984375, + 112901.9765625, + 98551.3046875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007336065755225718, + 0.0007151410100050271, + 0.0007150733144953847, + 0.0007166287978179753, + 0.0007151660392992198 + ], + "acc_eval": 0.134765625, + "epoch": 14 + }, + { + "hidden_norms": [ + 2815.983154296875, + 53842.3828125, + 126185.5625, + 149526.796875, + 130144.4765625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007365003693848848, + 0.0007177364313974977, + 0.0007168670417740941, + 0.000717108603566885, + 0.0007130720769055188 + ], + "acc_eval": 0.150390625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2928.448974609375, + 65162.98046875, + 153909.296875, + 184005.875, + 159483.03125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007613440393470228, + 0.000720723532140255, + 0.000720796815585345, + 0.0007208258030004799, + 0.0007211563643068075 + ], + "acc_eval": 0.166015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 2970.975341796875, + 76176.9609375, + 179093.75, + 216167.875, + 186723.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007602480472996831, + 0.0007191941258497536, + 0.0007163456757552922, + 0.0007164765265770257, + 0.0007142137037590146 + ], + "acc_eval": 0.1796875, + "epoch": 17 + }, + { + "hidden_norms": [ + 3078.336181640625, + 91839.40625, + 215980.015625, + 263515.15625, + 227071.515625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007584959384985268, + 0.0007150565506890416, + 0.0007151922909542918, + 0.000715585716534406, + 0.0007152389152906835 + ], + "acc_eval": 0.1767578125, + "epoch": 18 + }, + { + "hidden_norms": [ + 3202.803466796875, + 104358.6875, + 248325.390625, + 305395.84375, + 262365.46875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007867171661928296, + 0.0007155268103815615, + 0.0007155817584134638, + 0.0007157608633860946, + 0.0007155768107622862 + ], + "acc_eval": 0.138671875, + "epoch": 19 + }, + { + "hidden_norms": [ + 3282.27490234375, + 117747.359375, + 284217.3125, + 351018.15625, + 300903.65625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007691550417803228, + 0.0007147297146730125, + 0.0007147309370338917, + 0.0007150261080823839, + 0.0007147534633986652 + ], + "acc_eval": 0.1923828125, + "epoch": 20 + }, + { + "hidden_norms": [ + 3394.945556640625, + 129443.9765625, + 317078.65625, + 393509.375, + 336658.40625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008442914695478976, + 0.0007179519161581993, + 0.0007190873729996383, + 0.000723545381333679, + 0.0007175213540904224 + ], + "acc_eval": 0.1376953125, + "epoch": 21 + }, + { + "hidden_norms": [ + 3484.2763671875, + 140426.171875, + 355086.84375, + 443148.09375, + 378501.53125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007702927687205374, + 0.0006826652679592371, + 0.0006794629734940827, + 0.0006826536264270544, + 0.0006794703076593578 + ], + "acc_eval": 0.19140625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3529.414306640625, + 153612.265625, + 393522.9375, + 493183.03125, + 421284.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008731107809580863, + 0.0007047304534353316, + 0.0007038630428723991, + 0.000708943116478622, + 0.000701444165315479 + ], + "acc_eval": 0.16796875, + "epoch": 23 + }, + { + "hidden_norms": [ + 3604.90283203125, + 165405.75, + 423586.46875, + 533219.375, + 454992.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008110221242532134, + 0.0006812610663473606, + 0.0006812110659666359, + 0.0006817537359893322, + 0.0006813214858993888 + ], + "acc_eval": 0.20703125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3761.85400390625, + 178944.296875, + 464984.875, + 587869.375, + 501438.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008038324886001647, + 0.0006578225293196738, + 0.0006502956384792924, + 0.000664222112391144, + 0.0006502254982478917 + ], + "acc_eval": 0.240234375, + "epoch": 25 + }, + { + "hidden_norms": [ + 3818.5869140625, + 193167.4375, + 505599.375, + 643764.4375, + 550033.3125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007956585614010692, + 0.0007038708426989615, + 0.0007025190279819071, + 0.0007078333292156458, + 0.0006988184759393334 + ], + "acc_eval": 0.185546875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3924.1787109375, + 207801.1875, + 548741.125, + 701043.0625, + 599520.4375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009222823427990079, + 0.000673642847687006, + 0.0006724554114043713, + 0.0006726986612193286, + 0.0006725445855408907 + ], + "acc_eval": 0.216796875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4061.806884765625, + 222595.921875, + 590807.5, + 755718.75, + 646775.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008092334610410035, + 0.0007093537133187056, + 0.0007078479393385351, + 0.0007069098646752536, + 0.0007029378321021795 + ], + "acc_eval": 0.2158203125, + "epoch": 28 + }, + { + "hidden_norms": [ + 4216.11083984375, + 237549.296875, + 636429.5625, + 816954.9375, + 699524.9375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008620031294412911, + 0.0007326522027142346, + 0.00072627910412848, + 0.000725903722923249, + 0.0007269763154909015 + ], + "acc_eval": 0.1533203125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4319.05029296875, + 251667.5, + 681409.75, + 874567.9375, + 748820.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008448463049717247, + 0.0007160686072893441, + 0.000714016379788518, + 0.0007141274982132018, + 0.0007095346227288246 + ], + "acc_eval": 0.1591796875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4387.8330078125, + 268470.375, + 733153.125, + 943456.375, + 808793.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009849616326391697, + 0.0007160623208619654, + 0.0007154300110414624, + 0.0007152247708290815, + 0.0007160453242249787 + ], + "acc_eval": 0.1884765625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4495.54638671875, + 291274.59375, + 806698.75, + 1039374.875, + 892062.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008646573405712843, + 0.000731874315533787, + 0.0007177238585427403, + 0.0007205329020507634, + 0.0007192457560449839 + ], + "acc_eval": 0.17578125, + "epoch": 32 + }, + { + "hidden_norms": [ + 4596.96337890625, + 305228.46875, + 848072.5625, + 1092268.625, + 937583.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009474663529545069, + 0.0007221641135402024, + 0.000721680698916316, + 0.0007284134044311941, + 0.0007212713244371116 + ], + "acc_eval": 0.171875, + "epoch": 33 + }, + { + "hidden_norms": [ + 4724.111328125, + 321366.5, + 891238.9375, + 1149886.25, + 987910.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009131877450272441, + 0.0007397676818072796, + 0.0007398735033348203, + 0.0007397927111014724, + 0.0007406016811728477 + ], + "acc_eval": 0.125, + "epoch": 34 + }, + { + "hidden_norms": [ + 4865.970703125, + 344027.15625, + 946722.0625, + 1219714.625, + 1049445.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001010064734145999, + 0.0007341124583035707, + 0.0007336883572861552, + 0.0007345521007664502, + 0.0007338698487728834 + ], + "acc_eval": 0.119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5003.3857421875, + 373410.21875, + 1026535.0625, + 1321456.25, + 1139824.625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010555180488154292, + 0.0007112861494533718, + 0.0007111895247362554, + 0.0007112334715202451, + 0.000711193191818893 + ], + "acc_eval": 0.1591796875, + "epoch": 36 + }, + { + "hidden_norms": [ + 5121.19287109375, + 405646.9375, + 1111111.125, + 1430716.625, + 1237074.375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010308363707736135, + 0.0007563655963167548, + 0.0007560031372122467, + 0.000755665882024914, + 0.0007561628590337932 + ], + "acc_eval": 0.134765625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5212.7294921875, + 434054.15625, + 1180238.125, + 1518019.875, + 1314350.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001035128254443407, + 0.0007314062095247209, + 0.0007304889149963856, + 0.0007291524088941514, + 0.0007313747191801667 + ], + "acc_eval": 0.140625, + "epoch": 38 + }, + { + "hidden_norms": [ + 5322.74951171875, + 462000.6875, + 1248006.75, + 1606243.125, + 1392563.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009023830061778426, + 0.000720554031431675, + 0.0007195135112851858, + 0.0007197313825599849, + 0.0007196948863565922 + ], + "acc_eval": 0.1708984375, + "epoch": 39 + }, + { + "hidden_norms": [ + 5453.89111328125, + 498941.0625, + 1343521.0, + 1731177.375, + 1504101.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010444134240970016, + 0.0007362678297795355, + 0.0007352089160121977, + 0.0007340405718423426, + 0.0007357052527368069 + ], + "acc_eval": 0.1328125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5515.6982421875, + 529817.75, + 1409505.625, + 1816151.0, + 1580539.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011280628386884928, + 0.0007231750059872866, + 0.0007211649208329618, + 0.000721275107935071, + 0.0007212632917799056 + ], + "acc_eval": 0.1611328125, + "epoch": 41 + }, + { + "hidden_norms": [ + 5617.26513671875, + 567492.4375, + 1498097.5, + 1931607.875, + 1684206.875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010544253746047616, + 0.0007354306289926171, + 0.0007348860381171107, + 0.0007349851075559855, + 0.0007350810337811708 + ], + "acc_eval": 0.1416015625, + "epoch": 42 + }, + { + "hidden_norms": [ + 5740.7978515625, + 596215.625, + 1561745.25, + 2014107.25, + 1758526.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010764201870188117, + 0.0007244387525133789, + 0.000723967794328928, + 0.000724096957128495, + 0.0007241644198074937 + ], + "acc_eval": 0.19921875, + "epoch": 43 + }, + { + "hidden_norms": [ + 5808.19677734375, + 630780.3125, + 1636034.875, + 2109305.75, + 1845552.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010526466649025679, + 0.0007206913433037698, + 0.0007207048474811018, + 0.0007211468764580786, + 0.0007207895396277308 + ], + "acc_eval": 0.173828125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5868.3583984375, + 673578.625, + 1729325.25, + 2227518.0, + 1953361.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009479392319917679, + 0.0007091389270499349, + 0.0007090644794516265, + 0.0007082624360918999, + 0.0007085782708600163 + ], + "acc_eval": 0.1923828125, + "epoch": 45 + }, + { + "hidden_norms": [ + 5953.82421875, + 720273.0, + 1840695.5, + 2372038.0, + 2084658.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0014002618845552206, + 0.0007315247785300016, + 0.0007256051758304238, + 0.0007254919619299471, + 0.000725599646102637 + ], + "acc_eval": 0.17578125, + "epoch": 46 + }, + { + "hidden_norms": [ + 6054.7861328125, + 758000.6875, + 1930354.375, + 2488163.75, + 2190582.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001109408913180232, + 0.0007018125616014004, + 0.0007016566814854741, + 0.000701890152413398, + 0.0007018494652584195 + ], + "acc_eval": 0.203125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6155.0859375, + 790443.0, + 2009565.875, + 2590829.25, + 2285268.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010253023356199265, + 0.0007347314967773855, + 0.0007304528844542801, + 0.0007322027231566608, + 0.0007312395609915257 + ], + "acc_eval": 0.154296875, + "epoch": 48 + }, + { + "hidden_norms": [ + 6216.64453125, + 830678.125, + 2088773.5, + 2691122.0, + 2376731.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010403504129499197, + 0.0006902964669279754, + 0.0006906419876031578, + 0.0006905900663696229, + 0.0006906461785547435 + ], + "acc_eval": 0.1591796875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6252.98486328125, + 867790.1875, + 2159729.75, + 2781409.5, + 2460902.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011370684951543808, + 0.0007390088285319507, + 0.0007305812323465943, + 0.0007310720975510776, + 0.0007304322207346559 + ], + "acc_eval": 0.15234375, + "epoch": 50 + }, + { + "hidden_norms": [ + 6294.51611328125, + 897267.5625, + 2218282.5, + 2858224.75, + 2530432.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0013790406519547105, + 0.0007320911972783506, + 0.0007304649334400892, + 0.0007293879170902073, + 0.0007303770980797708 + ], + "acc_eval": 0.1591796875, + "epoch": 51 + }, + { + "hidden_norms": [ + 6312.2314453125, + 935570.375, + 2299086.0, + 2963619.0, + 2627515.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000999285257421434, + 0.0007227054447866976, + 0.0007246703025884926, + 0.0007245387532748282, + 0.0007243558065965772 + ], + "acc_eval": 0.20703125, + "epoch": 52 + }, + { + "hidden_norms": [ + 6387.30322265625, + 977101.125, + 2387243.0, + 3077676.25, + 2733147.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001396833686158061, + 0.0007110408041626215, + 0.0007093287422321737, + 0.000708233390469104, + 0.0007085108081810176 + ], + "acc_eval": 0.1787109375, + "epoch": 53 + }, + { + "hidden_norms": [ + 6406.59033203125, + 1011753.1875, + 2450391.25, + 3158275.0, + 2807055.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0012408416951075196, + 0.0007304692408069968, + 0.000724659999832511, + 0.0007247650064527988, + 0.0007249858463183045 + ], + "acc_eval": 0.130859375, + "epoch": 54 + }, + { + "hidden_norms": [ + 6396.32080078125, + 1051044.375, + 2521085.5, + 3249326.75, + 2890642.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010854896390810609, + 0.0006957638543099165, + 0.0006896257400512695, + 0.0006964386557228863, + 0.0006897017010487616 + ], + "acc_eval": 0.234375, + "epoch": 55 + }, + { + "hidden_norms": [ + 6413.91357421875, + 1083474.5, + 2597945.5, + 3348271.5, + 2981405.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.00098806235473603, + 0.000719150179065764, + 0.0007170068565756083, + 0.0007178731029853225, + 0.0007173708290793002 + ], + "acc_eval": 0.205078125, + "epoch": 56 + }, + { + "hidden_norms": [ + 6406.4228515625, + 1124429.875, + 2675529.5, + 3447474.25, + 3073241.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001149638439528644, + 0.0007225789595395327, + 0.0007212197524495423, + 0.0007210947806015611, + 0.0007211659685708582 + ], + "acc_eval": 0.1494140625, + "epoch": 57 + }, + { + "hidden_norms": [ + 6443.423828125, + 1166184.375, + 2758561.25, + 3551879.75, + 3171214.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001115654013119638, + 0.000685695675201714, + 0.0006846366450190544, + 0.0006861463189125061, + 0.0006862673326395452 + ], + "acc_eval": 0.2490234375, + "epoch": 58 + }, + { + "hidden_norms": [ + 6477.5, + 1208826.0, + 2842194.75, + 3654862.0, + 3267617.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.000923235435038805, + 0.0006659153732471168, + 0.0006642267107963562, + 0.0006722065154463053, + 0.000664416525978595 + ], + "acc_eval": 0.2353515625, + "epoch": 59 + }, + { + "hidden_norms": [ + 6486.1689453125, + 1249377.0, + 2928293.75, + 3765881.75, + 3370835.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008846685523167253, + 0.0006866253679618239, + 0.000686973100528121, + 0.0006869880016893148, + 0.0006870955694466829 + ], + "acc_eval": 0.2373046875, + "epoch": 60 + }, + { + "hidden_norms": [ + 6499.3720703125, + 1291233.25, + 3012714.75, + 3873429.75, + 3471234.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009820004925131798, + 0.0007174524944275618, + 0.0007178467349149287, + 0.0007176626822911203, + 0.0007174718775786459 + ], + "acc_eval": 0.216796875, + "epoch": 61 + }, + { + "hidden_norms": [ + 6486.14404296875, + 1327247.75, + 3088322.75, + 3971415.75, + 3562299.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010241338750347495, + 0.0007171124452725053, + 0.0007174332858994603, + 0.0007172181503847241, + 0.0007169945747591555 + ], + "acc_eval": 0.18359375, + "epoch": 62 + }, + { + "hidden_norms": [ + 6455.17236328125, + 1355067.375, + 3142698.25, + 4041006.5, + 3627490.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009781530825421214, + 0.0007034538430161774, + 0.000703376077581197, + 0.0007118352805264294, + 0.0007080681971274316 + ], + "acc_eval": 0.189453125, + "epoch": 63 + }, + { + "hidden_norms": [ + 6454.62841796875, + 1384795.75, + 3199654.0, + 4114095.75, + 3696468.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009227422997355461, + 0.0007023688522167504, + 0.0007012909045442939, + 0.0007004260551184416, + 0.0007006779196672142 + ], + "acc_eval": 0.21484375, + "epoch": 64 + }, + { + "hidden_norms": [ + 6451.345703125, + 1420232.75, + 3260116.5, + 4190244.25, + 3768354.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008870494784787297, + 0.0007146014831960201, + 0.0007149986922740936, + 0.0007148014265112579, + 0.0007145918207243085 + ], + "acc_eval": 0.197265625, + "epoch": 65 + }, + { + "hidden_norms": [ + 6445.890625, + 1448264.875, + 3319505.0, + 4267505.0, + 3840047.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010003555798903108, + 0.0007171350298449397, + 0.0007168895681388676, + 0.0007169176824390888, + 0.0007170233875513077 + ], + "acc_eval": 0.1591796875, + "epoch": 66 + }, + { + "hidden_norms": [ + 6440.8212890625, + 1478082.75, + 3376291.25, + 4340727.0, + 3909334.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009646597318351269, + 0.0007130720769055188, + 0.0007134011830203235, + 0.0007131980964913964, + 0.0007129770237952471 + ], + "acc_eval": 0.171875, + "epoch": 67 + }, + { + "hidden_norms": [ + 6398.03955078125, + 1508487.5, + 3436526.25, + 4417271.5, + 3981251.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009445869363844395, + 0.0007122856914065778, + 0.0007126569980755448, + 0.0007124742260202765, + 0.0007122504175640643 + ], + "acc_eval": 0.189453125, + "epoch": 68 + }, + { + "hidden_norms": [ + 6389.02392578125, + 1530834.625, + 3480246.5, + 4471170.0, + 4032576.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009853171650320292, + 0.0006874292739666998, + 0.0006876476109027863, + 0.0006881517474539578, + 0.0006880395230837166 + ], + "acc_eval": 0.1904296875, + "epoch": 69 + }, + { + "hidden_norms": [ + 6338.54443359375, + 1561198.875, + 3541681.5, + 4548099.0, + 4105499.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009333671187050641, + 0.0006952910916879773, + 0.0006947650690563023, + 0.0006940987077541649, + 0.0006943742628209293 + ], + "acc_eval": 0.23046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 6280.18603515625, + 1585008.0, + 3589125.25, + 4608667.0, + 4162480.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009699579677544534, + 0.0007101434166543186, + 0.0007104446412995458, + 0.000710242718923837, + 0.0007100136135704815 + ], + "acc_eval": 0.146484375, + "epoch": 71 + }, + { + "hidden_norms": [ + 6252.455078125, + 1608187.875, + 3635014.75, + 4667478.5, + 4218253.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008955001248978078, + 0.0006863236776553094, + 0.0006864941096864641, + 0.000687020889017731, + 0.0006868807831779122 + ], + "acc_eval": 0.2431640625, + "epoch": 72 + }, + { + "hidden_norms": [ + 6201.6845703125, + 1619508.875, + 3661275.25, + 4700652.0, + 4249921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009069991065189242, + 0.0006539999740198255, + 0.0006531713879667222, + 0.0006594359292648733, + 0.000653320224955678 + ], + "acc_eval": 0.2216796875, + "epoch": 73 + }, + { + "hidden_norms": [ + 6182.8115234375, + 1632587.875, + 3679586.25, + 4722070.5, + 4271567.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009595821611583233, + 0.0007079984061419964, + 0.0007082773372530937, + 0.0007081056828610599, + 0.000707884959410876 + ], + "acc_eval": 0.193359375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6153.7392578125, + 1653576.875, + 3722935.0, + 4776921.0, + 4323508.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008598894928582013, + 0.0007073319284245372, + 0.0007075938628986478, + 0.0007074539898894727, + 0.0007072555599734187 + ], + "acc_eval": 0.201171875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6135.21240234375, + 1667474.375, + 3750912.75, + 4812450.5, + 4357575.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009454588289372623, + 0.0007068001432344317, + 0.0007069715647958219, + 0.0007067638216540217, + 0.0007065933896228671 + ], + "acc_eval": 0.2158203125, + "epoch": 76 + }, + { + "hidden_norms": [ + 6085.7109375, + 1679251.75, + 3774334.5, + 4840148.5, + 4384792.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008410231093876064, + 0.0006843701121397316, + 0.0006845371681265533, + 0.00068506138632074, + 0.0006849151104688644 + ], + "acc_eval": 0.2578125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6042.693359375, + 1685705.5, + 3787479.75, + 4856211.0, + 4400193.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008572259685024619, + 0.0006840305286459625, + 0.0006841861759312451, + 0.0006847094628028572, + 0.0006845552125014365 + ], + "acc_eval": 0.2568359375, + "epoch": 78 + }, + { + "hidden_norms": [ + 6003.5390625, + 1702685.5, + 3813174.5, + 4888481.0, + 4430612.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008342780056409538, + 0.0006777377566322684, + 0.0006779460818506777, + 0.0006789933540858328, + 0.0006781259435229003 + ], + "acc_eval": 0.2685546875, + "epoch": 79 + }, + { + "hidden_norms": [ + 5948.60107421875, + 1714243.125, + 3830846.5, + 4910337.5, + 4451921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008218465954996645, + 0.0006832804065197706, + 0.0006831764476373792, + 0.0006826326716691256, + 0.0006829035119153559 + ], + "acc_eval": 0.2529296875, + "epoch": 80 + }, + { + "hidden_norms": [ + 5881.8525390625, + 1718113.375, + 3838036.5, + 4920025.5, + 4461931.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007958809728734195, + 0.000677398347761482, + 0.0006775528891012073, + 0.0006775871734134853, + 0.0006777321686968207 + ], + "acc_eval": 0.2548828125, + "epoch": 81 + }, + { + "hidden_norms": [ + 5816.7880859375, + 1723461.25, + 3850904.75, + 4936806.0, + 4478473.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008361428044736385, + 0.0006769691244699061, + 0.0006771331536583602, + 0.0006771665066480637, + 0.0006773129571229219 + ], + "acc_eval": 0.251953125, + "epoch": 82 + }, + { + "hidden_norms": [ + 5760.41845703125, + 1732135.25, + 3859576.0, + 4947171.0, + 4488986.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008036325452849269, + 0.0006821549613960087, + 0.0006806753808632493, + 0.0006799713592045009, + 0.0006802318384870887 + ], + "acc_eval": 0.2490234375, + "epoch": 83 + }, + { + "hidden_norms": [ + 5710.22998046875, + 1740014.25, + 3871992.25, + 4962337.5, + 4503463.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008278922759927809, + 0.0006754198693670332, + 0.000675307004712522, + 0.0006768241291865706, + 0.0006769676692783833 + ], + "acc_eval": 0.26171875, + "epoch": 84 + }, + { + "hidden_norms": [ + 5685.73828125, + 1745863.25, + 3880256.75, + 4973639.5, + 4514457.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008255501161329448, + 0.0006466225022450089, + 0.0006466452032327652, + 0.0006467151688411832, + 0.0006467655766755342 + ], + "acc_eval": 0.283203125, + "epoch": 85 + }, + { + "hidden_norms": [ + 5637.498046875, + 1743128.375, + 3879796.5, + 4973009.0, + 4514424.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008148956694640219, + 0.0006465681362897158, + 0.0006463592289946973, + 0.0006491504609584808, + 0.0006464755861088634 + ], + "acc_eval": 0.2587890625, + "epoch": 86 + }, + { + "hidden_norms": [ + 5601.87744140625, + 1741859.375, + 3884447.75, + 4978445.5, + 4518886.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008254973217844963, + 0.0006783050484955311, + 0.0006774527719244361, + 0.0006768335006199777, + 0.0006770920008420944 + ], + "acc_eval": 0.298828125, + "epoch": 87 + }, + { + "hidden_norms": [ + 5587.505859375, + 1748285.875, + 3887730.5, + 4982144.0, + 4523151.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008113561780191958, + 0.0006764904828742146, + 0.000676542054861784, + 0.0006762324483133852, + 0.0006764894351363182 + ], + "acc_eval": 0.2734375, + "epoch": 88 + }, + { + "hidden_norms": [ + 5553.013671875, + 1748456.75, + 3890722.0, + 4986538.5, + 4527315.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007909060223028064, + 0.0006763285491615534, + 0.0006762049742974341, + 0.0006756742368452251, + 0.000675930583383888 + ], + "acc_eval": 0.2861328125, + "epoch": 89 + }, + { + "hidden_norms": [ + 5524.611328125, + 1748210.0, + 3893003.75, + 4989732.5, + 4530436.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000797618820797652, + 0.0006453269743360579, + 0.0006453663809224963, + 0.0006454290705733001, + 0.0006454723770730197 + ], + "acc_eval": 0.28515625, + "epoch": 90 + }, + { + "hidden_norms": [ + 5506.21923828125, + 1750958.0, + 3894639.5, + 4992073.0, + 4532399.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007834367570467293, + 0.0006762953125871718, + 0.0006754640489816666, + 0.0006748714949935675, + 0.0006751226610504091 + ], + "acc_eval": 0.2939453125, + "epoch": 91 + }, + { + "hidden_norms": [ + 5485.10791015625, + 1747546.25, + 3895030.0, + 4992480.5, + 4532805.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007779909064993262, + 0.0006450997898355126, + 0.0006451247027143836, + 0.0006455867551267147, + 0.0006452234229072928 + ], + "acc_eval": 0.2890625, + "epoch": 92 + }, + { + "hidden_norms": [ + 5464.07763671875, + 1749313.125, + 3894610.75, + 4991684.0, + 4532270.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008090221090242267, + 0.0006661301013082266, + 0.0006646219990216196, + 0.0006726695573888719, + 0.0006649038987234235 + ], + "acc_eval": 0.283203125, + "epoch": 93 + }, + { + "hidden_norms": [ + 5451.2841796875, + 1749389.0, + 3894315.25, + 4990837.5, + 4531011.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007907215040177107, + 0.0006448677740991116, + 0.0006448915228247643, + 0.0006451430963352323, + 0.0006449950742535293 + ], + "acc_eval": 0.2958984375, + "epoch": 94 + }, + { + "hidden_norms": [ + 5437.77099609375, + 1750653.125, + 3895251.75, + 4992303.0, + 4532441.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007774807745590806, + 0.000676269584801048, + 0.0006763145211152732, + 0.0006763775018043816, + 0.000676501716952771 + ], + "acc_eval": 0.2763671875, + "epoch": 95 + }, + { + "hidden_norms": [ + 5427.34619140625, + 1751408.875, + 3894547.75, + 4991554.5, + 4532145.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797307334840298, + 0.000664835621137172, + 0.0006642266525886953, + 0.000671364541631192, + 0.0006645115208812058 + ], + "acc_eval": 0.296875, + "epoch": 96 + }, + { + "hidden_norms": [ + 5420.30615234375, + 1751757.5, + 3894027.5, + 4991042.0, + 4531674.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797667058184743, + 0.0006446840125136077, + 0.0006447113119065762, + 0.0006447701598517597, + 0.0006448116037063301 + ], + "acc_eval": 0.2939453125, + "epoch": 97 + }, + { + "hidden_norms": [ + 5416.81396484375, + 1751629.625, + 3893959.25, + 4991021.5, + 4531639.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007706825854256749, + 0.0006446407060138881, + 0.0006406756583601236, + 0.0006447536870837212, + 0.0006393496878445148 + ], + "acc_eval": 0.306640625, + "epoch": 98 + }, + { + "hidden_norms": [ + 5415.3095703125, + 1751552.75, + 3893897.0, + 4990973.0, + 4531587.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007776900893077254, + 0.0006458400748670101, + 0.0006446869228966534, + 0.0006466003833338618, + 0.0006447876221500337 + ], + "acc_eval": 0.2978515625, + "epoch": 99 + }, + { + "hidden_norms": [ + 5414.92822265625, + 1751530.25, + 3893876.5, + 4990954.0, + 4531568.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007761479937471449, + 0.0006465426995418966, + 0.0006446881452575326, + 0.0006466349004767835, + 0.0006447875639423728 + ], + "acc_eval": 0.294921875, + "epoch": 100 + } + ], + "arch": "resmlp_noln", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s123.json b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json new file mode 100644 index 0000000..f3f6392 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 40.83987808227539, + 37.75401306152344, + 36.1661376953125, + 34.91564178466797, + 34.55687713623047 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012231437722221017, + 0.00012846711615566164, + 0.00013815351121593267, + 0.00015655385504942387, + 0.0002070761693175882 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.435546875, + "loss_eval": 1.5918896198272705, + "epoch": 1 + }, + { + "hidden_norms": [ + 54.60358810424805, + 49.46598434448242, + 46.75371170043945, + 44.21198272705078, + 42.52875900268555 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010624218703014776, + 0.00011056899529648945, + 0.0001174700737465173, + 0.00012732982577290386, + 0.00015480577712878585 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4755859375, + "loss_eval": 1.464656114578247, + "epoch": 2 + }, + { + "hidden_norms": [ + 65.05919647216797, + 58.81830596923828, + 54.65021896362305, + 50.87609100341797, + 48.61247253417969 + ], + "bp_grad_per_sample_l2_med": [ + 9.24510313780047e-05, + 9.810000483412296e-05, + 0.00010529180872254074, + 0.00011547923350008205, + 0.00013095361646264791 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.509765625, + "loss_eval": 1.4144818782806396, + "epoch": 3 + }, + { + "hidden_norms": [ + 71.89185333251953, + 63.81675338745117, + 58.61539077758789, + 53.633819580078125, + 50.85374450683594 + ], + "bp_grad_per_sample_l2_med": [ + 9.624486119719222e-05, + 0.00010101673979079351, + 0.00010665278387023136, + 0.00011629729851847515, + 0.0001258883421542123 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5009765625, + "loss_eval": 1.4042909145355225, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.86115264892578, + 68.96236419677734, + 62.764793395996094, + 56.297122955322266, + 51.927825927734375 + ], + "bp_grad_per_sample_l2_med": [ + 8.636285201646388e-05, + 9.12561226869002e-05, + 9.721348760649562e-05, + 0.0001029788691084832, + 0.00010866572119994089 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5048828125, + "loss_eval": 1.362424373626709, + "epoch": 5 + }, + { + "hidden_norms": [ + 86.97894287109375, + 76.51913452148438, + 68.91358947753906, + 61.691619873046875, + 55.97148132324219 + ], + "bp_grad_per_sample_l2_med": [ + 8.555527165299281e-05, + 9.211624274030328e-05, + 9.770254109753296e-05, + 0.00010545850091148168, + 0.00011015798372682184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4990234375, + "loss_eval": 1.4210331439971924, + "epoch": 6 + }, + { + "hidden_norms": [ + 91.98681640625, + 80.48826599121094, + 72.19147491455078, + 63.2117919921875, + 57.618526458740234 + ], + "bp_grad_per_sample_l2_med": [ + 8.108472684398293e-05, + 8.69045325089246e-05, + 9.184813097817823e-05, + 9.785865404410288e-05, + 0.00010359002772020176 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.50390625, + "loss_eval": 1.395978569984436, + "epoch": 7 + }, + { + "hidden_norms": [ + 97.7012939453125, + 84.81765747070312, + 75.55701446533203, + 65.7588119506836, + 58.28969955444336 + ], + "bp_grad_per_sample_l2_med": [ + 8.22104630060494e-05, + 8.808301208773628e-05, + 9.288280853070319e-05, + 0.0001000006013782695, + 0.00010321019362891093 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.525390625, + "loss_eval": 1.3341916799545288, + "epoch": 8 + }, + { + "hidden_norms": [ + 102.29643249511719, + 88.3180923461914, + 78.02013397216797, + 67.14125061035156, + 59.45139694213867 + ], + "bp_grad_per_sample_l2_med": [ + 8.297000749735162e-05, + 8.909840107662603e-05, + 9.493192192167044e-05, + 0.00010043827933259308, + 0.00010197651863563806 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5166015625, + "loss_eval": 1.3378056287765503, + "epoch": 9 + }, + { + "hidden_norms": [ + 107.60400390625, + 93.19139862060547, + 81.3952407836914, + 70.16273498535156, + 61.15400314331055 + ], + "bp_grad_per_sample_l2_med": [ + 7.625297439517453e-05, + 8.249503298429772e-05, + 8.778223127592355e-05, + 9.526272333459929e-05, + 9.708418656373397e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.3057411909103394, + "epoch": 10 + }, + { + "hidden_norms": [ + 111.52012634277344, + 95.61714935302734, + 83.3553695678711, + 70.52283477783203, + 61.52479553222656 + ], + "bp_grad_per_sample_l2_med": [ + 7.589814777020365e-05, + 8.213706314563751e-05, + 8.74441975611262e-05, + 9.462270099902526e-05, + 9.573540592100471e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5400390625, + "loss_eval": 1.2877662181854248, + "epoch": 11 + }, + { + "hidden_norms": [ + 116.06771850585938, + 99.79177856445312, + 86.30980682373047, + 72.20254516601562, + 62.78416442871094 + ], + "bp_grad_per_sample_l2_med": [ + 7.193555939011276e-05, + 7.673310028621927e-05, + 8.175434049917385e-05, + 8.827414421830326e-05, + 9.135493019130081e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5478515625, + "loss_eval": 1.2685296535491943, + "epoch": 12 + }, + { + "hidden_norms": [ + 119.3271484375, + 102.65406799316406, + 88.69587707519531, + 74.90689849853516, + 63.780494689941406 + ], + "bp_grad_per_sample_l2_med": [ + 7.618113158969209e-05, + 8.220612653531134e-05, + 8.806472760625184e-05, + 9.463543392485008e-05, + 9.703192336019129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.276496410369873, + "epoch": 13 + }, + { + "hidden_norms": [ + 123.31849670410156, + 105.7769775390625, + 90.95068359375, + 76.97051239013672, + 64.97062683105469 + ], + "bp_grad_per_sample_l2_med": [ + 7.194027421064675e-05, + 7.883367652539164e-05, + 8.381865336559713e-05, + 9.018390846904367e-05, + 8.924194844439626e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.552734375, + "loss_eval": 1.2604155540466309, + "epoch": 14 + }, + { + "hidden_norms": [ + 127.73625946044922, + 109.2970199584961, + 94.82887268066406, + 79.42200469970703, + 66.68120574951172 + ], + "bp_grad_per_sample_l2_med": [ + 7.26957805454731e-05, + 7.816226570867002e-05, + 8.386534318560734e-05, + 9.044967737281695e-05, + 9.091151150641963e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.2421667575836182, + "epoch": 15 + }, + { + "hidden_norms": [ + 129.39227294921875, + 110.16195678710938, + 95.65125274658203, + 79.63654327392578, + 66.4422836303711 + ], + "bp_grad_per_sample_l2_med": [ + 7.170928438426927e-05, + 7.703503069933504e-05, + 8.211386011680588e-05, + 8.873116166796535e-05, + 9.066827624337748e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2539770603179932, + "epoch": 16 + }, + { + "hidden_norms": [ + 132.24916076660156, + 113.025634765625, + 96.19522857666016, + 80.5164566040039, + 67.23816680908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.194816862465814e-05, + 7.835567521397024e-05, + 8.341929060406983e-05, + 8.761802746448666e-05, + 8.926806913223118e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5732421875, + "loss_eval": 1.2596629858016968, + "epoch": 17 + }, + { + "hidden_norms": [ + 136.37730407714844, + 116.11273956298828, + 98.82146453857422, + 81.83920288085938, + 67.72627258300781 + ], + "bp_grad_per_sample_l2_med": [ + 7.331569941015914e-05, + 7.95917512732558e-05, + 8.647916547488421e-05, + 9.198131010634825e-05, + 9.28269510040991e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53515625, + "loss_eval": 1.2714436054229736, + "epoch": 18 + }, + { + "hidden_norms": [ + 137.7354736328125, + 119.1905288696289, + 102.62776184082031, + 84.3735580444336, + 69.55421447753906 + ], + "bp_grad_per_sample_l2_med": [ + 7.105377881089225e-05, + 7.70094629842788e-05, + 8.26972391223535e-05, + 8.802180673228577e-05, + 8.82365129655227e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.25264310836792, + "epoch": 19 + }, + { + "hidden_norms": [ + 139.01124572753906, + 119.05533599853516, + 101.28179168701172, + 83.50191497802734, + 68.7996826171875 + ], + "bp_grad_per_sample_l2_med": [ + 7.610249303979799e-05, + 8.31697034300305e-05, + 8.997280383482575e-05, + 9.514019620837644e-05, + 9.370686893817037e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.517578125, + "loss_eval": 1.2884626388549805, + "epoch": 20 + }, + { + "hidden_norms": [ + 142.8061981201172, + 121.41246795654297, + 104.47654724121094, + 86.13514709472656, + 70.62234497070312 + ], + "bp_grad_per_sample_l2_med": [ + 7.287831977009773e-05, + 7.990973244886845e-05, + 8.473258640151471e-05, + 9.054663678398356e-05, + 9.23949119169265e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.2458946704864502, + "epoch": 21 + }, + { + "hidden_norms": [ + 145.03463745117188, + 124.42599487304688, + 105.64387512207031, + 87.60891723632812, + 71.11911010742188 + ], + "bp_grad_per_sample_l2_med": [ + 6.878219573991373e-05, + 7.463164365617558e-05, + 7.942628144519404e-05, + 8.418951620114967e-05, + 8.709819667274132e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2031928300857544, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.368896484375, + 124.08200073242188, + 106.14088439941406, + 87.3053970336914, + 70.22563171386719 + ], + "bp_grad_per_sample_l2_med": [ + 6.987902452237904e-05, + 7.564797124359757e-05, + 8.058137609623373e-05, + 8.513103239238262e-05, + 8.664488268550485e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5830078125, + "loss_eval": 1.2048817873001099, + "epoch": 23 + }, + { + "hidden_norms": [ + 149.82542419433594, + 127.8211898803711, + 109.31559753417969, + 88.96003723144531, + 71.56672668457031 + ], + "bp_grad_per_sample_l2_med": [ + 7.123420073185116e-05, + 7.683804142288864e-05, + 8.418370271101594e-05, + 8.922854613047093e-05, + 8.777298353379592e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2408947944641113, + "epoch": 24 + }, + { + "hidden_norms": [ + 151.1898193359375, + 128.61166381835938, + 110.0819320678711, + 89.33537292480469, + 70.91573333740234 + ], + "bp_grad_per_sample_l2_med": [ + 7.046251994324848e-05, + 7.593455666210502e-05, + 8.183503086911514e-05, + 8.78809587447904e-05, + 8.738410542719066e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5849609375, + "loss_eval": 1.2345162630081177, + "epoch": 25 + }, + { + "hidden_norms": [ + 153.0899200439453, + 130.6381072998047, + 110.78546905517578, + 90.43073272705078, + 72.28581237792969 + ], + "bp_grad_per_sample_l2_med": [ + 7.224789442261681e-05, + 7.864048529881984e-05, + 8.493732457282022e-05, + 9.218508785124868e-05, + 9.127514931606129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.548828125, + "loss_eval": 1.234302282333374, + "epoch": 26 + }, + { + "hidden_norms": [ + 156.78964233398438, + 132.35365295410156, + 114.26016998291016, + 93.03483581542969, + 73.8830337524414 + ], + "bp_grad_per_sample_l2_med": [ + 7.004363578744233e-05, + 7.51781408325769e-05, + 8.189951768144965e-05, + 8.64862377056852e-05, + 8.457603689748794e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.226435661315918, + "epoch": 27 + }, + { + "hidden_norms": [ + 154.7094268798828, + 132.68295288085938, + 112.78950500488281, + 91.68452453613281, + 72.69532012939453 + ], + "bp_grad_per_sample_l2_med": [ + 6.871543155284598e-05, + 7.408537931041792e-05, + 7.912247383501381e-05, + 8.584219176555052e-05, + 8.712658018339425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.186962604522705, + "epoch": 28 + }, + { + "hidden_norms": [ + 156.5343475341797, + 133.95303344726562, + 113.44208526611328, + 91.55599212646484, + 72.66578674316406 + ], + "bp_grad_per_sample_l2_med": [ + 6.697547360090539e-05, + 7.314077083719894e-05, + 7.949489372549579e-05, + 8.466470171697438e-05, + 8.366732799913734e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.1845954656600952, + "epoch": 29 + }, + { + "hidden_norms": [ + 158.63601684570312, + 134.8338165283203, + 115.27066802978516, + 93.78146362304688, + 72.8468017578125 + ], + "bp_grad_per_sample_l2_med": [ + 6.742558616679162e-05, + 7.408189412672073e-05, + 7.9598423326388e-05, + 8.415436604991555e-05, + 8.754149166634306e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.208282470703125, + "epoch": 30 + }, + { + "hidden_norms": [ + 158.21023559570312, + 136.07545471191406, + 116.15364837646484, + 93.98001098632812, + 73.68004608154297 + ], + "bp_grad_per_sample_l2_med": [ + 7.207741873571649e-05, + 7.860636833356693e-05, + 8.520736446371302e-05, + 9.168307587970048e-05, + 8.956313104135916e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.2018094062805176, + "epoch": 31 + }, + { + "hidden_norms": [ + 160.46771240234375, + 136.1265411376953, + 116.0124282836914, + 93.3584976196289, + 73.7890396118164 + ], + "bp_grad_per_sample_l2_med": [ + 7.191704207798466e-05, + 7.717879634583369e-05, + 8.299856563098729e-05, + 8.967710164142773e-05, + 8.699094178155065e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1889103651046753, + "epoch": 32 + }, + { + "hidden_norms": [ + 160.90545654296875, + 137.0214080810547, + 115.83223724365234, + 94.28914642333984, + 73.96448516845703 + ], + "bp_grad_per_sample_l2_med": [ + 7.10546228219755e-05, + 7.790922973072156e-05, + 8.321165660163388e-05, + 8.87274945853278e-05, + 8.640237501822412e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1516971588134766, + "epoch": 33 + }, + { + "hidden_norms": [ + 163.9844207763672, + 138.9420166015625, + 118.25187683105469, + 94.9247817993164, + 73.99342346191406 + ], + "bp_grad_per_sample_l2_med": [ + 7.05249622114934e-05, + 7.705103053012863e-05, + 8.39303684188053e-05, + 8.84484761627391e-05, + 8.569705096306279e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1713684797286987, + "epoch": 34 + }, + { + "hidden_norms": [ + 162.2567596435547, + 139.536376953125, + 118.07953643798828, + 96.10607147216797, + 75.22054290771484 + ], + "bp_grad_per_sample_l2_med": [ + 6.98907533660531e-05, + 7.564698171336204e-05, + 8.246934885391966e-05, + 8.673300180817023e-05, + 8.65447727846913e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1986680030822754, + "epoch": 35 + }, + { + "hidden_norms": [ + 163.85494995117188, + 140.6683807373047, + 120.20167541503906, + 96.79766845703125, + 74.6565933227539 + ], + "bp_grad_per_sample_l2_med": [ + 6.933045369805768e-05, + 7.555640331702307e-05, + 8.187161438399926e-05, + 8.634777623228729e-05, + 8.516138041159138e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58203125, + "loss_eval": 1.17092764377594, + "epoch": 36 + }, + { + "hidden_norms": [ + 163.91464233398438, + 141.8627166748047, + 120.35345458984375, + 96.861083984375, + 74.91275024414062 + ], + "bp_grad_per_sample_l2_med": [ + 6.821981514804065e-05, + 7.462653593393043e-05, + 7.9863122664392e-05, + 8.513165812473744e-05, + 8.408474968746305e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1603121757507324, + "epoch": 37 + }, + { + "hidden_norms": [ + 166.6566162109375, + 142.48072814941406, + 120.16492462158203, + 96.4870376586914, + 75.0911636352539 + ], + "bp_grad_per_sample_l2_med": [ + 6.862134614493698e-05, + 7.509759598178789e-05, + 8.221028838306665e-05, + 8.709747635293752e-05, + 8.625433838460594e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.163398027420044, + "epoch": 38 + }, + { + "hidden_norms": [ + 165.2766571044922, + 140.6273193359375, + 119.01939392089844, + 96.45698547363281, + 74.86931610107422 + ], + "bp_grad_per_sample_l2_med": [ + 6.741421384504065e-05, + 7.467559044016525e-05, + 8.113843068713322e-05, + 8.498551324009895e-05, + 8.365403482457623e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1174335479736328, + "epoch": 39 + }, + { + "hidden_norms": [ + 166.8720703125, + 141.94195556640625, + 119.73834228515625, + 96.83306884765625, + 75.50749206542969 + ], + "bp_grad_per_sample_l2_med": [ + 6.83375183143653e-05, + 7.506174733862281e-05, + 8.1863887317013e-05, + 8.717682067072019e-05, + 8.521847485098988e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.128427267074585, + "epoch": 40 + }, + { + "hidden_norms": [ + 166.10345458984375, + 140.8309783935547, + 119.59312438964844, + 96.5144271850586, + 75.01549530029297 + ], + "bp_grad_per_sample_l2_med": [ + 7.117655331967399e-05, + 7.808134250808507e-05, + 8.549879566999152e-05, + 9.121275070356205e-05, + 8.961764251580462e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1407405138015747, + "epoch": 41 + }, + { + "hidden_norms": [ + 168.5572052001953, + 144.19313049316406, + 121.29338836669922, + 98.18904113769531, + 75.74433898925781 + ], + "bp_grad_per_sample_l2_med": [ + 7.024689693935215e-05, + 7.835906581021845e-05, + 8.28477568575181e-05, + 8.988843183033168e-05, + 9.142952330876142e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.188612699508667, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.82464599609375, + 142.2963104248047, + 120.96216583251953, + 98.01409149169922, + 76.0032730102539 + ], + "bp_grad_per_sample_l2_med": [ + 7.296045077964664e-05, + 7.839543832233176e-05, + 8.31817596917972e-05, + 9.021619916893542e-05, + 8.68452261784114e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1675610542297363, + "epoch": 43 + }, + { + "hidden_norms": [ + 168.66015625, + 143.3383026123047, + 121.46915435791016, + 97.43902587890625, + 75.26473236083984 + ], + "bp_grad_per_sample_l2_med": [ + 7.207799353636801e-05, + 8.018259541131556e-05, + 8.563740993849933e-05, + 9.22580948099494e-05, + 9.03013497008942e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1672401428222656, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.55662536621094, + 142.82704162597656, + 120.73102569580078, + 96.30245971679688, + 74.20568084716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.172006007749587e-05, + 7.97949469415471e-05, + 8.564699237467721e-05, + 9.092836262425408e-05, + 9.031151421368122e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1739519834518433, + "epoch": 45 + }, + { + "hidden_norms": [ + 169.05859375, + 143.376953125, + 122.22779083251953, + 98.1865234375, + 75.46460723876953 + ], + "bp_grad_per_sample_l2_med": [ + 7.164492853917181e-05, + 8.059864194365218e-05, + 8.811463339952752e-05, + 9.420064452569932e-05, + 9.068247891264036e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1654919385910034, + "epoch": 46 + }, + { + "hidden_norms": [ + 167.85174560546875, + 143.98324584960938, + 121.09931945800781, + 97.61621856689453, + 75.3441390991211 + ], + "bp_grad_per_sample_l2_med": [ + 7.121654198272154e-05, + 7.876066229073331e-05, + 8.58678831718862e-05, + 9.374372893944383e-05, + 8.886006980901584e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6015625, + "loss_eval": 1.1619040966033936, + "epoch": 47 + }, + { + "hidden_norms": [ + 169.16136169433594, + 144.1681671142578, + 121.65021514892578, + 97.65489959716797, + 75.40325927734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.085441029630601e-05, + 7.872789865359664e-05, + 8.54654426802881e-05, + 9.159239561995491e-05, + 8.735150913707912e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1553215980529785, + "epoch": 48 + }, + { + "hidden_norms": [ + 170.07469177246094, + 144.21502685546875, + 122.42488098144531, + 97.60433959960938, + 75.30228424072266 + ], + "bp_grad_per_sample_l2_med": [ + 7.460799679392949e-05, + 8.310206612804905e-05, + 8.914316276786849e-05, + 9.709167352411896e-05, + 9.34089912334457e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5947265625, + "loss_eval": 1.1511603593826294, + "epoch": 49 + }, + { + "hidden_norms": [ + 169.58541870117188, + 143.38230895996094, + 121.96705627441406, + 97.77040100097656, + 74.732177734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.605904102092609e-05, + 8.306169183924794e-05, + 9.093777771340683e-05, + 9.604891965864226e-05, + 9.101478644879535e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.583984375, + "loss_eval": 1.150202751159668, + "epoch": 50 + }, + { + "hidden_norms": [ + 169.28955078125, + 143.6193084716797, + 122.43891906738281, + 97.91162109375, + 75.27656555175781 + ], + "bp_grad_per_sample_l2_med": [ + 7.325071055674925e-05, + 8.037279621930793e-05, + 8.85110639501363e-05, + 9.169802797259763e-05, + 8.926681766752154e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.1172325611114502, + "epoch": 51 + }, + { + "hidden_norms": [ + 170.01052856445312, + 143.45779418945312, + 122.65426635742188, + 98.24798583984375, + 75.68919372558594 + ], + "bp_grad_per_sample_l2_med": [ + 7.252323121065274e-05, + 8.011860336409882e-05, + 8.620596781838685e-05, + 9.34487470658496e-05, + 9.04093321878463e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1147592067718506, + "epoch": 52 + }, + { + "hidden_norms": [ + 168.67430114746094, + 143.25802612304688, + 119.88789367675781, + 96.92530822753906, + 74.42180633544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.410924445139244e-05, + 8.137265831464902e-05, + 8.864435949362814e-05, + 9.472777310293168e-05, + 9.015527029987425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.625, + "loss_eval": 1.1209393739700317, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.25973510742188, + 142.8248291015625, + 120.75433349609375, + 96.85049438476562, + 74.96371459960938 + ], + "bp_grad_per_sample_l2_med": [ + 7.351540989475325e-05, + 8.063198038144037e-05, + 8.647661161376163e-05, + 9.411892096977681e-05, + 9.352037159260362e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1025673151016235, + "epoch": 54 + }, + { + "hidden_norms": [ + 170.8097381591797, + 143.562744140625, + 121.1410903930664, + 97.70262145996094, + 75.55540466308594 + ], + "bp_grad_per_sample_l2_med": [ + 7.382583135040477e-05, + 8.104312291834503e-05, + 8.895712380763143e-05, + 9.191031131194904e-05, + 8.924967551138252e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1013734340667725, + "epoch": 55 + }, + { + "hidden_norms": [ + 169.41827392578125, + 143.60491943359375, + 119.79347229003906, + 96.5761947631836, + 74.94788360595703 + ], + "bp_grad_per_sample_l2_med": [ + 7.506331166950986e-05, + 8.308376709464937e-05, + 9.05599954421632e-05, + 9.552844858262688e-05, + 9.322594269178808e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1202704906463623, + "epoch": 56 + }, + { + "hidden_norms": [ + 169.0540008544922, + 144.03970336914062, + 121.87033081054688, + 98.80317687988281, + 76.42084503173828 + ], + "bp_grad_per_sample_l2_med": [ + 7.446128438459709e-05, + 8.153915405273438e-05, + 8.840708323987201e-05, + 9.388235048390925e-05, + 9.186066017718986e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.1205706596374512, + "epoch": 57 + }, + { + "hidden_norms": [ + 168.36595153808594, + 141.80178833007812, + 120.2418212890625, + 96.8748779296875, + 75.01248168945312 + ], + "bp_grad_per_sample_l2_med": [ + 7.731275400146842e-05, + 8.405288099311292e-05, + 9.186116949422285e-05, + 9.942329052137211e-05, + 9.51286856434308e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1108977794647217, + "epoch": 58 + }, + { + "hidden_norms": [ + 169.39569091796875, + 142.4537353515625, + 120.81804656982422, + 97.19158172607422, + 75.20236206054688 + ], + "bp_grad_per_sample_l2_med": [ + 7.883378566475585e-05, + 8.777670154813677e-05, + 9.416328248335049e-05, + 0.00010057339386548847, + 9.685986879048869e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1141078472137451, + "epoch": 59 + }, + { + "hidden_norms": [ + 169.97256469726562, + 143.7432098388672, + 121.0943832397461, + 97.53318786621094, + 75.44910430908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.617164374096319e-05, + 8.471525507047772e-05, + 9.014597890200093e-05, + 9.796666563488543e-05, + 9.110565588343889e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0869580507278442, + "epoch": 60 + }, + { + "hidden_norms": [ + 168.3030242919922, + 142.93931579589844, + 120.8933334350586, + 97.99317932128906, + 75.29071044921875 + ], + "bp_grad_per_sample_l2_med": [ + 7.692870713071898e-05, + 8.63347522681579e-05, + 9.28592708078213e-05, + 9.994371794164181e-05, + 9.114396380027756e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6357421875, + "loss_eval": 1.102014183998108, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.24777221679688, + 142.03550720214844, + 120.25982666015625, + 97.82561492919922, + 75.54430389404297 + ], + "bp_grad_per_sample_l2_med": [ + 7.734074461041018e-05, + 8.487069862894714e-05, + 9.25088970689103e-05, + 9.827558096731082e-05, + 9.154371218755841e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0736993551254272, + "epoch": 62 + }, + { + "hidden_norms": [ + 168.08807373046875, + 142.24661254882812, + 119.9559555053711, + 96.72630310058594, + 74.6895523071289 + ], + "bp_grad_per_sample_l2_med": [ + 8.049221651162952e-05, + 8.925019210437313e-05, + 9.64810824370943e-05, + 0.00010555233166087419, + 9.567404049448669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.0822858810424805, + "epoch": 63 + }, + { + "hidden_norms": [ + 167.2539825439453, + 141.55946350097656, + 119.37681579589844, + 97.13011169433594, + 75.02286529541016 + ], + "bp_grad_per_sample_l2_med": [ + 7.919344352558255e-05, + 8.567116310587153e-05, + 9.377488458994776e-05, + 9.892786329146475e-05, + 9.566175140207633e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.1096018552780151, + "epoch": 64 + }, + { + "hidden_norms": [ + 168.11643981933594, + 142.01052856445312, + 119.23418426513672, + 96.38211059570312, + 75.08849334716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.787172216922045e-05, + 8.574797539040446e-05, + 9.008680353872478e-05, + 9.943459735950455e-05, + 9.4872091722209e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1080338954925537, + "epoch": 65 + }, + { + "hidden_norms": [ + 168.09153747558594, + 141.83984375, + 120.16891479492188, + 97.12582397460938, + 74.98177337646484 + ], + "bp_grad_per_sample_l2_med": [ + 7.894716691225767e-05, + 8.66493719513528e-05, + 9.518097795080394e-05, + 0.00010154353367397562, + 9.530662646284327e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1069355010986328, + "epoch": 66 + }, + { + "hidden_norms": [ + 167.35382080078125, + 142.33642578125, + 120.0411148071289, + 96.53257751464844, + 75.0328598022461 + ], + "bp_grad_per_sample_l2_med": [ + 7.973265019245446e-05, + 8.856245403876528e-05, + 9.601243800716475e-05, + 0.00010215263318968937, + 9.676075569586828e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.100548505783081, + "epoch": 67 + }, + { + "hidden_norms": [ + 167.418701171875, + 140.93800354003906, + 119.4802017211914, + 96.3717269897461, + 74.67574310302734 + ], + "bp_grad_per_sample_l2_med": [ + 8.022025576792657e-05, + 8.782520308159292e-05, + 9.638317715143785e-05, + 0.0001046421384671703, + 9.856691031018272e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1227837800979614, + "epoch": 68 + }, + { + "hidden_norms": [ + 166.9136962890625, + 140.45266723632812, + 119.06848907470703, + 95.9060287475586, + 74.79631042480469 + ], + "bp_grad_per_sample_l2_med": [ + 7.995362102519721e-05, + 8.583935414208099e-05, + 9.508246148470789e-05, + 0.00010096231562783942, + 9.634289017412812e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1006299257278442, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.4694366455078, + 139.69601440429688, + 117.53054809570312, + 95.05348205566406, + 74.65673065185547 + ], + "bp_grad_per_sample_l2_med": [ + 7.79753245296888e-05, + 8.487935701850802e-05, + 9.169900295091793e-05, + 9.879520075628534e-05, + 9.398034308105707e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.0988688468933105, + "epoch": 70 + }, + { + "hidden_norms": [ + 165.3974609375, + 139.54141235351562, + 117.3493881225586, + 94.9970474243164, + 74.31880187988281 + ], + "bp_grad_per_sample_l2_med": [ + 7.893131260061637e-05, + 8.71433803695254e-05, + 9.492320532444865e-05, + 0.00010128845315193757, + 9.578587196301669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6484375, + "loss_eval": 1.0860004425048828, + "epoch": 71 + }, + { + "hidden_norms": [ + 165.16651916503906, + 138.63233947753906, + 117.15692138671875, + 94.41555786132812, + 74.16561889648438 + ], + "bp_grad_per_sample_l2_med": [ + 8.611902012489736e-05, + 9.412867802893743e-05, + 0.0001005554513540119, + 0.00010507499246159568, + 0.00010004997602663934 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0985480546951294, + "epoch": 72 + }, + { + "hidden_norms": [ + 166.48802185058594, + 139.67433166503906, + 117.13744354248047, + 94.41883087158203, + 74.25392150878906 + ], + "bp_grad_per_sample_l2_med": [ + 8.272679406218231e-05, + 9.101553587242961e-05, + 9.994471474783495e-05, + 0.00010372102406108752, + 9.65072977123782e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1026251316070557, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.66531372070312, + 138.62359619140625, + 117.72949981689453, + 95.40411376953125, + 74.5541763305664 + ], + "bp_grad_per_sample_l2_med": [ + 8.516917296219617e-05, + 9.385120938532054e-05, + 0.00010402742918813601, + 0.00010775420378195122, + 0.00010169474262511358 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6298828125, + "loss_eval": 1.1083872318267822, + "epoch": 74 + }, + { + "hidden_norms": [ + 164.67889404296875, + 138.3468017578125, + 116.61951446533203, + 93.94100952148438, + 74.09746551513672 + ], + "bp_grad_per_sample_l2_med": [ + 8.641117165097967e-05, + 9.53027411014773e-05, + 0.0001029834384098649, + 0.0001086485426640138, + 0.0001005055892164819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1155339479446411, + "epoch": 75 + }, + { + "hidden_norms": [ + 164.2607421875, + 138.0647735595703, + 116.18480682373047, + 93.95038604736328, + 73.88935089111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.567768963985145e-05, + 9.307480650022626e-05, + 9.939757728716359e-05, + 0.00010579575609881431, + 9.849719936028123e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.1126312017440796, + "epoch": 76 + }, + { + "hidden_norms": [ + 163.9792938232422, + 137.88185119628906, + 116.34628295898438, + 93.93537139892578, + 73.83805084228516 + ], + "bp_grad_per_sample_l2_med": [ + 8.795045869192109e-05, + 9.678495553089306e-05, + 0.00010362159082433209, + 0.0001105417322833091, + 0.00010525066318223253 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.110876202583313, + "epoch": 77 + }, + { + "hidden_norms": [ + 164.1384735107422, + 137.82691955566406, + 115.94445037841797, + 94.01095581054688, + 73.68436431884766 + ], + "bp_grad_per_sample_l2_med": [ + 8.610311488155276e-05, + 9.507987851975486e-05, + 0.00010208813182543963, + 0.00010807226499309763, + 0.00010176940850215033 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1176977157592773, + "epoch": 78 + }, + { + "hidden_norms": [ + 163.91049194335938, + 136.9142608642578, + 115.37925720214844, + 93.2219009399414, + 73.2654800415039 + ], + "bp_grad_per_sample_l2_med": [ + 8.745997183723375e-05, + 9.566589869791642e-05, + 0.00010251311323372647, + 0.00011129804624943063, + 0.0001056971013895236 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1140623092651367, + "epoch": 79 + }, + { + "hidden_norms": [ + 163.40182495117188, + 137.21026611328125, + 115.46720123291016, + 93.46426391601562, + 73.12786102294922 + ], + "bp_grad_per_sample_l2_med": [ + 8.96864221431315e-05, + 9.8639284260571e-05, + 0.0001043426527758129, + 0.00010869379184441641, + 0.00010685920278774574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.1114736795425415, + "epoch": 80 + }, + { + "hidden_norms": [ + 163.22100830078125, + 136.5157012939453, + 115.2002944946289, + 93.15667724609375, + 73.07371520996094 + ], + "bp_grad_per_sample_l2_med": [ + 8.870210876921192e-05, + 9.846940520219505e-05, + 0.0001080361835192889, + 0.0001128382355091162, + 0.00010244990698993206 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1125456094741821, + "epoch": 81 + }, + { + "hidden_norms": [ + 163.21449279785156, + 136.63999938964844, + 114.51496124267578, + 92.76043701171875, + 73.22138214111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.551862265449017e-05, + 9.3683076556772e-05, + 0.00010453341383254156, + 0.00010722207662183791, + 0.00010129058500751853 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0996887683868408, + "epoch": 82 + }, + { + "hidden_norms": [ + 162.75770568847656, + 136.49710083007812, + 114.6112060546875, + 92.87682342529297, + 73.25039672851562 + ], + "bp_grad_per_sample_l2_med": [ + 8.870910096447915e-05, + 9.74184149526991e-05, + 0.00010446018859511241, + 0.00011418589565437287, + 0.00010412647679913789 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1063097715377808, + "epoch": 83 + }, + { + "hidden_norms": [ + 163.11697387695312, + 136.4162139892578, + 114.9229507446289, + 93.17060089111328, + 73.40281677246094 + ], + "bp_grad_per_sample_l2_med": [ + 8.790192077867687e-05, + 9.763163689058274e-05, + 0.00010599731467664242, + 0.00011016600910807028, + 0.00010507069964660332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1009955406188965, + "epoch": 84 + }, + { + "hidden_norms": [ + 162.4318389892578, + 136.2643280029297, + 114.47940826416016, + 92.43824005126953, + 72.75123596191406 + ], + "bp_grad_per_sample_l2_med": [ + 8.680798055138439e-05, + 9.524248889647424e-05, + 0.00010346775525249541, + 0.00010771532106446102, + 0.00010157373617403209 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.106760025024414, + "epoch": 85 + }, + { + "hidden_norms": [ + 162.55992126464844, + 136.00660705566406, + 114.44908142089844, + 92.65226745605469, + 73.14122772216797 + ], + "bp_grad_per_sample_l2_med": [ + 8.55888138175942e-05, + 9.422176663065329e-05, + 0.00010130204464076087, + 0.0001082807284547016, + 0.00010286335600540042 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1080232858657837, + "epoch": 86 + }, + { + "hidden_norms": [ + 162.33607482910156, + 136.22657775878906, + 114.64276885986328, + 92.26687622070312, + 72.99312591552734 + ], + "bp_grad_per_sample_l2_med": [ + 9.005892934510484e-05, + 9.746963041834533e-05, + 0.00010383747576270252, + 0.00010905141971306875, + 0.00010293527157045901 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.0989083051681519, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.69874572753906, + 135.9654998779297, + 113.88583374023438, + 91.72888946533203, + 72.5824966430664 + ], + "bp_grad_per_sample_l2_med": [ + 9.02136744116433e-05, + 9.903020691126585e-05, + 0.0001059234855347313, + 0.00011399909999454394, + 0.00010543780081206933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1039698123931885, + "epoch": 88 + }, + { + "hidden_norms": [ + 162.3827362060547, + 136.0760498046875, + 114.07840728759766, + 91.95870971679688, + 72.59473419189453 + ], + "bp_grad_per_sample_l2_med": [ + 9.043919999385253e-05, + 9.950586536433548e-05, + 0.00010800046584336087, + 0.00011628754145931453, + 0.00010360861051594839 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1007411479949951, + "epoch": 89 + }, + { + "hidden_norms": [ + 161.50054931640625, + 135.7166748046875, + 113.83382415771484, + 91.96630096435547, + 72.61833953857422 + ], + "bp_grad_per_sample_l2_med": [ + 9.075389243662357e-05, + 9.988105011871085e-05, + 0.00010788880899781361, + 0.00011431374150561169, + 0.00010596351057756692 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.64453125, + "loss_eval": 1.0992103815078735, + "epoch": 90 + }, + { + "hidden_norms": [ + 161.48770141601562, + 135.71417236328125, + 114.12840270996094, + 91.98160552978516, + 72.64606475830078 + ], + "bp_grad_per_sample_l2_med": [ + 9.050803782884032e-05, + 9.805837908061221e-05, + 0.00010800142626976594, + 0.00011649157386273146, + 0.00010660875705070794 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.1021543741226196, + "epoch": 91 + }, + { + "hidden_norms": [ + 162.0372314453125, + 135.4561767578125, + 114.00292205810547, + 91.83483123779297, + 72.68809509277344 + ], + "bp_grad_per_sample_l2_med": [ + 8.82204039953649e-05, + 9.769284224603325e-05, + 0.00010632916382746771, + 0.00011439422814873978, + 0.00010489066335139796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1001535654067993, + "epoch": 92 + }, + { + "hidden_norms": [ + 161.88534545898438, + 135.54629516601562, + 113.90684509277344, + 91.81143188476562, + 72.64588165283203 + ], + "bp_grad_per_sample_l2_med": [ + 9.120439790422097e-05, + 9.779920219443738e-05, + 0.00010798833682201803, + 0.00011447365250205621, + 0.00010797424329211935 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0961315631866455, + "epoch": 93 + }, + { + "hidden_norms": [ + 162.06427001953125, + 135.49281311035156, + 113.69275665283203, + 91.76304626464844, + 72.4867935180664 + ], + "bp_grad_per_sample_l2_med": [ + 9.100054739974439e-05, + 9.935065463650972e-05, + 0.00010879126784857363, + 0.00011589765199460089, + 0.00010837834270205349 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.097299337387085, + "epoch": 94 + }, + { + "hidden_norms": [ + 162.06063842773438, + 135.57981872558594, + 113.76399230957031, + 91.94515991210938, + 72.56278991699219 + ], + "bp_grad_per_sample_l2_med": [ + 9.139141184277833e-05, + 9.897649579215795e-05, + 0.00010867504897760227, + 0.0001159063758677803, + 0.00010943930828943849 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6376953125, + "loss_eval": 1.0986907482147217, + "epoch": 95 + }, + { + "hidden_norms": [ + 161.8842315673828, + 135.4130859375, + 113.66045379638672, + 91.80276489257812, + 72.58989715576172 + ], + "bp_grad_per_sample_l2_med": [ + 9.080857125809416e-05, + 0.00010123007814399898, + 0.00010883246432058513, + 0.00011908033775398508, + 0.00010963032400468364 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0988240242004395, + "epoch": 96 + }, + { + "hidden_norms": [ + 161.86744689941406, + 135.38331604003906, + 113.66378784179688, + 91.70223236083984, + 72.4896240234375 + ], + "bp_grad_per_sample_l2_med": [ + 9.091695392271504e-05, + 0.00010080484207719564, + 0.00010940106585621834, + 0.00011762498616008088, + 0.00010917771578533575 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987744331359863, + "epoch": 97 + }, + { + "hidden_norms": [ + 161.89633178710938, + 135.33140563964844, + 113.67347717285156, + 91.68895721435547, + 72.49469757080078 + ], + "bp_grad_per_sample_l2_med": [ + 9.099576709559187e-05, + 0.00010038664186140522, + 0.0001086170959752053, + 0.00011788319534389302, + 0.00010914496670011431 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0990701913833618, + "epoch": 98 + }, + { + "hidden_norms": [ + 161.9002227783203, + 135.33474731445312, + 113.68601989746094, + 91.69290924072266, + 72.48957061767578 + ], + "bp_grad_per_sample_l2_med": [ + 9.096309076994658e-05, + 0.00010059915803140029, + 0.00010838409070856869, + 0.00011784962407546118, + 0.00010893247235799208 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.098876953125, + "epoch": 99 + }, + { + "hidden_norms": [ + 161.8989715576172, + 135.33889770507812, + 113.69281768798828, + 91.6856689453125, + 72.48480224609375 + ], + "bp_grad_per_sample_l2_med": [ + 9.085259807761759e-05, + 0.00010061707871500403, + 0.00010823038610396907, + 0.00011745247320504859, + 0.00010919221676886082 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987944602966309, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": 0.007568402143078856, + "gamma_dfa_per_layer": [ + 0.002326551591977477, + 0.0009101498289965093, + -0.013218702748417854, + 0.04025560989975929 + ], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 536.5761108398438, + 845.265625, + 979.7896118164062, + 1192.0323486328125, + 1230.83935546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006465085316449404, + 0.0006462159799411893, + 0.0006460825679823756, + 0.0006459451396949589, + 0.0006460213917307556 + ], + "gamma_dfa": 0.013024769607000053, + "gamma_dfa_per_layer": [ + 0.035579413175582886, + -0.0025600260123610497, + -0.0014369464479386806, + 0.020516637712717056 + ], + "acc_eval": 0.212890625, + "loss_eval": 8.137651443481445, + "epoch": 1 + }, + { + "hidden_norms": [ + 886.7508544921875, + 1871.2640380859375, + 2198.631591796875, + 2689.22412109375, + 2904.254150390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007187994197010994, + 0.0007172312471084297, + 0.0007172476034611464, + 0.0007177897496148944, + 0.000717311049811542 + ], + "gamma_dfa": 0.004487544531002641, + "gamma_dfa_per_layer": [ + 0.04744107276201248, + -0.011962954886257648, + -0.02088175155222416, + 0.003353811800479889 + ], + "acc_eval": 0.203125, + "loss_eval": 16.637451171875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1117.1649169921875, + 3064.644775390625, + 3849.060546875, + 4987.09130859375, + 5690.720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000734492321498692, + 0.0007317167473956943, + 0.0007317643612623215, + 0.0007318624993786216, + 0.0007319750147871673 + ], + "gamma_dfa": 0.0065072893630713224, + "gamma_dfa_per_layer": [ + 0.0597357451915741, + -0.0063293795101344585, + -0.033218011260032654, + 0.0058408030308783054 + ], + "acc_eval": 0.224609375, + "loss_eval": 29.753459930419922, + "epoch": 3 + }, + { + "hidden_norms": [ + 1279.7017822265625, + 4015.093017578125, + 5594.23828125, + 7459.69091796875, + 8727.64453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007434640428982675, + 0.0007419881876558065, + 0.0007416673470288515, + 0.000741377065423876, + 0.0007413675775751472 + ], + "gamma_dfa": 0.0072651703376322985, + "gamma_dfa_per_layer": [ + 0.07467889785766602, + -0.02277005836367607, + -0.009787362068891525, + -0.013060796074569225 + ], + "acc_eval": 0.1640625, + "loss_eval": 54.22368621826172, + "epoch": 4 + }, + { + "hidden_norms": [ + 1399.06787109375, + 4862.35302734375, + 9250.7666015625, + 10789.8828125, + 12902.6591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007491935975849628, + 0.0007442779606208205, + 0.0007423132774420083, + 0.0007422835915349424, + 0.0007422153139486909 + ], + "gamma_dfa": -0.005301014054566622, + "gamma_dfa_per_layer": [ + 0.06516245007514954, + -0.03411812335252762, + -0.034175027161836624, + -0.01807335577905178 + ], + "acc_eval": 0.2080078125, + "loss_eval": 62.78772735595703, + "epoch": 5 + }, + { + "hidden_norms": [ + 1478.1070556640625, + 5865.33935546875, + 15407.5283203125, + 16717.609375, + 19284.30078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000746070989407599, + 0.0007320672739297152, + 0.0007320406148210168, + 0.0007324790931306779, + 0.0007322196033783257 + ], + "gamma_dfa": -0.0043716938234865665, + "gamma_dfa_per_layer": [ + 0.0889529138803482, + -0.03475068882107735, + -0.06096648424863815, + -0.010722516104578972 + ], + "acc_eval": 0.21875, + "loss_eval": 84.72342681884766, + "epoch": 6 + }, + { + "hidden_norms": [ + 1569.764892578125, + 7991.109375, + 22041.46484375, + 23657.2890625, + 27372.69140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007371728424914181, + 0.0007328476058319211, + 0.0007317248382605612, + 0.0007321859593503177, + 0.0007314819958992302 + ], + "gamma_dfa": -0.006586531409993768, + "gamma_dfa_per_layer": [ + 0.08020298182964325, + -0.038106564432382584, + -0.05412164330482483, + -0.014320899732410908 + ], + "acc_eval": 0.21484375, + "loss_eval": 87.40310668945312, + "epoch": 7 + }, + { + "hidden_norms": [ + 1649.8133544921875, + 12248.005859375, + 30825.916015625, + 32827.55078125, + 38153.3828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007630810141563416, + 0.0007434195140376687, + 0.0007433100836351514, + 0.0007435025763697922, + 0.0007434298167936504 + ], + "gamma_dfa": -0.0035092607140541077, + "gamma_dfa_per_layer": [ + 0.1012866348028183, + -0.029570601880550385, + -0.04660683125257492, + -0.039146244525909424 + ], + "acc_eval": 0.1708984375, + "loss_eval": 157.51614379882812, + "epoch": 8 + }, + { + "hidden_norms": [ + 1712.73193359375, + 20302.939453125, + 43360.37109375, + 46000.90234375, + 53154.84765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007849909015931189, + 0.0007540763472206891, + 0.0007541946833953261, + 0.0007542177918367088, + 0.0007542550447396934 + ], + "gamma_dfa": 0.006478439085185528, + "gamma_dfa_per_layer": [ + 0.1487787812948227, + -0.03583626449108124, + -0.0212298221886158, + -0.06579893827438354 + ], + "acc_eval": 0.138671875, + "loss_eval": 512.7744750976562, + "epoch": 9 + }, + { + "hidden_norms": [ + 1763.957763671875, + 29818.015625, + 57092.5546875, + 60514.234375, + 69695.1015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00080581457586959, + 0.0007400442264042795, + 0.0007398677407763898, + 0.0007363590411841869, + 0.0007358043803833425 + ], + "gamma_dfa": -0.003822646103799343, + "gamma_dfa_per_layer": [ + 0.1044168770313263, + -0.0318819060921669, + -0.054846249520778656, + -0.03297930583357811 + ], + "acc_eval": 0.203125, + "loss_eval": 288.6083984375, + "epoch": 10 + }, + { + "hidden_norms": [ + 1841.6363525390625, + 43646.69921875, + 76665.53125, + 80991.453125, + 91946.4765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008064995636232197, + 0.0007405033684335649, + 0.0007410499965772033, + 0.0007410682155750692, + 0.0007410107646137476 + ], + "gamma_dfa": -0.005903353448957205, + "gamma_dfa_per_layer": [ + 0.15344271063804626, + -0.06077828258275986, + -0.0893951952457428, + -0.02688264660537243 + ], + "acc_eval": 0.1630859375, + "loss_eval": 462.175537109375, + "epoch": 11 + }, + { + "hidden_norms": [ + 1938.4581298828125, + 63804.453125, + 101178.828125, + 106970.6171875, + 119676.0390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008472055778838694, + 0.0007312041707336903, + 0.0007307010819204152, + 0.0007308369968086481, + 0.000730738160200417 + ], + "gamma_dfa": 0.015948185697197914, + "gamma_dfa_per_layer": [ + 0.19398558139801025, + -0.05326637625694275, + -0.057601772248744965, + -0.019324690103530884 + ], + "acc_eval": 0.1572265625, + "loss_eval": 481.7687072753906, + "epoch": 12 + }, + { + "hidden_norms": [ + 2059.50390625, + 86267.453125, + 127668.078125, + 134690.953125, + 148832.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008536268142051995, + 0.0007572658942081034, + 0.0007572331232950091, + 0.0007572534959763288, + 0.0007572824251838028 + ], + "gamma_dfa": 0.007115887477993965, + "gamma_dfa_per_layer": [ + 0.19894848763942719, + -0.06199394166469574, + -0.04606857895851135, + -0.06242241710424423 + ], + "acc_eval": 0.162109375, + "loss_eval": 442.7697448730469, + "epoch": 13 + }, + { + "hidden_norms": [ + 2162.650390625, + 111971.2421875, + 158544.5, + 167081.546875, + 183230.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009137325105257332, + 0.0007456843741238117, + 0.0007456432213075459, + 0.0007455914164893329, + 0.0007455993909388781 + ], + "gamma_dfa": 0.008699490688741207, + "gamma_dfa_per_layer": [ + 0.22433382272720337, + -0.07114191353321075, + -0.07720339298248291, + -0.041190553456544876 + ], + "acc_eval": 0.16796875, + "loss_eval": 631.255859375, + "epoch": 14 + }, + { + "hidden_norms": [ + 2287.1767578125, + 140028.015625, + 188737.5625, + 197952.296875, + 214414.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000864461821038276, + 0.0007380775641649961, + 0.0007383264601230621, + 0.000738749688025564, + 0.0007389392121694982 + ], + "gamma_dfa": 0.01581217348575592, + "gamma_dfa_per_layer": [ + 0.21350334584712982, + -0.05864371731877327, + -0.039877790957689285, + -0.051733143627643585 + ], + "acc_eval": 0.1806640625, + "loss_eval": 720.0626220703125, + "epoch": 15 + }, + { + "hidden_norms": [ + 2390.364013671875, + 180786.796875, + 233030.703125, + 243522.09375, + 260648.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010889085242524743, + 0.0007420245674438775, + 0.0007420974434353411, + 0.0007420690963044763, + 0.0007420206675305963 + ], + "gamma_dfa": 0.01692677615210414, + "gamma_dfa_per_layer": [ + 0.22792349755764008, + -0.06613948941230774, + -0.0679212138056755, + -0.026155689731240273 + ], + "acc_eval": 0.1904296875, + "loss_eval": 1348.43115234375, + "epoch": 16 + }, + { + "hidden_norms": [ + 2525.60009765625, + 226341.015625, + 282575.21875, + 294521.5, + 313155.65625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010620173998177052, + 0.0007694299565628171, + 0.0007695311214774847, + 0.0007694744854234159, + 0.000769737409427762 + ], + "gamma_dfa": 0.012939120642840862, + "gamma_dfa_per_layer": [ + 0.24798060953617096, + -0.07888300716876984, + -0.03452270105481148, + -0.0828184187412262 + ], + "acc_eval": 0.1572265625, + "loss_eval": 1277.5867919921875, + "epoch": 17 + }, + { + "hidden_norms": [ + 2738.423828125, + 284434.5625, + 346282.90625, + 359909.125, + 379330.46875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009644942474551499, + 0.0007429496035911143, + 0.0007425086805596948, + 0.0007422671769745648, + 0.0007426248048432171 + ], + "gamma_dfa": 0.02641105931252241, + "gamma_dfa_per_layer": [ + 0.2637922763824463, + -0.06210581958293915, + -0.05640384927392006, + -0.039638370275497437 + ], + "acc_eval": 0.220703125, + "loss_eval": 802.8688354492188, + "epoch": 18 + }, + { + "hidden_norms": [ + 2890.100830078125, + 346858.71875, + 414202.09375, + 429987.3125, + 451374.3125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010854159481823444, + 0.0007560763042420149, + 0.0007561030797660351, + 0.0007562912651337683, + 0.0007561809034086764 + ], + "gamma_dfa": -0.006043614819645882, + "gamma_dfa_per_layer": [ + 0.18550744652748108, + -0.07387037575244904, + -0.0915735587477684, + -0.04423797130584717 + ], + "acc_eval": 0.0927734375, + "loss_eval": 2067.48974609375, + "epoch": 19 + }, + { + "hidden_norms": [ + 3048.9677734375, + 416326.4375, + 488715.9375, + 506779.0, + 528907.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001142722088843584, + 0.0007379497401416302, + 0.0007378923473879695, + 0.0007379662129096687, + 0.0007378893787972629 + ], + "gamma_dfa": 0.020490088500082493, + "gamma_dfa_per_layer": [ + 0.21813809871673584, + -0.053681232035160065, + -0.04219571128487587, + -0.040300801396369934 + ], + "acc_eval": 0.2294921875, + "loss_eval": 1929.7166748046875, + "epoch": 20 + }, + { + "hidden_norms": [ + 3216.734619140625, + 499057.0, + 577401.1875, + 597297.0, + 620542.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014556541573256254, + 0.0007413470884785056, + 0.0007413764833472669, + 0.0007412104168906808, + 0.0007420589681714773 + ], + "gamma_dfa": 0.03948488784953952, + "gamma_dfa_per_layer": [ + 0.27680304646492004, + -0.05157003924250603, + -0.039460550993680954, + -0.02783290483057499 + ], + "acc_eval": 0.1474609375, + "loss_eval": 2699.9052734375, + "epoch": 21 + }, + { + "hidden_norms": [ + 3342.216064453125, + 584495.625, + 665696.625, + 687533.1875, + 710813.9375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001884044730104506, + 0.0007584495469927788, + 0.0007583577535115182, + 0.0007583281840197742, + 0.0007583273691125214 + ], + "gamma_dfa": 0.004080784507095814, + "gamma_dfa_per_layer": [ + 0.1770291030406952, + -0.056366197764873505, + -0.057933274656534195, + -0.046406492590904236 + ], + "acc_eval": 0.2373046875, + "loss_eval": 1742.9925537109375, + "epoch": 22 + }, + { + "hidden_norms": [ + 3566.038818359375, + 674756.3125, + 760463.3125, + 784571.125, + 808618.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.001965342788025737, + 0.0007340435404330492, + 0.0007341310847550631, + 0.0007343373727053404, + 0.0007337987190112472 + ], + "gamma_dfa": 0.030578704085201025, + "gamma_dfa_per_layer": [ + 0.24771088361740112, + -0.05749209225177765, + -0.04569869861006737, + -0.022205276414752007 + ], + "acc_eval": 0.1611328125, + "loss_eval": 2397.3916015625, + "epoch": 23 + }, + { + "hidden_norms": [ + 3779.54296875, + 786509.5, + 877152.1875, + 903987.8125, + 928449.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016364307375624776, + 0.0007935749599710107, + 0.000793365528807044, + 0.0007934189052321017, + 0.0007935216999612749 + ], + "gamma_dfa": 0.01740677817724645, + "gamma_dfa_per_layer": [ + 0.2701166570186615, + -0.0851234570145607, + 0.004913746379315853, + -0.12027983367443085 + ], + "acc_eval": 0.12109375, + "loss_eval": 4908.0458984375, + "epoch": 24 + }, + { + "hidden_norms": [ + 3969.119873046875, + 900145.9375, + 993945.75, + 1023047.9375, + 1047156.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012235429603606462, + 0.0007582573452964425, + 0.0007582195685245097, + 0.000758210604544729, + 0.0007582050748169422 + ], + "gamma_dfa": -0.005556041374802589, + "gamma_dfa_per_layer": [ + 0.2166597992181778, + -0.09299580752849579, + -0.09515514969825745, + -0.05073300749063492 + ], + "acc_eval": 0.1728515625, + "loss_eval": 3738.029541015625, + "epoch": 25 + }, + { + "hidden_norms": [ + 4167.24169921875, + 1027096.125, + 1126300.25, + 1158199.625, + 1183064.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015538743464276195, + 0.0007320540607906878, + 0.0007321767043322325, + 0.0007325086044147611, + 0.0007322292076423764 + ], + "gamma_dfa": 0.013890675269067287, + "gamma_dfa_per_layer": [ + 0.25793927907943726, + -0.09288333356380463, + -0.07571414113044739, + -0.03377910330891609 + ], + "acc_eval": 0.10546875, + "loss_eval": 6202.408203125, + "epoch": 26 + }, + { + "hidden_norms": [ + 4332.73046875, + 1157313.5, + 1261637.875, + 1297158.5, + 1323617.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015948566142469645, + 0.0007783056935295463, + 0.00077825813787058, + 0.0007782406755723059, + 0.0007781987660564482 + ], + "gamma_dfa": 0.02306488621979952, + "gamma_dfa_per_layer": [ + 0.2585013508796692, + -0.07491485029459, + -0.058371271938085556, + -0.03295568376779556 + ], + "acc_eval": 0.208984375, + "loss_eval": 4646.37451171875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4508.3486328125, + 1310938.125, + 1421261.875, + 1460382.75, + 1487384.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001599438488483429, + 0.0007645513396710157, + 0.0007644708384759724, + 0.00076470518251881, + 0.0007645483710803092 + ], + "gamma_dfa": 0.017900947481393814, + "gamma_dfa_per_layer": [ + 0.24153774976730347, + -0.06473007053136826, + -0.06562119722366333, + -0.039582692086696625 + ], + "acc_eval": 0.173828125, + "loss_eval": 5292.640625, + "epoch": 28 + }, + { + "hidden_norms": [ + 4729.70556640625, + 1458380.25, + 1572980.125, + 1615003.0, + 1642261.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014249716186895967, + 0.0007341640302911401, + 0.00073421117849648, + 0.0007345581543631852, + 0.0007344211917370558 + ], + "gamma_dfa": 0.03120402991771698, + "gamma_dfa_per_layer": [ + 0.2725849747657776, + -0.07284568250179291, + -0.05128118395805359, + -0.02364198863506317 + ], + "acc_eval": 0.17578125, + "loss_eval": 4871.27001953125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4886.33984375, + 1617197.25, + 1735577.625, + 1780813.375, + 1808887.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018187292153015733, + 0.0007682304712943733, + 0.0007675564847886562, + 0.0007677674293518066, + 0.0007678233087062836 + ], + "gamma_dfa": 0.017138252966105938, + "gamma_dfa_per_layer": [ + 0.2494080811738968, + -0.08018361777067184, + -0.027287419885396957, + -0.07338403165340424 + ], + "acc_eval": 0.193359375, + "loss_eval": 3960.6728515625, + "epoch": 30 + }, + { + "hidden_norms": [ + 5119.7841796875, + 1765219.5, + 1886735.375, + 1934213.125, + 1961976.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022127064876258373, + 0.000754481996409595, + 0.0007539362413808703, + 0.0007542265811935067, + 0.0007539446814917028 + ], + "gamma_dfa": 0.0332237659022212, + "gamma_dfa_per_layer": [ + 0.30639636516571045, + -0.08304375410079956, + -0.06092921271920204, + -0.029528334736824036 + ], + "acc_eval": 0.193359375, + "loss_eval": 4306.7734375, + "epoch": 31 + }, + { + "hidden_norms": [ + 5354.88720703125, + 1941186.125, + 2066860.125, + 2117348.25, + 2144884.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013304626336321235, + 0.0007719467394053936, + 0.0007719435379840434, + 0.0007721700239926577, + 0.0007720825960859656 + ], + "gamma_dfa": 0.01764332875609398, + "gamma_dfa_per_layer": [ + 0.2670303285121918, + -0.07338991016149521, + -0.05201137810945511, + -0.07105572521686554 + ], + "acc_eval": 0.1845703125, + "loss_eval": 4018.3662109375, + "epoch": 32 + }, + { + "hidden_norms": [ + 5519.78759765625, + 2116056.25, + 2246081.5, + 2300078.25, + 2327378.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016995095647871494, + 0.0007534062024205923, + 0.0007532716845162213, + 0.0007533822790719569, + 0.0007532139425165951 + ], + "gamma_dfa": 0.021287068724632263, + "gamma_dfa_per_layer": [ + 0.2717400789260864, + -0.08038187026977539, + -0.05876553803682327, + -0.04744439572095871 + ], + "acc_eval": 0.216796875, + "loss_eval": 6509.134765625, + "epoch": 33 + }, + { + "hidden_norms": [ + 5700.9130859375, + 2317603.75, + 2452612.5, + 2509779.5, + 2537064.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001880816649645567, + 0.0007947525009512901, + 0.0007945421966724098, + 0.0007944482495076954, + 0.0007949797436594963 + ], + "gamma_dfa": 0.02851281687617302, + "gamma_dfa_per_layer": [ + 0.2822743058204651, + -0.08248982578516006, + -0.05187612026929855, + -0.03385709226131439 + ], + "acc_eval": 0.1337890625, + "loss_eval": 8231.9248046875, + "epoch": 34 + }, + { + "hidden_norms": [ + 5855.8310546875, + 2515524.75, + 2653569.0, + 2713748.5, + 2740903.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018560283351689577, + 0.0007757823332212865, + 0.0007757038110867143, + 0.0007756180129945278, + 0.0007759004947729409 + ], + "gamma_dfa": 0.018099953944329172, + "gamma_dfa_per_layer": [ + 0.2729976773262024, + -0.08800812810659409, + -0.002550901612266898, + -0.11003883183002472 + ], + "acc_eval": 0.150390625, + "loss_eval": 7247.7216796875, + "epoch": 35 + }, + { + "hidden_norms": [ + 6036.9033203125, + 2711563.0, + 2854179.0, + 2918077.75, + 2945814.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001862754113972187, + 0.0007525583496317267, + 0.0007525330875068903, + 0.0007526627741754055, + 0.0007525623659603298 + ], + "gamma_dfa": 0.02487885858863592, + "gamma_dfa_per_layer": [ + 0.29685819149017334, + -0.08635345101356506, + -0.056181322783231735, + -0.054807983338832855 + ], + "acc_eval": 0.1435546875, + "loss_eval": 7513.36376953125, + "epoch": 36 + }, + { + "hidden_norms": [ + 6188.01611328125, + 2906995.5, + 3054202.25, + 3121279.0, + 3149996.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013340733712539077, + 0.0007529910071752965, + 0.0007524905377067626, + 0.0007527912384830415, + 0.0007525555556640029 + ], + "gamma_dfa": 0.027058321982622147, + "gamma_dfa_per_layer": [ + 0.25763267278671265, + -0.06575162708759308, + -0.04412994533777237, + -0.03951781243085861 + ], + "acc_eval": 0.2431640625, + "loss_eval": 12329.697265625, + "epoch": 37 + }, + { + "hidden_norms": [ + 6390.7060546875, + 3133419.5, + 3288636.0, + 3360502.75, + 3390539.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014776778407394886, + 0.0007607035804539919, + 0.0007607110310345888, + 0.0007606975850649178, + 0.000760715629439801 + ], + "gamma_dfa": 0.022189474664628506, + "gamma_dfa_per_layer": [ + 0.2616554796695709, + -0.07128072530031204, + -0.06259018927812576, + -0.039026666432619095 + ], + "acc_eval": 0.173828125, + "loss_eval": 6832.28955078125, + "epoch": 38 + }, + { + "hidden_norms": [ + 6548.68115234375, + 3356773.75, + 3517968.25, + 3593598.5, + 3624375.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002129003871232271, + 0.0007741872104816139, + 0.000774160900618881, + 0.0007743749301880598, + 0.0007743173046037555 + ], + "gamma_dfa": 0.034090133383870125, + "gamma_dfa_per_layer": [ + 0.3182219862937927, + -0.08398662507534027, + -0.06546281278133392, + -0.03241201490163803 + ], + "acc_eval": 0.1904296875, + "loss_eval": 5371.0859375, + "epoch": 39 + }, + { + "hidden_norms": [ + 6723.9697265625, + 3592963.25, + 3757696.25, + 3837777.75, + 3868088.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018772021867334843, + 0.0007547365385107696, + 0.0007547002169303596, + 0.0007546909037046134, + 0.000754650856833905 + ], + "gamma_dfa": 0.003609549254179001, + "gamma_dfa_per_layer": [ + 0.282962441444397, + -0.10840916633605957, + -0.10053665935993195, + -0.05957841873168945 + ], + "acc_eval": 0.1376953125, + "loss_eval": 8650.76953125, + "epoch": 40 + }, + { + "hidden_norms": [ + 6887.81005859375, + 3829273.5, + 3999416.75, + 4084005.5, + 4113581.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020062020048499107, + 0.0007521071238443255, + 0.0007519447826780379, + 0.0007520412327721715, + 0.0007518909987993538 + ], + "gamma_dfa": 0.01951257325708866, + "gamma_dfa_per_layer": [ + 0.2743881344795227, + -0.08543786406517029, + -0.05402272939682007, + -0.056877247989177704 + ], + "acc_eval": 0.1796875, + "loss_eval": 15509.98828125, + "epoch": 41 + }, + { + "hidden_norms": [ + 7027.42626953125, + 4050130.5, + 4223340.0, + 4310667.5, + 4340882.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016777552664279938, + 0.0007508718408644199, + 0.0007508369744755328, + 0.0007509454735554755, + 0.0007508718408644199 + ], + "gamma_dfa": 0.02786387037485838, + "gamma_dfa_per_layer": [ + 0.2803051769733429, + -0.07360324263572693, + -0.04823639243841171, + -0.04701006039977074 + ], + "acc_eval": 0.2275390625, + "loss_eval": 7618.71533203125, + "epoch": 42 + }, + { + "hidden_norms": [ + 7157.845703125, + 4292685.0, + 4471049.5, + 4562175.0, + 4591811.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016224944265559316, + 0.0007538175559602678, + 0.0007538740755990148, + 0.0007538648205809295, + 0.0007538393838331103 + ], + "gamma_dfa": 0.0053657907992601395, + "gamma_dfa_per_layer": [ + 0.26428842544555664, + -0.10051027685403824, + -0.08806045353412628, + -0.05425453186035156 + ], + "acc_eval": 0.166015625, + "loss_eval": 7869.64111328125, + "epoch": 43 + }, + { + "hidden_norms": [ + 7275.4365234375, + 4532040.5, + 4714971.5, + 4809776.0, + 4839258.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002823092043399811, + 0.0007887987303547561, + 0.0007888769032433629, + 0.0007889135158620775, + 0.0007889300468377769 + ], + "gamma_dfa": 0.008974121417850256, + "gamma_dfa_per_layer": [ + 0.25932246446609497, + -0.10199789702892303, + 0.012336602434515953, + -0.13376468420028687 + ], + "acc_eval": 0.091796875, + "loss_eval": 19789.41796875, + "epoch": 44 + }, + { + "hidden_norms": [ + 7393.93212890625, + 4772152.5, + 4958566.0, + 5058113.0, + 5086560.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019131727749481797, + 0.0007677456014789641, + 0.0007676532259210944, + 0.000767527730204165, + 0.0007678664987906814 + ], + "gamma_dfa": 0.014807725325226784, + "gamma_dfa_per_layer": [ + 0.23344306647777557, + -0.08349616825580597, + -0.0560825914144516, + -0.03463340550661087 + ], + "acc_eval": 0.224609375, + "loss_eval": 12636.65625, + "epoch": 45 + }, + { + "hidden_norms": [ + 7527.99462890625, + 5048336.0, + 5239027.5, + 5342244.0, + 5370085.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018555351998656988, + 0.000769329781178385, + 0.0007686647586524487, + 0.0007689501508139074, + 0.0007690390921197832 + ], + "gamma_dfa": 0.004876136779785156, + "gamma_dfa_per_layer": [ + 0.21739649772644043, + -0.08506827056407928, + -0.03674054145812988, + -0.07608313858509064 + ], + "acc_eval": 0.232421875, + "loss_eval": 12248.12109375, + "epoch": 46 + }, + { + "hidden_norms": [ + 7638.85693359375, + 5287113.0, + 5479795.0, + 5586404.5, + 5613225.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0025236238725483418, + 0.0007688805344514549, + 0.000768228666856885, + 0.0007684807060286403, + 0.0007685597520321608 + ], + "gamma_dfa": -0.006854387931525707, + "gamma_dfa_per_layer": [ + 0.17993390560150146, + -0.08751687407493591, + -0.030272338539361954, + -0.08956224471330643 + ], + "acc_eval": 0.1796875, + "loss_eval": 18537.177734375, + "epoch": 47 + }, + { + "hidden_norms": [ + 7754.390625, + 5527426.0, + 5724221.0, + 5833576.5, + 5860100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020714402198791504, + 0.0007631001644767821, + 0.0007630567415617406, + 0.0007630541222169995, + 0.0007631017942912877 + ], + "gamma_dfa": 0.02875693328678608, + "gamma_dfa_per_layer": [ + 0.29564130306243896, + -0.08437579870223999, + -0.050235565751791, + -0.04600220546126366 + ], + "acc_eval": 0.208984375, + "loss_eval": 10527.2578125, + "epoch": 48 + }, + { + "hidden_norms": [ + 7888.46923828125, + 5787159.5, + 5987915.0, + 6101035.0, + 6127097.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0026283818297088146, + 0.0007835617288947105, + 0.0007836156873963773, + 0.000783648225478828, + 0.0007836673175916076 + ], + "gamma_dfa": 0.011204172391444445, + "gamma_dfa_per_layer": [ + 0.26796066761016846, + -0.10181419551372528, + 0.010023357346653938, + -0.13135313987731934 + ], + "acc_eval": 0.0966796875, + "loss_eval": 15481.84375, + "epoch": 49 + }, + { + "hidden_norms": [ + 7975.13671875, + 6029198.0, + 6234359.5, + 6352162.0, + 6377873.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001740386476740241, + 0.0007632866618223488, + 0.0007632256019860506, + 0.0007631148328073323, + 0.0007634586072526872 + ], + "gamma_dfa": -0.000985240563750267, + "gamma_dfa_per_layer": [ + 0.20569762587547302, + -0.0866088718175888, + -0.04746733605861664, + -0.07556238025426865 + ], + "acc_eval": 0.2001953125, + "loss_eval": 12020.572265625, + "epoch": 50 + }, + { + "hidden_norms": [ + 8109.23095703125, + 6280213.0, + 6488845.5, + 6610432.5, + 6636101.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018630403792485595, + 0.0007671525236219168, + 0.000766951881814748, + 0.0007671291241422296, + 0.0007672281353734434 + ], + "gamma_dfa": -0.0027379142120480537, + "gamma_dfa_per_layer": [ + 0.22697225213050842, + -0.10085368156433105, + -0.059774767607450485, + -0.0772954598069191 + ], + "acc_eval": 0.13671875, + "loss_eval": 12490.904296875, + "epoch": 51 + }, + { + "hidden_norms": [ + 8223.3388671875, + 6520398.5, + 6731145.5, + 6855487.0, + 6880542.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020134998485445976, + 0.0007573508773930371, + 0.0007573754992336035, + 0.0007574421470053494, + 0.0007576147909276187 + ], + "gamma_dfa": 0.00887075625360012, + "gamma_dfa_per_layer": [ + 0.260132372379303, + -0.08125708997249603, + -0.07711100578308105, + -0.06628125160932541 + ], + "acc_eval": 0.12890625, + "loss_eval": 13286.50390625, + "epoch": 52 + }, + { + "hidden_norms": [ + 8317.2099609375, + 6773551.0, + 6990263.5, + 7117609.5, + 7143509.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016349060460925102, + 0.000744542689062655, + 0.0007445236551575363, + 0.000744638848118484, + 0.0007445821538567543 + ], + "gamma_dfa": 0.036132486537098885, + "gamma_dfa_per_layer": [ + 0.35822737216949463, + -0.09246134012937546, + -0.05995674431324005, + -0.06127934157848358 + ], + "acc_eval": 0.1318359375, + "loss_eval": 12961.923828125, + "epoch": 53 + }, + { + "hidden_norms": [ + 8396.16015625, + 7036334.0, + 7256480.5, + 7388541.0, + 7414023.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016424244968220592, + 0.0007655483204871416, + 0.0007653584470972419, + 0.0007655261433683336, + 0.0007656112429685891 + ], + "gamma_dfa": 0.00855250470340252, + "gamma_dfa_per_layer": [ + 0.31318342685699463, + -0.11486171185970306, + -0.07210143655538559, + -0.0920102596282959 + ], + "acc_eval": 0.0986328125, + "loss_eval": 14289.1396484375, + "epoch": 54 + }, + { + "hidden_norms": [ + 8425.91796875, + 7268265.0, + 7491250.5, + 7626377.5, + 7651502.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014321975177153945, + 0.0007547372952103615, + 0.0007547161658294499, + 0.0007547704153694212, + 0.000754979089833796 + ], + "gamma_dfa": 0.019777772948145866, + "gamma_dfa_per_layer": [ + 0.3146383762359619, + -0.0827077254652977, + -0.0876566469669342, + -0.06516291201114655 + ], + "acc_eval": 0.0908203125, + "loss_eval": 12761.185546875, + "epoch": 55 + }, + { + "hidden_norms": [ + 8519.505859375, + 7514964.5, + 7741589.0, + 7880037.0, + 7905207.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017787133110687137, + 0.0007505406392738223, + 0.0007507357513532043, + 0.0007507326663471758, + 0.0007507237605750561 + ], + "gamma_dfa": -0.012186199426651001, + "gamma_dfa_per_layer": [ + 0.2306034117937088, + -0.11392365396022797, + -0.1025918573141098, + -0.06283269822597504 + ], + "acc_eval": 0.1455078125, + "loss_eval": 8573.3310546875, + "epoch": 56 + }, + { + "hidden_norms": [ + 8575.814453125, + 7701015.5, + 7930432.0, + 8070523.0, + 8095346.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013273135991767049, + 0.0007214294746518135, + 0.0007213159115053713, + 0.0007215962978079915, + 0.0007215975201688707 + ], + "gamma_dfa": 0.02046024613082409, + "gamma_dfa_per_layer": [ + 0.2830252945423126, + -0.09345690906047821, + -0.06962529569864273, + -0.038102105259895325 + ], + "acc_eval": 0.1923828125, + "loss_eval": 6201.162109375, + "epoch": 57 + }, + { + "hidden_norms": [ + 8635.1220703125, + 7939687.0, + 8172801.5, + 8315327.5, + 8340462.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002125338651239872, + 0.0007551790331490338, + 0.0007551065064035356, + 0.0007549694273620844, + 0.000755314074922353 + ], + "gamma_dfa": 0.019076894968748093, + "gamma_dfa_per_layer": [ + 0.25508445501327515, + -0.07673472911119461, + -0.04303552210330963, + -0.059006623923778534 + ], + "acc_eval": 0.1865234375, + "loss_eval": 12055.595703125, + "epoch": 58 + }, + { + "hidden_norms": [ + 8706.6689453125, + 8158003.0, + 8394169.0, + 8539798.0, + 8565165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001350156613625586, + 0.0007560249068774283, + 0.0007559725781902671, + 0.0007558663492091, + 0.0007561935926787555 + ], + "gamma_dfa": 0.028152598068118095, + "gamma_dfa_per_layer": [ + 0.28580546379089355, + -0.08475945889949799, + -0.05238167941570282, + -0.03605393320322037 + ], + "acc_eval": 0.220703125, + "loss_eval": 12085.9541015625, + "epoch": 59 + }, + { + "hidden_norms": [ + 8758.453125, + 8374766.0, + 8613513.0, + 8761622.0, + 8786363.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002377285622060299, + 0.0007197813247330487, + 0.0007195555372163653, + 0.0007198317907750607, + 0.000719684932846576 + ], + "gamma_dfa": 0.025455349124968052, + "gamma_dfa_per_layer": [ + 0.27419814467430115, + -0.08699844777584076, + -0.04594934359192848, + -0.0394289568066597 + ], + "acc_eval": 0.1669921875, + "loss_eval": 13302.744140625, + "epoch": 60 + }, + { + "hidden_norms": [ + 8795.5654296875, + 8572136.0, + 8812910.0, + 8963599.0, + 8987706.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015984047204256058, + 0.0007187420851550996, + 0.0007185072172433138, + 0.000718816474545747, + 0.000718718278221786 + ], + "gamma_dfa": 0.020128127187490463, + "gamma_dfa_per_layer": [ + 0.3066103458404541, + -0.1022094339132309, + -0.07834567129611969, + -0.04554273188114166 + ], + "acc_eval": 0.1181640625, + "loss_eval": 6553.7236328125, + "epoch": 61 + }, + { + "hidden_norms": [ + 8811.46875, + 8766653.0, + 9009529.0, + 9162389.0, + 9185680.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019123096717521548, + 0.0007724921451881528, + 0.0007725215400569141, + 0.0007725482573732734, + 0.0007725649629719555 + ], + "gamma_dfa": 0.03271363768726587, + "gamma_dfa_per_layer": [ + 0.2947639226913452, + -0.08735189586877823, + -0.04557036980986595, + -0.030987106263637543 + ], + "acc_eval": 0.18359375, + "loss_eval": 11607.7158203125, + "epoch": 62 + }, + { + "hidden_norms": [ + 8860.6220703125, + 8977001.0, + 9224122.0, + 9379773.0, + 9402851.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013403806369751692, + 0.0007685344316996634, + 0.0007685531745664775, + 0.0007685986929573119, + 0.0007685821619816124 + ], + "gamma_dfa": 0.020242065889760852, + "gamma_dfa_per_layer": [ + 0.30239802598953247, + -0.09480112791061401, + -0.014634584076702595, + -0.11199405044317245 + ], + "acc_eval": 0.1337890625, + "loss_eval": 9788.81640625, + "epoch": 63 + }, + { + "hidden_norms": [ + 8904.9482421875, + 9185937.0, + 9436793.0, + 9595000.0, + 9618183.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012845145538449287, + 0.0007421535556204617, + 0.0007421503541991115, + 0.0007421293412335217, + 0.0007421668851748109 + ], + "gamma_dfa": 0.02229973580688238, + "gamma_dfa_per_layer": [ + 0.2927352786064148, + -0.08628389239311218, + -0.060364432632923126, + -0.05688801035284996 + ], + "acc_eval": 0.1728515625, + "loss_eval": 8114.20458984375, + "epoch": 64 + }, + { + "hidden_norms": [ + 8892.296875, + 9356716.0, + 9611136.0, + 9771064.0, + 9794530.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001351315644569695, + 0.0007599962409585714, + 0.0007597811054438353, + 0.0007599799428135157, + 0.0007600505487062037 + ], + "gamma_dfa": 0.019069598987698555, + "gamma_dfa_per_layer": [ + 0.29072487354278564, + -0.0944916158914566, + -0.05359811335802078, + -0.06635674834251404 + ], + "acc_eval": 0.169921875, + "loss_eval": 8773.3408203125, + "epoch": 65 + }, + { + "hidden_norms": [ + 8905.83984375, + 9511506.0, + 9766884.0, + 9928659.0, + 9951002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017338081961497664, + 0.0007696599350310862, + 0.0007696837419643998, + 0.0007697126129642129, + 0.0007697291439399123 + ], + "gamma_dfa": 0.028427925892174244, + "gamma_dfa_per_layer": [ + 0.3319295644760132, + -0.09938425570726395, + 0.004324089735746384, + -0.12315769493579865 + ], + "acc_eval": 0.1142578125, + "loss_eval": 12823.435546875, + "epoch": 66 + }, + { + "hidden_norms": [ + 8944.53125, + 9692436.0, + 9950194.0, + 10113948.0, + 10136307.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017030658200383186, + 0.000714489258825779, + 0.0007141575333662331, + 0.0007145405979827046, + 0.0007144163828343153 + ], + "gamma_dfa": 0.055724941194057465, + "gamma_dfa_per_layer": [ + 0.3514706492424011, + -0.07685236632823944, + -0.031716104596853256, + -0.020002413541078568 + ], + "acc_eval": 0.18359375, + "loss_eval": 10412.890625, + "epoch": 67 + }, + { + "hidden_norms": [ + 8926.98828125, + 9838798.0, + 10099141.0, + 10264565.0, + 10286604.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015448650810867548, + 0.0007684402517043054, + 0.0007684584707021713, + 0.0007684882148168981, + 0.0007685049204155803 + ], + "gamma_dfa": 0.032529132440686226, + "gamma_dfa_per_layer": [ + 0.3082513213157654, + -0.0888272076845169, + -0.032446227967739105, + -0.056861355900764465 + ], + "acc_eval": 0.19921875, + "loss_eval": 8345.18359375, + "epoch": 68 + }, + { + "hidden_norms": [ + 8903.689453125, + 10005445.0, + 10266980.0, + 10434005.0, + 10454617.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017746278317645192, + 0.0007130402373149991, + 0.0007127230055630207, + 0.0007131076999939978, + 0.0007130174781195819 + ], + "gamma_dfa": 0.05443635303527117, + "gamma_dfa_per_layer": [ + 0.35508570075035095, + -0.08241431415081024, + -0.03841204196214676, + -0.01651393249630928 + ], + "acc_eval": 0.140625, + "loss_eval": 7877.36181640625, + "epoch": 69 + }, + { + "hidden_norms": [ + 8910.42578125, + 10173785.0, + 10439506.0, + 10609011.0, + 10630571.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011222161119803786, + 0.0007312637171708047, + 0.0007313191890716553, + 0.0007313672685995698, + 0.0007313768728636205 + ], + "gamma_dfa": 0.023520448245108128, + "gamma_dfa_per_layer": [ + 0.29335978627204895, + -0.08935706317424774, + -0.06947942078113556, + -0.04044150933623314 + ], + "acc_eval": 0.2421875, + "loss_eval": 5653.23388671875, + "epoch": 70 + }, + { + "hidden_norms": [ + 8876.2041015625, + 10317365.0, + 10586095.0, + 10757344.0, + 10779691.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011208312353119254, + 0.0007571111200377345, + 0.0007568965083919466, + 0.0007570943562313914, + 0.0007571595488116145 + ], + "gamma_dfa": 0.025294490158557892, + "gamma_dfa_per_layer": [ + 0.331506609916687, + -0.09467847645282745, + -0.06287634372711182, + -0.07277382910251617 + ], + "acc_eval": 0.1884765625, + "loss_eval": 3869.094970703125, + "epoch": 71 + }, + { + "hidden_norms": [ + 8852.7001953125, + 10449657.0, + 10719980.0, + 10891483.0, + 10913594.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001109768869355321, + 0.0007331773522309959, + 0.0007331601809710264, + 0.0007332302629947662, + 0.0007332285749725997 + ], + "gamma_dfa": 0.03539558406919241, + "gamma_dfa_per_layer": [ + 0.3268349766731262, + -0.08062416315078735, + -0.055393531918525696, + -0.04923494532704353 + ], + "acc_eval": 0.2353515625, + "loss_eval": 7111.935546875, + "epoch": 72 + }, + { + "hidden_norms": [ + 8827.3955078125, + 10582167.0, + 10855077.0, + 11028114.0, + 11050690.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001240618177689612, + 0.0007623998681083322, + 0.0007624404970556498, + 0.0007624777499586344, + 0.0007624629070051014 + ], + "gamma_dfa": 0.03839550958946347, + "gamma_dfa_per_layer": [ + 0.36802345514297485, + -0.09764832258224487, + -0.0042990874499082565, + -0.11249400675296783 + ], + "acc_eval": 0.1357421875, + "loss_eval": 6752.0322265625, + "epoch": 73 + }, + { + "hidden_norms": [ + 8814.1962890625, + 10696667.0, + 10971925.0, + 11146316.0, + 11168931.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001309843035414815, + 0.0007403214112855494, + 0.0007405314245261252, + 0.0007405264186672866, + 0.0007405087817460299 + ], + "gamma_dfa": 0.038134077563881874, + "gamma_dfa_per_layer": [ + 0.3364037275314331, + -0.08192241191864014, + -0.03633008152246475, + -0.06561492383480072 + ], + "acc_eval": 0.212890625, + "loss_eval": 6998.021484375, + "epoch": 74 + }, + { + "hidden_norms": [ + 8779.0400390625, + 10798076.0, + 11075004.0, + 11250115.0, + 11272600.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011087025050073862, + 0.0007316112169064581, + 0.0007316232076846063, + 0.0007316932315006852, + 0.00073169672396034 + ], + "gamma_dfa": 0.04451032355427742, + "gamma_dfa_per_layer": [ + 0.34500744938850403, + -0.07661331444978714, + -0.04388073831796646, + -0.04647210240364075 + ], + "acc_eval": 0.2490234375, + "loss_eval": 3624.614013671875, + "epoch": 75 + }, + { + "hidden_norms": [ + 8751.8486328125, + 10906611.0, + 11185716.0, + 11362176.0, + 11384611.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001067605335265398, + 0.0007393756532110274, + 0.0007396025466732681, + 0.000739598530344665, + 0.000739583745598793 + ], + "gamma_dfa": 0.03648093156516552, + "gamma_dfa_per_layer": [ + 0.31906285881996155, + -0.07843812555074692, + -0.051880721002817154, + -0.0428202860057354 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2816.3427734375, + "epoch": 76 + }, + { + "hidden_norms": [ + 8743.0078125, + 10999747.0, + 11279813.0, + 11457343.0, + 11479737.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010900371707975864, + 0.0007332717068493366, + 0.0007332694949582219, + 0.0007332508685067296, + 0.0007332859677262604 + ], + "gamma_dfa": 0.03520212788134813, + "gamma_dfa_per_layer": [ + 0.3010096549987793, + -0.07223288714885712, + -0.05185239389538765, + -0.036115862429142 + ], + "acc_eval": 0.2451171875, + "loss_eval": 3747.66748046875, + "epoch": 77 + }, + { + "hidden_norms": [ + 8693.3349609375, + 11081850.0, + 11362476.0, + 11540274.0, + 11562006.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010161141399294138, + 0.0007433417486026883, + 0.0007432828424498439, + 0.000743163691367954, + 0.0007434578728862107 + ], + "gamma_dfa": 0.04203554056584835, + "gamma_dfa_per_layer": [ + 0.3622134029865265, + -0.08443501591682434, + -0.020812533795833588, + -0.08882369101047516 + ], + "acc_eval": 0.1953125, + "loss_eval": 3283.453125, + "epoch": 78 + }, + { + "hidden_norms": [ + 8679.0673828125, + 11176062.0, + 11458995.0, + 11637744.0, + 11660108.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010180213721469045, + 0.0007298000273294747, + 0.000729813240468502, + 0.0007298758719116449, + 0.0007298807031475008 + ], + "gamma_dfa": 0.03867925424128771, + "gamma_dfa_per_layer": [ + 0.3430703282356262, + -0.08001460134983063, + -0.05243712291121483, + -0.05590158700942993 + ], + "acc_eval": 0.22265625, + "loss_eval": 3249.233154296875, + "epoch": 79 + }, + { + "hidden_norms": [ + 8630.8896484375, + 11249126.0, + 11532709.0, + 11711592.0, + 11733760.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001043561496771872, + 0.0007425911608152092, + 0.0007425197982229292, + 0.0007423801580443978, + 0.000742721778806299 + ], + "gamma_dfa": 0.028339628130197525, + "gamma_dfa_per_layer": [ + 0.32279035449028015, + -0.09357395768165588, + -0.06377816200256348, + -0.05207972228527069 + ], + "acc_eval": 0.1904296875, + "loss_eval": 3085.4638671875, + "epoch": 80 + }, + { + "hidden_norms": [ + 8578.060546875, + 11304050.0, + 11589802.0, + 11769234.0, + 11792299.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000967628788203001, + 0.0007289479253813624, + 0.0007289598579518497, + 0.0007290169014595449, + 0.0007290222565643489 + ], + "gamma_dfa": 0.02121756039559841, + "gamma_dfa_per_layer": [ + 0.31049084663391113, + -0.09504136443138123, + -0.07916043698787689, + -0.05141880363225937 + ], + "acc_eval": 0.236328125, + "loss_eval": 1885.889404296875, + "epoch": 81 + }, + { + "hidden_norms": [ + 8522.4794921875, + 11393685.0, + 11680880.0, + 11860855.0, + 11883774.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010794082190841436, + 0.0007521919906139374, + 0.0007519960636273026, + 0.0007521732477471232, + 0.0007522284286096692 + ], + "gamma_dfa": 0.026587368920445442, + "gamma_dfa_per_layer": [ + 0.37745779752731323, + -0.11168865859508514, + -0.0728297159075737, + -0.08658994734287262 + ], + "acc_eval": 0.1220703125, + "loss_eval": 2588.15478515625, + "epoch": 82 + }, + { + "hidden_norms": [ + 8482.1484375, + 11447732.0, + 11736021.0, + 11916302.0, + 11939110.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009376976522617042, + 0.0007250583730638027, + 0.000724694284144789, + 0.0007250410853885114, + 0.0007250093622133136 + ], + "gamma_dfa": 0.0355191919952631, + "gamma_dfa_per_layer": [ + 0.31943440437316895, + -0.07911509275436401, + -0.0536213181912899, + -0.04462122544646263 + ], + "acc_eval": 0.2783203125, + "loss_eval": 1507.2919921875, + "epoch": 83 + }, + { + "hidden_norms": [ + 8430.1455078125, + 11492522.0, + 11781554.0, + 11962317.0, + 11985175.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009387033060193062, + 0.0007079826318658888, + 0.0007078545750118792, + 0.0007080811192281544, + 0.0007080849609337747 + ], + "gamma_dfa": 0.036465028300881386, + "gamma_dfa_per_layer": [ + 0.3066443204879761, + -0.07488954067230225, + -0.03129498288035393, + -0.05459968373179436 + ], + "acc_eval": 0.275390625, + "loss_eval": 1614.5029296875, + "epoch": 84 + }, + { + "hidden_norms": [ + 8369.6298828125, + 11532036.0, + 11821641.0, + 12002443.0, + 12025323.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009389162878505886, + 0.0007232772768475115, + 0.0007233347278088331, + 0.0007233632495626807, + 0.000723376520909369 + ], + "gamma_dfa": 0.040183850564062595, + "gamma_dfa_per_layer": [ + 0.34539365768432617, + -0.08373545110225677, + -0.05380668863654137, + -0.04711611568927765 + ], + "acc_eval": 0.25, + "loss_eval": 1501.9444580078125, + "epoch": 85 + }, + { + "hidden_norms": [ + 8319.4169921875, + 11569238.0, + 11860199.0, + 12041371.0, + 12064573.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009176665917038918, + 0.0007041870849207044, + 0.0007039242191240191, + 0.0007042758516035974, + 0.0007042170618660748 + ], + "gamma_dfa": 0.035514961928129196, + "gamma_dfa_per_layer": [ + 0.2879785895347595, + -0.07180146872997284, + -0.037917762994766235, + -0.03619951009750366 + ], + "acc_eval": 0.30859375, + "loss_eval": 1078.8165283203125, + "epoch": 86 + }, + { + "hidden_norms": [ + 8282.478515625, + 11596869.0, + 11888039.0, + 12069453.0, + 12092582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00098571612033993, + 0.000731602602172643, + 0.0007312855450436473, + 0.0007312477100640535, + 0.0007316134287975729 + ], + "gamma_dfa": 0.04066215269267559, + "gamma_dfa_per_layer": [ + 0.33381348848342896, + -0.08063024282455444, + -0.055662885308265686, + -0.034871749579906464 + ], + "acc_eval": 0.234375, + "loss_eval": 1841.648193359375, + "epoch": 87 + }, + { + "hidden_norms": [ + 8242.1005859375, + 11624052.0, + 11916218.0, + 12098548.0, + 12121911.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009184937225654721, + 0.0007233315263874829, + 0.000723001197911799, + 0.0007232833886519074, + 0.0007232468342408538 + ], + "gamma_dfa": 0.03233872726559639, + "gamma_dfa_per_layer": [ + 0.2990570068359375, + -0.07802218198776245, + -0.04814079403877258, + -0.04353912174701691 + ], + "acc_eval": 0.2890625, + "loss_eval": 980.395751953125, + "epoch": 88 + }, + { + "hidden_norms": [ + 8216.91796875, + 11647355.0, + 11939175.0, + 12121172.0, + 12144056.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008776114555075765, + 0.0007067625410854816, + 0.0007066249381750822, + 0.0007068619015626609, + 0.0007068667327985168 + ], + "gamma_dfa": 0.027417242527008057, + "gamma_dfa_per_layer": [ + 0.28433892130851746, + -0.07622525095939636, + -0.050822652876377106, + -0.04762204736471176 + ], + "acc_eval": 0.326171875, + "loss_eval": 776.0946044921875, + "epoch": 89 + }, + { + "hidden_norms": [ + 8169.76513671875, + 11658648.0, + 11950474.0, + 12132456.0, + 12155182.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008986471802927554, + 0.0007065801764838398, + 0.0007064181263558567, + 0.000706693041138351, + 0.0007066999096423388 + ], + "gamma_dfa": 0.03352018166333437, + "gamma_dfa_per_layer": [ + 0.296892374753952, + -0.07546264678239822, + -0.04814247041940689, + -0.03920653089880943 + ], + "acc_eval": 0.3095703125, + "loss_eval": 893.558349609375, + "epoch": 90 + }, + { + "hidden_norms": [ + 8142.11669921875, + 11667783.0, + 11959690.0, + 12141714.0, + 12164439.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009172433638013899, + 0.0007064292440190911, + 0.0007062776712700725, + 0.0007065359968692064, + 0.000706541701219976 + ], + "gamma_dfa": 0.03799809701740742, + "gamma_dfa_per_layer": [ + 0.31104975938796997, + -0.07753260433673859, + -0.04483959078788757, + -0.03668517619371414 + ], + "acc_eval": 0.2763671875, + "loss_eval": 918.902099609375, + "epoch": 91 + }, + { + "hidden_norms": [ + 8113.36474609375, + 11673688.0, + 11965558.0, + 12147558.0, + 12170198.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009179572225548327, + 0.0007257050601765513, + 0.0007257269462570548, + 0.0007257769466377795, + 0.0007257869001477957 + ], + "gamma_dfa": 0.03620104119181633, + "gamma_dfa_per_layer": [ + 0.3097808361053467, + -0.07722775638103485, + -0.0500766858458519, + -0.03767222911119461 + ], + "acc_eval": 0.2880859375, + "loss_eval": 1033.579833984375, + "epoch": 92 + }, + { + "hidden_norms": [ + 8085.35595703125, + 11678927.0, + 11970798.0, + 12152808.0, + 12175446.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008720594923943281, + 0.0007061808719299734, + 0.0007060291827656329, + 0.0007062855875119567, + 0.0007062909426167607 + ], + "gamma_dfa": 0.03221010882407427, + "gamma_dfa_per_layer": [ + 0.2895042598247528, + -0.07448285818099976, + -0.04004380851984024, + -0.04613715782761574 + ], + "acc_eval": 0.3046875, + "loss_eval": 827.44140625, + "epoch": 93 + }, + { + "hidden_norms": [ + 8072.322265625, + 11682684.0, + 11974490.0, + 12156499.0, + 12179080.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008837314089760184, + 0.0007061065407469869, + 0.0007059663184918463, + 0.00070620869519189, + 0.000706215447280556 + ], + "gamma_dfa": 0.026722624897956848, + "gamma_dfa_per_layer": [ + 0.28959959745407104, + -0.08210700005292892, + -0.05253326892852783, + -0.048068828880786896 + ], + "acc_eval": 0.291015625, + "loss_eval": 795.6766357421875, + "epoch": 94 + }, + { + "hidden_norms": [ + 8063.02001953125, + 11684947.0, + 11976758.0, + 12158785.0, + 12181362.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008943622815422714, + 0.0007086708792485297, + 0.0007086790283210576, + 0.0007087094127200544, + 0.0007087020785547793 + ], + "gamma_dfa": 0.02946585137397051, + "gamma_dfa_per_layer": [ + 0.29232603311538696, + -0.08056485652923584, + -0.05102770775556564, + -0.042870063334703445 + ], + "acc_eval": 0.2919921875, + "loss_eval": 839.8633422851562, + "epoch": 95 + }, + { + "hidden_norms": [ + 8055.40576171875, + 11685775.0, + 11977584.0, + 12159594.0, + 12182165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008769903797656298, + 0.0007059753406792879, + 0.0007058423361741006, + 0.0007060715579427779, + 0.0007060769130475819 + ], + "gamma_dfa": 0.02765239030122757, + "gamma_dfa_per_layer": [ + 0.2855387032032013, + -0.07872132211923599, + -0.051525406539440155, + -0.04468241333961487 + ], + "acc_eval": 0.3115234375, + "loss_eval": 736.9282836914062, + "epoch": 96 + }, + { + "hidden_norms": [ + 8050.93310546875, + 11685670.0, + 11977453.0, + 12159452.0, + 12182004.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008705379441380501, + 0.0007085780380293727, + 0.0007085860124789178, + 0.0007086164550855756, + 0.0007086091791279614 + ], + "gamma_dfa": 0.026861276477575302, + "gamma_dfa_per_layer": [ + 0.2898082733154297, + -0.07899712026119232, + -0.046087510883808136, + -0.05727853626012802 + ], + "acc_eval": 0.302734375, + "loss_eval": 737.6731567382812, + "epoch": 97 + }, + { + "hidden_norms": [ + 8048.384765625, + 11685821.0, + 11977554.0, + 12159347.0, + 12182068.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008696588920429349, + 0.0007085675024427474, + 0.0007085754186846316, + 0.0007086056284606457, + 0.0007085986435413361 + ], + "gamma_dfa": 0.02852465771138668, + "gamma_dfa_per_layer": [ + 0.2933640480041504, + -0.07862062007188797, + -0.04777185618877411, + -0.05287294089794159 + ], + "acc_eval": 0.30859375, + "loss_eval": 716.3431396484375, + "epoch": 98 + }, + { + "hidden_norms": [ + 8047.294921875, + 11685550.0, + 11977281.0, + 12159072.0, + 12181796.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000868224713485688, + 0.0007059023482725024, + 0.0007057614857330918, + 0.0007060033385641873, + 0.0007060095085762441 + ], + "gamma_dfa": 0.026804575696587563, + "gamma_dfa_per_layer": [ + 0.2827316224575043, + -0.07767541706562042, + -0.051301658153533936, + -0.046536244451999664 + ], + "acc_eval": 0.32421875, + "loss_eval": 693.041259765625, + "epoch": 99 + }, + { + "hidden_norms": [ + 8047.01025390625, + 11685479.0, + 11977214.0, + 12159006.0, + 12181733.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008688519592396915, + 0.0007085604593157768, + 0.0007085682009346783, + 0.0007085984107106924, + 0.0007085916586220264 + ], + "gamma_dfa": 0.027284779585897923, + "gamma_dfa_per_layer": [ + 0.2883991003036499, + -0.07865853607654572, + -0.04951424151659012, + -0.05108720436692238 + ], + "acc_eval": 0.3134765625, + "loss_eval": 705.9644775390625, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s42.json b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json new file mode 100644 index 0000000..6bf0a61 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1123046875, + "loss_eval": 2.3168468475341797, + "epoch": 0 + }, + { + "hidden_norms": [ + 39.5714225769043, + 36.241031646728516, + 34.50772476196289, + 33.32059097290039, + 33.10130310058594 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001264682796318084, + 0.00013185068382881582, + 0.0001420896005583927, + 0.00016605440760031343, + 0.0002204339689342305 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4228515625, + "loss_eval": 1.6010748147964478, + "epoch": 1 + }, + { + "hidden_norms": [ + 52.47050857543945, + 48.28652572631836, + 45.496219635009766, + 43.2078857421875, + 41.36874008178711 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010761933663161471, + 0.00011420303053455427, + 0.00012131234689150006, + 0.00013399586896412075, + 0.00016239506658166647 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.453125, + "loss_eval": 1.4937903881072998, + "epoch": 2 + }, + { + "hidden_norms": [ + 62.092323303222656, + 56.274635314941406, + 52.64373016357422, + 49.852622985839844, + 46.636131286621094 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010067893890663981, + 0.00010744533210527152, + 0.000112645146145951, + 0.00012268377759028226, + 0.00014184287283569574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.46484375, + "loss_eval": 1.495908498764038, + "epoch": 3 + }, + { + "hidden_norms": [ + 70.92781829833984, + 62.570072174072266, + 57.76173400878906, + 53.9067497253418, + 49.468414306640625 + ], + "bp_grad_per_sample_l2_med": [ + 9.065420454135165e-05, + 9.659545321483165e-05, + 0.00010056291648652405, + 0.00010604548879200593, + 0.0001232008944498375 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5048828125, + "loss_eval": 1.4103548526763916, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.77008056640625, + 68.82622528076172, + 62.881927490234375, + 57.43979263305664, + 52.381675720214844 + ], + "bp_grad_per_sample_l2_med": [ + 8.967184840003029e-05, + 9.561960905557498e-05, + 9.984008647734299e-05, + 0.0001043190059135668, + 0.00011724776413757354 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5009765625, + "loss_eval": 1.3900126218795776, + "epoch": 5 + }, + { + "hidden_norms": [ + 84.3420639038086, + 73.14466094970703, + 66.25099182128906, + 60.290985107421875, + 54.196815490722656 + ], + "bp_grad_per_sample_l2_med": [ + 8.548566984245554e-05, + 9.279063669964671e-05, + 9.806034358916804e-05, + 0.00010389943781774491, + 0.00011231016833335161 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.509765625, + "loss_eval": 1.3721935749053955, + "epoch": 6 + }, + { + "hidden_norms": [ + 91.67733764648438, + 79.67963409423828, + 70.7928466796875, + 63.614192962646484, + 56.76249694824219 + ], + "bp_grad_per_sample_l2_med": [ + 8.422173414146528e-05, + 9.07716530491598e-05, + 9.6989817393478e-05, + 0.00010211832704953849, + 0.00011144059681100771 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5166015625, + "loss_eval": 1.344391107559204, + "epoch": 7 + }, + { + "hidden_norms": [ + 96.60388946533203, + 83.8042221069336, + 74.53706359863281, + 66.99102020263672, + 58.020408630371094 + ], + "bp_grad_per_sample_l2_med": [ + 8.360752690350637e-05, + 9.003488958114758e-05, + 9.634223533794284e-05, + 0.00010073634621221572, + 0.00010698751430027187 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5185546875, + "loss_eval": 1.3327906131744385, + "epoch": 8 + }, + { + "hidden_norms": [ + 101.24382781982422, + 87.08720397949219, + 76.92607116699219, + 68.23351287841797, + 59.4285888671875 + ], + "bp_grad_per_sample_l2_med": [ + 8.019094821065664e-05, + 8.715572766959667e-05, + 9.189714910462499e-05, + 9.61213736445643e-05, + 0.00010296071559423581 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.533203125, + "loss_eval": 1.3403639793395996, + "epoch": 9 + }, + { + "hidden_norms": [ + 107.04126739501953, + 91.77833557128906, + 80.73109436035156, + 70.98918914794922, + 61.11309051513672 + ], + "bp_grad_per_sample_l2_med": [ + 7.710429053986445e-05, + 8.402510866289958e-05, + 8.972393698059022e-05, + 9.477136336499825e-05, + 9.921709715854377e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5517578125, + "loss_eval": 1.3021693229675293, + "epoch": 10 + }, + { + "hidden_norms": [ + 111.9730224609375, + 94.8844985961914, + 83.01356506347656, + 72.39442443847656, + 61.61451721191406 + ], + "bp_grad_per_sample_l2_med": [ + 7.266257307492197e-05, + 8.069563045864925e-05, + 8.615722617832944e-05, + 8.979514677776024e-05, + 9.45624997257255e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5458984375, + "loss_eval": 1.298128604888916, + "epoch": 11 + }, + { + "hidden_norms": [ + 116.69439697265625, + 99.29745483398438, + 84.83220672607422, + 72.58226013183594, + 61.799560546875 + ], + "bp_grad_per_sample_l2_med": [ + 7.808519876562059e-05, + 8.509745384799317e-05, + 9.162558853859082e-05, + 9.594277798896655e-05, + 0.00010088863200508058 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5361328125, + "loss_eval": 1.327142596244812, + "epoch": 12 + }, + { + "hidden_norms": [ + 118.57154083251953, + 100.65165710449219, + 86.92396545410156, + 75.52800750732422, + 63.40058898925781 + ], + "bp_grad_per_sample_l2_med": [ + 7.507520058425143e-05, + 8.161060395650566e-05, + 8.807337144389749e-05, + 9.307889558840543e-05, + 9.839278209256008e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.301376223564148, + "epoch": 13 + }, + { + "hidden_norms": [ + 123.16495513916016, + 104.0947265625, + 90.54090118408203, + 79.24758911132812, + 66.25940704345703 + ], + "bp_grad_per_sample_l2_med": [ + 7.567028660560027e-05, + 8.223088661907241e-05, + 8.735521987546235e-05, + 9.217277693096548e-05, + 9.719380614114925e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2765182256698608, + "epoch": 14 + }, + { + "hidden_norms": [ + 126.89250946044922, + 107.54840087890625, + 93.0474853515625, + 79.41374206542969, + 66.3965835571289 + ], + "bp_grad_per_sample_l2_med": [ + 7.546511915279552e-05, + 8.2636863226071e-05, + 8.891599281923845e-05, + 9.294570190832019e-05, + 9.809954644879326e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.51953125, + "loss_eval": 1.300541877746582, + "epoch": 15 + }, + { + "hidden_norms": [ + 130.00201416015625, + 110.14152526855469, + 95.71183776855469, + 81.57356262207031, + 68.07804107666016 + ], + "bp_grad_per_sample_l2_med": [ + 7.271749927895144e-05, + 7.90783524280414e-05, + 8.341569628100842e-05, + 8.888234879123047e-05, + 9.289903391618282e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.253805160522461, + "epoch": 16 + }, + { + "hidden_norms": [ + 132.4821014404297, + 112.55132293701172, + 96.15247344970703, + 82.20439147949219, + 67.68408203125 + ], + "bp_grad_per_sample_l2_med": [ + 7.47043450246565e-05, + 8.161538426065817e-05, + 8.696810255059972e-05, + 9.05536362552084e-05, + 9.490203956374899e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5634765625, + "loss_eval": 1.2818918228149414, + "epoch": 17 + }, + { + "hidden_norms": [ + 136.31614685058594, + 116.76542663574219, + 100.04906463623047, + 85.71382141113281, + 70.02954864501953 + ], + "bp_grad_per_sample_l2_med": [ + 7.14207926648669e-05, + 7.859354082029313e-05, + 8.420498488703743e-05, + 8.882852853275836e-05, + 9.116062574321404e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5595703125, + "loss_eval": 1.2435299158096313, + "epoch": 18 + }, + { + "hidden_norms": [ + 138.36990356445312, + 117.38836669921875, + 101.75880432128906, + 86.79072570800781, + 70.66394805908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.72569328546524e-05, + 8.451085159322247e-05, + 8.929366595111787e-05, + 9.467442578170449e-05, + 9.868820779956877e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53515625, + "loss_eval": 1.3142390251159668, + "epoch": 19 + }, + { + "hidden_norms": [ + 140.71449279785156, + 119.23265838623047, + 101.22541809082031, + 85.75491333007812, + 69.77205657958984 + ], + "bp_grad_per_sample_l2_med": [ + 7.5247859058436e-05, + 8.147219341481104e-05, + 8.72978416737169e-05, + 9.33377887122333e-05, + 9.715931082610041e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.548828125, + "loss_eval": 1.26747465133667, + "epoch": 20 + }, + { + "hidden_norms": [ + 143.37794494628906, + 121.56777954101562, + 105.97654724121094, + 90.9666748046875, + 72.01183319091797 + ], + "bp_grad_per_sample_l2_med": [ + 7.179555541370064e-05, + 7.918629125924781e-05, + 8.409017755184323e-05, + 8.838798385113478e-05, + 9.469009819440544e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.564453125, + "loss_eval": 1.2752306461334229, + "epoch": 21 + }, + { + "hidden_norms": [ + 144.44107055664062, + 122.94657135009766, + 106.18299102783203, + 89.72506713867188, + 71.56814575195312 + ], + "bp_grad_per_sample_l2_med": [ + 7.250273483805358e-05, + 7.833781273802742e-05, + 8.349631389137357e-05, + 8.67474009282887e-05, + 8.975700620794669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.56640625, + "loss_eval": 1.214519739151001, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.68658447265625, + 123.7938232421875, + 107.63272857666016, + 91.90914154052734, + 72.97653198242188 + ], + "bp_grad_per_sample_l2_med": [ + 6.909506919328123e-05, + 7.67810779507272e-05, + 8.248597441706806e-05, + 8.500050898874179e-05, + 8.80209991009906e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.578125, + "loss_eval": 1.2490482330322266, + "epoch": 23 + }, + { + "hidden_norms": [ + 149.15159606933594, + 125.77446746826172, + 106.84111022949219, + 90.89909362792969, + 72.29488372802734 + ], + "bp_grad_per_sample_l2_med": [ + 7.051522698020563e-05, + 7.787953654769808e-05, + 8.355934551218525e-05, + 8.837382483761758e-05, + 9.125470387516543e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5634765625, + "loss_eval": 1.2157257795333862, + "epoch": 24 + }, + { + "hidden_norms": [ + 149.9364776611328, + 126.3508529663086, + 107.00386047363281, + 89.69956970214844, + 70.79742431640625 + ], + "bp_grad_per_sample_l2_med": [ + 7.40521791158244e-05, + 8.231549145421013e-05, + 8.598146814620122e-05, + 9.036294795805588e-05, + 9.211329597746953e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5546875, + "loss_eval": 1.2515935897827148, + "epoch": 25 + }, + { + "hidden_norms": [ + 152.33641052246094, + 127.60247039794922, + 109.31637573242188, + 91.78147888183594, + 71.85491180419922 + ], + "bp_grad_per_sample_l2_med": [ + 7.096086483215913e-05, + 7.774732512189075e-05, + 8.330845594173297e-05, + 8.756548049859703e-05, + 9.018366108648479e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.234102487564087, + "epoch": 26 + }, + { + "hidden_norms": [ + 154.90924072265625, + 129.49365234375, + 111.0758285522461, + 94.2232666015625, + 73.4395523071289 + ], + "bp_grad_per_sample_l2_med": [ + 7.217184611363336e-05, + 7.90508056525141e-05, + 8.487315790262073e-05, + 9.130351099884138e-05, + 9.386075544171035e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.2473926544189453, + "epoch": 27 + }, + { + "hidden_norms": [ + 155.88226318359375, + 130.6912384033203, + 111.4398193359375, + 93.5534896850586, + 73.1227035522461 + ], + "bp_grad_per_sample_l2_med": [ + 7.115830521797761e-05, + 7.749604992568493e-05, + 8.24403905426152e-05, + 8.617334970040247e-05, + 8.857186185196042e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5625, + "loss_eval": 1.232407569885254, + "epoch": 28 + }, + { + "hidden_norms": [ + 155.35606384277344, + 131.03033447265625, + 112.69044494628906, + 95.1001968383789, + 74.01049041748047 + ], + "bp_grad_per_sample_l2_med": [ + 7.353001274168491e-05, + 8.054459613049403e-05, + 8.64928078954108e-05, + 8.998846897156909e-05, + 9.453124948777258e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.576171875, + "loss_eval": 1.2427477836608887, + "epoch": 29 + }, + { + "hidden_norms": [ + 157.87423706054688, + 132.91993713378906, + 114.23269653320312, + 96.04922485351562, + 74.40912628173828 + ], + "bp_grad_per_sample_l2_med": [ + 7.218361861305311e-05, + 8.000781963346526e-05, + 8.621480083093047e-05, + 9.079690062208101e-05, + 9.179109474644065e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.2170917987823486, + "epoch": 30 + }, + { + "hidden_norms": [ + 159.94407653808594, + 134.98342895507812, + 116.59188842773438, + 96.52700805664062, + 74.13409423828125 + ], + "bp_grad_per_sample_l2_med": [ + 6.996722368057817e-05, + 7.723316957708448e-05, + 8.291137055493891e-05, + 8.800445357337594e-05, + 8.874708146322519e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1662731170654297, + "epoch": 31 + }, + { + "hidden_norms": [ + 159.40000915527344, + 134.68307495117188, + 115.32740783691406, + 95.89759826660156, + 73.79962158203125 + ], + "bp_grad_per_sample_l2_med": [ + 7.17860457370989e-05, + 7.931615255074576e-05, + 8.509325562044978e-05, + 8.835212793201208e-05, + 9.002821025205776e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5732421875, + "loss_eval": 1.1779483556747437, + "epoch": 32 + }, + { + "hidden_norms": [ + 160.3310089111328, + 135.494140625, + 116.1007308959961, + 96.30546569824219, + 74.54843139648438 + ], + "bp_grad_per_sample_l2_med": [ + 6.925644993316382e-05, + 7.548897701781243e-05, + 8.256838918896392e-05, + 8.621955930721015e-05, + 8.84741239133291e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1561952829360962, + "epoch": 33 + }, + { + "hidden_norms": [ + 161.94854736328125, + 135.6446075439453, + 116.58970642089844, + 96.99983978271484, + 74.31636810302734 + ], + "bp_grad_per_sample_l2_med": [ + 7.260960410349071e-05, + 8.003232505870983e-05, + 8.696899749338627e-05, + 9.040992881637067e-05, + 9.149286051979288e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1946098804473877, + "epoch": 34 + }, + { + "hidden_norms": [ + 163.52120971679688, + 138.41390991210938, + 118.427490234375, + 98.19206237792969, + 75.36811828613281 + ], + "bp_grad_per_sample_l2_med": [ + 6.831327482359484e-05, + 7.447604730259627e-05, + 7.990537415025756e-05, + 8.471667388221249e-05, + 8.780926145846024e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.184380054473877, + "epoch": 35 + }, + { + "hidden_norms": [ + 164.48324584960938, + 138.1424102783203, + 118.34252166748047, + 98.4327621459961, + 75.36869049072266 + ], + "bp_grad_per_sample_l2_med": [ + 7.150783494580537e-05, + 7.926567923277617e-05, + 8.36653562146239e-05, + 8.762039215071127e-05, + 8.95786433829926e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.2110118865966797, + "epoch": 36 + }, + { + "hidden_norms": [ + 164.0553741455078, + 138.08517456054688, + 118.49005126953125, + 98.67227172851562, + 74.64473724365234 + ], + "bp_grad_per_sample_l2_med": [ + 7.029619155218825e-05, + 7.684711454203352e-05, + 8.26816976768896e-05, + 8.846465789247304e-05, + 9.003532613860443e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1644396781921387, + "epoch": 37 + }, + { + "hidden_norms": [ + 165.32000732421875, + 138.64366149902344, + 119.2437515258789, + 99.25880432128906, + 75.45353698730469 + ], + "bp_grad_per_sample_l2_med": [ + 7.045984239084646e-05, + 7.836698205210268e-05, + 8.392294694203883e-05, + 8.778785559115931e-05, + 8.954900113167241e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.18137526512146, + "epoch": 38 + }, + { + "hidden_norms": [ + 164.7397918701172, + 138.3001251220703, + 117.6864242553711, + 97.29838562011719, + 73.79444122314453 + ], + "bp_grad_per_sample_l2_med": [ + 7.162813562899828e-05, + 7.83513969508931e-05, + 8.275063009932637e-05, + 8.855803025653586e-05, + 8.704853098606691e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.583984375, + "loss_eval": 1.1727752685546875, + "epoch": 39 + }, + { + "hidden_norms": [ + 166.1660919189453, + 138.93536376953125, + 118.51292419433594, + 97.88706970214844, + 75.51615905761719 + ], + "bp_grad_per_sample_l2_med": [ + 7.430704863509163e-05, + 8.242860349128023e-05, + 8.74657926033251e-05, + 9.10981761990115e-05, + 9.303457773057744e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1664979457855225, + "epoch": 40 + }, + { + "hidden_norms": [ + 167.8816375732422, + 140.1188201904297, + 119.77051544189453, + 99.83518981933594, + 75.69395446777344 + ], + "bp_grad_per_sample_l2_med": [ + 7.187369919847697e-05, + 7.945671677589417e-05, + 8.597246051067486e-05, + 8.931689808377996e-05, + 8.963213622337207e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.587890625, + "loss_eval": 1.19194757938385, + "epoch": 41 + }, + { + "hidden_norms": [ + 168.21185302734375, + 141.76817321777344, + 121.40872192382812, + 100.61127471923828, + 76.76028442382812 + ], + "bp_grad_per_sample_l2_med": [ + 7.174632628448308e-05, + 7.968613499542698e-05, + 8.514403452863917e-05, + 8.922909910324961e-05, + 9.091905667446554e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1679599285125732, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.2344207763672, + 140.6108856201172, + 120.0829849243164, + 99.8038330078125, + 76.13324737548828 + ], + "bp_grad_per_sample_l2_med": [ + 7.436795567627996e-05, + 8.090144547168165e-05, + 8.729894761927426e-05, + 9.00863014976494e-05, + 8.991207869257778e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.1705546379089355, + "epoch": 43 + }, + { + "hidden_norms": [ + 167.59393310546875, + 140.7035369873047, + 120.24620056152344, + 99.91508483886719, + 75.96212005615234 + ], + "bp_grad_per_sample_l2_med": [ + 7.446305971825495e-05, + 8.234894630732015e-05, + 8.821392111713067e-05, + 9.209391282638535e-05, + 9.261125524062663e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.1846892833709717, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.69448852539062, + 141.26541137695312, + 121.04974365234375, + 100.46004486083984, + 75.70881652832031 + ], + "bp_grad_per_sample_l2_med": [ + 7.222096610348672e-05, + 7.875960727687925e-05, + 8.227298530982807e-05, + 8.841860108077526e-05, + 9.022892481880262e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1577212810516357, + "epoch": 45 + }, + { + "hidden_norms": [ + 169.7440185546875, + 142.39825439453125, + 121.89653778076172, + 100.77093505859375, + 76.56221008300781 + ], + "bp_grad_per_sample_l2_med": [ + 7.555038610007614e-05, + 8.296242594951764e-05, + 9.037082054419443e-05, + 9.527869406156242e-05, + 9.701496310299262e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1768805980682373, + "epoch": 46 + }, + { + "hidden_norms": [ + 167.24928283691406, + 140.36639404296875, + 119.20468139648438, + 99.04094696044922, + 75.62102508544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.741156878182665e-05, + 8.454316412098706e-05, + 9.005220636026934e-05, + 9.321123798144981e-05, + 9.260981460101902e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.166186809539795, + "epoch": 47 + }, + { + "hidden_norms": [ + 170.72845458984375, + 142.466796875, + 120.5933837890625, + 100.26793670654297, + 76.15065002441406 + ], + "bp_grad_per_sample_l2_med": [ + 7.659869879717007e-05, + 8.334196172654629e-05, + 9.012148075271398e-05, + 9.564686479279771e-05, + 9.513212717138231e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1720219850540161, + "epoch": 48 + }, + { + "hidden_norms": [ + 169.83580017089844, + 141.82705688476562, + 121.11093139648438, + 100.64865112304688, + 76.17137145996094 + ], + "bp_grad_per_sample_l2_med": [ + 7.593600457767025e-05, + 8.458431693725288e-05, + 9.001771832117811e-05, + 9.566119115334004e-05, + 9.762388071976602e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.184555172920227, + "epoch": 49 + }, + { + "hidden_norms": [ + 168.68116760253906, + 141.1621856689453, + 119.57838439941406, + 98.55834197998047, + 75.13648223876953 + ], + "bp_grad_per_sample_l2_med": [ + 8.207417704397812e-05, + 9.170681732939556e-05, + 9.716026397654787e-05, + 0.0001007765022222884, + 0.0001005034864647314 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1981369256973267, + "epoch": 50 + }, + { + "hidden_norms": [ + 171.0980682373047, + 143.56202697753906, + 121.67494201660156, + 101.36307525634766, + 76.57723999023438 + ], + "bp_grad_per_sample_l2_med": [ + 7.634361099917442e-05, + 8.294743747683242e-05, + 8.85644112713635e-05, + 9.305671119363979e-05, + 9.303687693318352e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1646153926849365, + "epoch": 51 + }, + { + "hidden_norms": [ + 170.58717346191406, + 143.18809509277344, + 120.9772720336914, + 100.8180923461914, + 77.12872314453125 + ], + "bp_grad_per_sample_l2_med": [ + 7.599191303597763e-05, + 8.41239161673002e-05, + 8.960344712249935e-05, + 9.63989004958421e-05, + 9.756541112437844e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1623225212097168, + "epoch": 52 + }, + { + "hidden_norms": [ + 169.49244689941406, + 142.66770935058594, + 122.00574493408203, + 101.84593963623047, + 77.40425109863281 + ], + "bp_grad_per_sample_l2_med": [ + 7.701734284637496e-05, + 8.374643221031874e-05, + 9.025474719237536e-05, + 9.504661284154281e-05, + 9.925573249347508e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59765625, + "loss_eval": 1.1574187278747559, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.3027801513672, + 143.11941528320312, + 120.9614486694336, + 101.5257797241211, + 77.17151641845703 + ], + "bp_grad_per_sample_l2_med": [ + 7.559885852970183e-05, + 8.217129652621225e-05, + 8.892706682672724e-05, + 9.235734614776447e-05, + 9.276533091906458e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6015625, + "loss_eval": 1.149141788482666, + "epoch": 54 + }, + { + "hidden_norms": [ + 168.70281982421875, + 141.82730102539062, + 120.2729263305664, + 99.75395965576172, + 76.92571258544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.91895727161318e-05, + 8.787367551121861e-05, + 9.60014876909554e-05, + 0.0001018140246742405, + 9.86503655440174e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6005859375, + "loss_eval": 1.1657415628433228, + "epoch": 55 + }, + { + "hidden_norms": [ + 169.94361877441406, + 142.49684143066406, + 120.18767547607422, + 100.32206726074219, + 76.59700012207031 + ], + "bp_grad_per_sample_l2_med": [ + 7.673597428947687e-05, + 8.517439709976315e-05, + 9.201091597788036e-05, + 9.491065429756418e-05, + 9.497139399172738e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.170656442642212, + "epoch": 56 + }, + { + "hidden_norms": [ + 168.98934936523438, + 142.45361328125, + 120.9234848022461, + 101.12970733642578, + 76.8805160522461 + ], + "bp_grad_per_sample_l2_med": [ + 7.979186193551868e-05, + 8.849770529195666e-05, + 9.661864896770567e-05, + 0.00010212804772891104, + 9.96212984318845e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.153792142868042, + "epoch": 57 + }, + { + "hidden_norms": [ + 169.1288604736328, + 141.414306640625, + 119.56535339355469, + 99.89313507080078, + 76.44340515136719 + ], + "bp_grad_per_sample_l2_med": [ + 8.042863919399679e-05, + 8.848145080264658e-05, + 9.505209163762629e-05, + 0.00010096383630298078, + 9.844720625551417e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1363590955734253, + "epoch": 58 + }, + { + "hidden_norms": [ + 167.93479919433594, + 140.53518676757812, + 118.76004028320312, + 99.56035614013672, + 76.20387268066406 + ], + "bp_grad_per_sample_l2_med": [ + 8.038699888857082e-05, + 8.754427108215168e-05, + 9.549371316097677e-05, + 0.00010098952043335885, + 0.0001008743784041144 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1666439771652222, + "epoch": 59 + }, + { + "hidden_norms": [ + 168.28646850585938, + 140.67718505859375, + 118.55599975585938, + 98.98268127441406, + 75.81230163574219 + ], + "bp_grad_per_sample_l2_med": [ + 8.297240128740668e-05, + 8.875853382050991e-05, + 9.902577585307881e-05, + 0.00010285823373124003, + 0.00010488184489076957 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1589187383651733, + "epoch": 60 + }, + { + "hidden_norms": [ + 168.05776977539062, + 140.5435791015625, + 119.5470962524414, + 99.72227478027344, + 76.00287628173828 + ], + "bp_grad_per_sample_l2_med": [ + 8.011830504983664e-05, + 8.830082515487447e-05, + 9.65106810326688e-05, + 0.00010251552885165438, + 0.00010001847840612754 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.157954216003418, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.4709014892578, + 140.92843627929688, + 119.31693267822266, + 98.76548767089844, + 75.95777893066406 + ], + "bp_grad_per_sample_l2_med": [ + 8.56209808262065e-05, + 9.390609193360433e-05, + 0.00010086362453876063, + 0.00010554264736128971, + 0.00010187114821746945 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.147390365600586, + "epoch": 62 + }, + { + "hidden_norms": [ + 167.48707580566406, + 139.8479766845703, + 118.25393676757812, + 99.32323455810547, + 75.72100830078125 + ], + "bp_grad_per_sample_l2_med": [ + 8.738139877095819e-05, + 9.79254036792554e-05, + 0.00010459231998538598, + 0.00011052342597395182, + 0.00010695838136598468 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5966796875, + "loss_eval": 1.1785132884979248, + "epoch": 63 + }, + { + "hidden_norms": [ + 167.5928955078125, + 140.20948791503906, + 118.63544464111328, + 99.02739715576172, + 75.8176040649414 + ], + "bp_grad_per_sample_l2_med": [ + 8.539798727724701e-05, + 9.423612937098369e-05, + 0.00010523338278289884, + 0.00010897681931965053, + 0.00010739201388787478 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1509130001068115, + "epoch": 64 + }, + { + "hidden_norms": [ + 167.19003295898438, + 138.91221618652344, + 117.57588195800781, + 98.43026733398438, + 75.48680114746094 + ], + "bp_grad_per_sample_l2_med": [ + 8.238407463068143e-05, + 9.25329077290371e-05, + 0.00010089747956953943, + 0.00010575826308922842, + 0.00010581395326880738 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.151381254196167, + "epoch": 65 + }, + { + "hidden_norms": [ + 165.7104034423828, + 138.99298095703125, + 117.33794403076172, + 98.08374786376953, + 75.52032470703125 + ], + "bp_grad_per_sample_l2_med": [ + 8.850001177052036e-05, + 9.699742804514244e-05, + 0.00010492365981917828, + 0.00011017896758858114, + 0.00010667099559213966 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.151253581047058, + "epoch": 66 + }, + { + "hidden_norms": [ + 165.87271118164062, + 138.727783203125, + 118.21571350097656, + 97.76729583740234, + 75.68400573730469 + ], + "bp_grad_per_sample_l2_med": [ + 9.00067898328416e-05, + 9.841559221968055e-05, + 0.00010505259706405923, + 0.00010942742665065452, + 0.00010504219244467095 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1535770893096924, + "epoch": 67 + }, + { + "hidden_norms": [ + 165.17666625976562, + 138.45004272460938, + 117.10303497314453, + 97.36707305908203, + 75.38941192626953 + ], + "bp_grad_per_sample_l2_med": [ + 8.911191252991557e-05, + 9.853249503066763e-05, + 0.00010691725765354931, + 0.00011312783317407593, + 0.0001101552988984622 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59765625, + "loss_eval": 1.1582581996917725, + "epoch": 68 + }, + { + "hidden_norms": [ + 165.94325256347656, + 138.6524200439453, + 117.50881958007812, + 97.7616958618164, + 75.20433807373047 + ], + "bp_grad_per_sample_l2_med": [ + 8.616734703537077e-05, + 9.347109880764037e-05, + 0.00010103159002028406, + 0.00010616267536533996, + 0.00010419132013339549 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1453883647918701, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.7154541015625, + 138.506591796875, + 117.28874206542969, + 97.05110168457031, + 75.29759979248047 + ], + "bp_grad_per_sample_l2_med": [ + 8.980780694400892e-05, + 9.973136184271425e-05, + 0.00010883707000175491, + 0.00011757094762288034, + 0.00011409710714360699 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1474578380584717, + "epoch": 70 + }, + { + "hidden_norms": [ + 164.83221435546875, + 138.6868133544922, + 116.98916625976562, + 96.52086639404297, + 75.43351745605469 + ], + "bp_grad_per_sample_l2_med": [ + 8.988294575829059e-05, + 9.790070907911286e-05, + 0.00010740302968770266, + 0.00011267260560998693, + 0.0001108170035877265 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.143803358078003, + "epoch": 71 + }, + { + "hidden_norms": [ + 164.63592529296875, + 137.5937042236328, + 116.08668518066406, + 96.16253662109375, + 74.92699432373047 + ], + "bp_grad_per_sample_l2_med": [ + 9.160200715996325e-05, + 0.00010001687769545242, + 0.00010771892993943766, + 0.00011699824244715273, + 0.00011338551848893985 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.609375, + "loss_eval": 1.1410948038101196, + "epoch": 72 + }, + { + "hidden_norms": [ + 164.91123962402344, + 137.8173828125, + 116.79219818115234, + 96.76990509033203, + 74.76392364501953 + ], + "bp_grad_per_sample_l2_med": [ + 8.93947362783365e-05, + 9.948704246198758e-05, + 0.00010810969251906499, + 0.00011499693209771067, + 0.0001114657279686071 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1341216564178467, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.64288330078125, + 137.3013153076172, + 116.4471206665039, + 96.7668228149414, + 74.69876861572266 + ], + "bp_grad_per_sample_l2_med": [ + 8.85727204149589e-05, + 9.913302346831188e-05, + 0.00011003073450410739, + 0.00011727867240551859, + 0.00011272053234279156 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1379802227020264, + "epoch": 74 + }, + { + "hidden_norms": [ + 163.62106323242188, + 137.2855682373047, + 115.62771606445312, + 95.8958969116211, + 74.53977966308594 + ], + "bp_grad_per_sample_l2_med": [ + 8.984863961813971e-05, + 9.98539908323437e-05, + 0.00010817578731803223, + 0.00011364965030224994, + 0.00011257777805440128 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.130206823348999, + "epoch": 75 + }, + { + "hidden_norms": [ + 164.09976196289062, + 137.23387145996094, + 116.05545043945312, + 96.66761016845703, + 75.32057189941406 + ], + "bp_grad_per_sample_l2_med": [ + 8.984812302514911e-05, + 9.734687773743644e-05, + 0.00010578137880656868, + 0.00011179807916050777, + 0.0001108815340558067 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1422557830810547, + "epoch": 76 + }, + { + "hidden_norms": [ + 162.94369506835938, + 136.59678649902344, + 115.43162536621094, + 95.96286010742188, + 74.39228057861328 + ], + "bp_grad_per_sample_l2_med": [ + 9.308777953265235e-05, + 0.00010392161493655294, + 0.00011047742736991495, + 0.00011820423969766125, + 0.00011209066724404693 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1316850185394287, + "epoch": 77 + }, + { + "hidden_norms": [ + 163.14993286132812, + 136.48724365234375, + 115.7430648803711, + 96.20491790771484, + 74.71761322021484 + ], + "bp_grad_per_sample_l2_med": [ + 9.024026803672314e-05, + 0.00010025065421359614, + 0.00011008324509020895, + 0.00011521186388563365, + 0.00011174430255778134 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.1380174160003662, + "epoch": 78 + }, + { + "hidden_norms": [ + 163.56654357910156, + 136.04368591308594, + 114.58287048339844, + 95.99482727050781, + 74.26864624023438 + ], + "bp_grad_per_sample_l2_med": [ + 9.700806549517438e-05, + 0.0001051941653713584, + 0.00011597082630032673, + 0.0001224641309818253, + 0.00011469785385997966 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.1528915166854858, + "epoch": 79 + }, + { + "hidden_norms": [ + 162.7240753173828, + 135.9139862060547, + 114.86207580566406, + 95.29146575927734, + 74.25565338134766 + ], + "bp_grad_per_sample_l2_med": [ + 9.666816185927019e-05, + 0.0001055657266988419, + 0.00011615711264312267, + 0.00012476630217861384, + 0.00011797657498391345 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1539390087127686, + "epoch": 80 + }, + { + "hidden_norms": [ + 162.158203125, + 135.1398468017578, + 114.53036499023438, + 94.93306732177734, + 73.95748901367188 + ], + "bp_grad_per_sample_l2_med": [ + 9.333287016488612e-05, + 0.0001032597865560092, + 0.00011410381557652727, + 0.00012122129555791616, + 0.00011711813567671925 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1506534814834595, + "epoch": 81 + }, + { + "hidden_norms": [ + 162.415283203125, + 135.51370239257812, + 114.56376647949219, + 94.92838287353516, + 74.06205749511719 + ], + "bp_grad_per_sample_l2_med": [ + 9.082158794626594e-05, + 0.00010185714199906215, + 0.00011048805754398927, + 0.00011587562767090276, + 0.0001120776214520447 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1497812271118164, + "epoch": 82 + }, + { + "hidden_norms": [ + 161.77337646484375, + 135.19717407226562, + 114.20987701416016, + 94.77679443359375, + 73.99730682373047 + ], + "bp_grad_per_sample_l2_med": [ + 9.745426359586418e-05, + 0.00010718397970777005, + 0.00011704466305673122, + 0.00012522070028353482, + 0.00012164646614110097 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.155759572982788, + "epoch": 83 + }, + { + "hidden_norms": [ + 161.48892211914062, + 135.2348175048828, + 114.12451171875, + 94.8083267211914, + 73.4517822265625 + ], + "bp_grad_per_sample_l2_med": [ + 9.549259266350418e-05, + 0.00010579569061519578, + 0.00011430429003667086, + 0.00012098137813154608, + 0.00011664297198876739 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.15834379196167, + "epoch": 84 + }, + { + "hidden_norms": [ + 161.6995849609375, + 135.2989959716797, + 114.2784194946289, + 94.69004821777344, + 73.529541015625 + ], + "bp_grad_per_sample_l2_med": [ + 9.579937614034861e-05, + 0.00010731106885941699, + 0.00011613505921559408, + 0.00012203569349367172, + 0.00011712868581525981 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1583144664764404, + "epoch": 85 + }, + { + "hidden_norms": [ + 161.00369262695312, + 134.7657012939453, + 114.10606384277344, + 94.362060546875, + 73.65673065185547 + ], + "bp_grad_per_sample_l2_med": [ + 9.818092075875029e-05, + 0.00010859747999347746, + 0.00011724254727596417, + 0.00012138402962591499, + 0.00011800935317296535 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1536951065063477, + "epoch": 86 + }, + { + "hidden_norms": [ + 161.0053253173828, + 134.59410095214844, + 113.69575500488281, + 94.29032135009766, + 73.46531677246094 + ], + "bp_grad_per_sample_l2_med": [ + 9.722611866891384e-05, + 0.00010765776823973283, + 0.0001188350870506838, + 0.00012322816473897547, + 0.00011940464901272207 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.15749192237854, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.33126831054688, + 134.94166564941406, + 113.90135955810547, + 94.50862884521484, + 73.39297485351562 + ], + "bp_grad_per_sample_l2_med": [ + 9.938049333868548e-05, + 0.0001076548287528567, + 0.00011934098438359797, + 0.00012375488586258143, + 0.00011877582437591627 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.157106637954712, + "epoch": 88 + }, + { + "hidden_norms": [ + 161.05789184570312, + 134.59825134277344, + 113.87554931640625, + 94.37042999267578, + 73.5987548828125 + ], + "bp_grad_per_sample_l2_med": [ + 9.70072578638792e-05, + 0.00010533058957662433, + 0.00011765053932322189, + 0.00012162782513769343, + 0.00012223162048030645 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.1565823554992676, + "epoch": 89 + }, + { + "hidden_norms": [ + 160.39405822753906, + 134.43434143066406, + 113.540283203125, + 94.05237579345703, + 73.39077758789062 + ], + "bp_grad_per_sample_l2_med": [ + 9.608148684492335e-05, + 0.00010612589539960027, + 0.00011680866009555757, + 0.00012219352356623858, + 0.00011590561916818842 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1539617776870728, + "epoch": 90 + }, + { + "hidden_norms": [ + 160.60440063476562, + 134.6214141845703, + 113.45699310302734, + 93.85929870605469, + 73.18849182128906 + ], + "bp_grad_per_sample_l2_med": [ + 9.81277771643363e-05, + 0.00010970587754854932, + 0.00011871931201312691, + 0.00012303274706937373, + 0.00011832414020318538 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1519787311553955, + "epoch": 91 + }, + { + "hidden_norms": [ + 160.69932556152344, + 134.37420654296875, + 113.30387115478516, + 93.87930297851562, + 73.2369384765625 + ], + "bp_grad_per_sample_l2_med": [ + 9.748790762387216e-05, + 0.00010789754742290825, + 0.00011884274135809392, + 0.00012259349750820547, + 0.00012160756887169555 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1536774635314941, + "epoch": 92 + }, + { + "hidden_norms": [ + 160.83596801757812, + 134.3319854736328, + 113.4552230834961, + 94.0063705444336, + 73.16248321533203 + ], + "bp_grad_per_sample_l2_med": [ + 9.70613255049102e-05, + 0.00010844107600860298, + 0.0001184809225378558, + 0.00012342457193881273, + 0.00011970168998232111 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.152658462524414, + "epoch": 93 + }, + { + "hidden_norms": [ + 160.8366241455078, + 134.48265075683594, + 113.25139617919922, + 93.83488464355469, + 73.08296203613281 + ], + "bp_grad_per_sample_l2_med": [ + 9.66933585004881e-05, + 0.00010815998393809423, + 0.00011774426093325019, + 0.0001224545994773507, + 0.00011890953464899212 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6181640625, + "loss_eval": 1.1551861763000488, + "epoch": 94 + }, + { + "hidden_norms": [ + 160.7191162109375, + 134.44659423828125, + 113.33219146728516, + 93.93790435791016, + 73.0753402709961 + ], + "bp_grad_per_sample_l2_med": [ + 9.675837645772845e-05, + 0.00010675707017071545, + 0.00011643637844827026, + 0.00012197842443129048, + 0.0001190306429634802 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.15492582321167, + "epoch": 95 + }, + { + "hidden_norms": [ + 160.51898193359375, + 134.29307556152344, + 113.27383422851562, + 94.04198455810547, + 73.003662109375 + ], + "bp_grad_per_sample_l2_med": [ + 9.737682557897642e-05, + 0.00010710594506235793, + 0.00011601457663346082, + 0.0001232696376973763, + 0.0001181336774607189 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1535921096801758, + "epoch": 96 + }, + { + "hidden_norms": [ + 160.5992431640625, + 134.43368530273438, + 113.30790710449219, + 94.0107192993164, + 73.01823425292969 + ], + "bp_grad_per_sample_l2_med": [ + 9.668481652624905e-05, + 0.00010705058230087161, + 0.0001163838169304654, + 0.0001232351060025394, + 0.00011791065480792895 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.1539404392242432, + "epoch": 97 + }, + { + "hidden_norms": [ + 160.6013946533203, + 134.46824645996094, + 113.25690460205078, + 93.99237060546875, + 73.00788879394531 + ], + "bp_grad_per_sample_l2_med": [ + 9.74524809862487e-05, + 0.00010689684131648391, + 0.00011608003114815801, + 0.00012245487596374005, + 0.00011877176439156756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.1537361145019531, + "epoch": 98 + }, + { + "hidden_norms": [ + 160.6110076904297, + 134.44720458984375, + 113.29548645019531, + 93.96721649169922, + 72.96358489990234 + ], + "bp_grad_per_sample_l2_med": [ + 9.775274520507082e-05, + 0.00010722322622314095, + 0.00011578563862713054, + 0.00012414308730512857, + 0.00011851716408273205 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1537935733795166, + "epoch": 99 + }, + { + "hidden_norms": [ + 160.61090087890625, + 134.45262145996094, + 113.2977066040039, + 93.9543685913086, + 72.96540069580078 + ], + "bp_grad_per_sample_l2_med": [ + 9.751630568644032e-05, + 0.00010700579878175631, + 0.00011575232201721519, + 0.0001240932324435562, + 0.00011847950372612104 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.153747320175171, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "gamma_dfa": 0.008468771702609956, + "gamma_dfa_per_layer": [ + 0.0002397641073912382, + 0.021293632686138153, + -0.0031478723976761103, + 0.015489562414586544 + ], + "acc_eval": 0.1123046875, + "loss_eval": 2.3168468475341797, + "epoch": 0 + }, + { + "hidden_norms": [ + 481.5912780761719, + 951.0988159179688, + 1076.1094970703125, + 1320.2431640625, + 1560.1331787109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006860869470983744, + 0.000686013896483928, + 0.0006859428831376135, + 0.0006858126726001501, + 0.0006857643602415919 + ], + "gamma_dfa": 0.008383387292269617, + "gamma_dfa_per_layer": [ + 0.030579306185245514, + 0.012463560327887535, + -0.009617818519473076, + 0.00010850117541849613 + ], + "acc_eval": 0.1494140625, + "loss_eval": 6.441287040710449, + "epoch": 1 + }, + { + "hidden_norms": [ + 803.455322265625, + 1877.8646240234375, + 2352.25390625, + 2999.778564453125, + 3690.3037109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007094781612977386, + 0.0007074660388752818, + 0.0007073783199302852, + 0.0007076358306221664, + 0.0007076164474710822 + ], + "gamma_dfa": -0.002415801805909723, + "gamma_dfa_per_layer": [ + 0.04413381963968277, + -0.0021541656460613012, + -0.028202872723340988, + -0.023439988493919373 + ], + "acc_eval": 0.236328125, + "loss_eval": 9.331591606140137, + "epoch": 2 + }, + { + "hidden_norms": [ + 1023.6770629882812, + 2787.596923828125, + 3518.2734375, + 4732.96337890625, + 6139.98486328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007535111508332193, + 0.00075019511859864, + 0.0007504230597987771, + 0.0007509100250899792, + 0.0007509145070798695 + ], + "gamma_dfa": -0.004518487432505935, + "gamma_dfa_per_layer": [ + 0.049626171588897705, + -0.0017164160963147879, + -0.029111474752426147, + -0.03687223047018051 + ], + "acc_eval": 0.1943359375, + "loss_eval": 33.82752990722656, + "epoch": 3 + }, + { + "hidden_norms": [ + 1163.0250244140625, + 3340.40087890625, + 4668.20654296875, + 6551.25927734375, + 8839.166015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007571951719000936, + 0.0007542021339759231, + 0.0007538797217421234, + 0.0007539798971265554, + 0.0007538445643149316 + ], + "gamma_dfa": -0.0057786391116678715, + "gamma_dfa_per_layer": [ + 0.06502002477645874, + -0.02495962381362915, + -0.035328082740306854, + -0.02784687466919422 + ], + "acc_eval": 0.1875, + "loss_eval": 50.81904983520508, + "epoch": 4 + }, + { + "hidden_norms": [ + 1288.871337890625, + 3822.7880859375, + 5365.59130859375, + 7605.025390625, + 10502.0478515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007548240246251225, + 0.0007521823281422257, + 0.0007521542138420045, + 0.00075240881415084, + 0.0007523542735725641 + ], + "gamma_dfa": -0.006262022419832647, + "gamma_dfa_per_layer": [ + 0.0670417994260788, + -0.00757558410987258, + -0.044654928147792816, + -0.03985937684774399 + ], + "acc_eval": 0.1748046875, + "loss_eval": 41.77630615234375, + "epoch": 5 + }, + { + "hidden_norms": [ + 1393.3045654296875, + 4566.75341796875, + 6398.4619140625, + 9144.8193359375, + 12855.005859375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007480952190235257, + 0.0007420883048325777, + 0.0007418331224471331, + 0.0007423029164783657, + 0.0007423472707159817 + ], + "gamma_dfa": -0.012987596448510885, + "gamma_dfa_per_layer": [ + 0.07368794828653336, + -0.022242246195673943, + -0.04769526422023773, + -0.05570082366466522 + ], + "acc_eval": 0.2255859375, + "loss_eval": 34.67824172973633, + "epoch": 6 + }, + { + "hidden_norms": [ + 1492.14599609375, + 4914.71142578125, + 7309.0888671875, + 10380.2900390625, + 14994.3798828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007586176507174969, + 0.0007474496378563344, + 0.0007472135475836694, + 0.0007474484154954553, + 0.0007475449237972498 + ], + "gamma_dfa": -0.009481166722252965, + "gamma_dfa_per_layer": [ + 0.07966121286153793, + -0.014550731517374516, + -0.05317254737019539, + -0.04986260086297989 + ], + "acc_eval": 0.2265625, + "loss_eval": 47.53326416015625, + "epoch": 7 + }, + { + "hidden_norms": [ + 1561.8521728515625, + 5346.5771484375, + 8036.01171875, + 11400.638671875, + 16846.158203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007513429154641926, + 0.000743337906897068, + 0.0007433209684677422, + 0.0007435117149725556, + 0.0007433460559695959 + ], + "gamma_dfa": -0.020332499407231808, + "gamma_dfa_per_layer": [ + 0.07914174348115921, + -0.03499722480773926, + -0.0528150238096714, + -0.07265949249267578 + ], + "acc_eval": 0.203125, + "loss_eval": 44.3652458190918, + "epoch": 8 + }, + { + "hidden_norms": [ + 1634.708740234375, + 5771.3779296875, + 9056.50390625, + 14017.43359375, + 18666.166015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007612781482748687, + 0.000746309058740735, + 0.0007445007795467973, + 0.000742616830393672, + 0.000742737902328372 + ], + "gamma_dfa": -0.02017525304108858, + "gamma_dfa_per_layer": [ + 0.07873347401618958, + -0.0398627370595932, + -0.05772021412849426, + -0.061851534992456436 + ], + "acc_eval": 0.1962890625, + "loss_eval": 76.75175476074219, + "epoch": 9 + }, + { + "hidden_norms": [ + 1703.975830078125, + 6538.35400390625, + 10825.435546875, + 18506.091796875, + 22004.94140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007676634704694152, + 0.0007641310803592205, + 0.0007641207776032388, + 0.0007640842813998461, + 0.0007641611155122519 + ], + "gamma_dfa": -0.016695345751941204, + "gamma_dfa_per_layer": [ + 0.08918984234333038, + -0.029809486120939255, + -0.06516598165035248, + -0.06099575757980347 + ], + "acc_eval": 0.14453125, + "loss_eval": 82.11173248291016, + "epoch": 10 + }, + { + "hidden_norms": [ + 1742.7552490234375, + 10617.021484375, + 14353.39453125, + 26320.365234375, + 29618.58984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007739505381323397, + 0.0007467114483006299, + 0.0007445442606694996, + 0.0007397353765554726, + 0.0007397329318337142 + ], + "gamma_dfa": -0.01567553821951151, + "gamma_dfa_per_layer": [ + 0.08600987493991852, + -0.03431041166186333, + -0.056060850620269775, + -0.05834076553583145 + ], + "acc_eval": 0.1943359375, + "loss_eval": 223.91172790527344, + "epoch": 11 + }, + { + "hidden_norms": [ + 1824.1932373046875, + 15453.6865234375, + 18834.18359375, + 34960.33984375, + 37989.41796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007750834338366985, + 0.0007619780953973532, + 0.0007621922995895147, + 0.0007620578981004655, + 0.0007621044642291963 + ], + "gamma_dfa": -0.010786167811602354, + "gamma_dfa_per_layer": [ + 0.12150975316762924, + -0.02778821997344494, + -0.057943932712078094, + -0.07892227172851562 + ], + "acc_eval": 0.2236328125, + "loss_eval": 176.59576416015625, + "epoch": 12 + }, + { + "hidden_norms": [ + 1874.6923828125, + 24413.89453125, + 27520.30859375, + 49373.3984375, + 52416.24609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007790470262989402, + 0.0007622907287441194, + 0.0007622726843692362, + 0.0007622543489560485, + 0.0007623030105605721 + ], + "gamma_dfa": -0.014462455175817013, + "gamma_dfa_per_layer": [ + 0.12855470180511475, + -0.04145955294370651, + -0.05751717463135719, + -0.08742779493331909 + ], + "acc_eval": 0.1787109375, + "loss_eval": 262.8403625488281, + "epoch": 13 + }, + { + "hidden_norms": [ + 1946.8936767578125, + 36272.8125, + 40333.21875, + 69530.5, + 73388.2890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008108754991553724, + 0.0007635678630322218, + 0.0007621092372573912, + 0.0007623478886671364, + 0.0007624892168678343 + ], + "gamma_dfa": -0.0001736646518111229, + "gamma_dfa_per_layer": [ + 0.17327094078063965, + -0.03242593631148338, + -0.06580278277397156, + -0.0757368803024292 + ], + "acc_eval": 0.203125, + "loss_eval": 413.348876953125, + "epoch": 14 + }, + { + "hidden_norms": [ + 2032.87255859375, + 51780.58984375, + 56919.1484375, + 94829.1484375, + 100403.8828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008237292058765888, + 0.0007614542846567929, + 0.0007608170853927732, + 0.0007589491433463991, + 0.0007590141030959785 + ], + "gamma_dfa": -0.011795124970376492, + "gamma_dfa_per_layer": [ + 0.1382066011428833, + -0.05588943883776665, + -0.061218664050102234, + -0.06827899813652039 + ], + "acc_eval": 0.173828125, + "loss_eval": 476.64752197265625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2114.94287109375, + 69492.1875, + 75388.1796875, + 119789.3125, + 127585.7109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000832556514069438, + 0.0007537039346061647, + 0.000749573518987745, + 0.0007496002363041043, + 0.0007496204925701022 + ], + "gamma_dfa": 0.0006226245313882828, + "gamma_dfa_per_layer": [ + 0.18075576424598694, + -0.03305089473724365, + -0.06780679523944855, + -0.07740757614374161 + ], + "acc_eval": 0.1982421875, + "loss_eval": 537.6473388671875, + "epoch": 16 + }, + { + "hidden_norms": [ + 2253.870849609375, + 95625.234375, + 102645.28125, + 154236.78125, + 164149.109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008362202788703144, + 0.0007716236286796629, + 0.0007702361326664686, + 0.0007688606856390834, + 0.0007688601035624743 + ], + "gamma_dfa": 0.0006011892110109329, + "gamma_dfa_per_layer": [ + 0.16114464402198792, + -0.029663734138011932, + -0.06491248309612274, + -0.06416366994380951 + ], + "acc_eval": 0.1640625, + "loss_eval": 581.9083251953125, + "epoch": 17 + }, + { + "hidden_norms": [ + 2351.805419921875, + 125897.7421875, + 133955.1875, + 192500.78125, + 204528.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009331249166280031, + 0.0007676270324736834, + 0.000767629942856729, + 0.0007676497916691005, + 0.0007678864640183747 + ], + "gamma_dfa": 0.0174247776158154, + "gamma_dfa_per_layer": [ + 0.2389061450958252, + -0.028650319203734398, + -0.08226999640464783, + -0.058286719024181366 + ], + "acc_eval": 0.18359375, + "loss_eval": 913.2538452148438, + "epoch": 18 + }, + { + "hidden_norms": [ + 2513.170166015625, + 162182.9375, + 171449.59375, + 239781.78125, + 254673.765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010568156139925122, + 0.0007681881543248892, + 0.0007537052151747048, + 0.0007537882192991674, + 0.0007537372293882072 + ], + "gamma_dfa": -0.005793072283267975, + "gamma_dfa_per_layer": [ + 0.16605031490325928, + -0.03780411183834076, + -0.07320450246334076, + -0.07821398973464966 + ], + "acc_eval": 0.16796875, + "loss_eval": 1265.55859375, + "epoch": 19 + }, + { + "hidden_norms": [ + 2644.6826171875, + 207142.84375, + 218342.21875, + 296423.21875, + 314992.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011496657971292734, + 0.0007783269393257797, + 0.0007782486500218511, + 0.0007782430038787425, + 0.0007782124448567629 + ], + "gamma_dfa": 0.0026588989421725273, + "gamma_dfa_per_layer": [ + 0.23294636607170105, + -0.04264959320425987, + -0.083626389503479, + -0.09603478759527206 + ], + "acc_eval": 0.20703125, + "loss_eval": 1426.623046875, + "epoch": 20 + }, + { + "hidden_norms": [ + 2796.434814453125, + 252884.71875, + 265445.65625, + 352069.8125, + 373355.1875 + ], + "bp_grad_per_sample_l2_med": [ + 0.001035262132063508, + 0.0007528892601840198, + 0.0007526214467361569, + 0.0007527145207859576, + 0.0007528204005211592 + ], + "gamma_dfa": 0.006789525970816612, + "gamma_dfa_per_layer": [ + 0.22278103232383728, + -0.04876326024532318, + -0.07404369860887527, + -0.07281596958637238 + ], + "acc_eval": 0.1640625, + "loss_eval": 1487.587158203125, + "epoch": 21 + }, + { + "hidden_norms": [ + 2927.763671875, + 309847.03125, + 323644.75, + 419166.875, + 443365.71875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010502212680876255, + 0.0007627566810697317, + 0.0007627056329511106, + 0.000762629380915314, + 0.0007625716971233487 + ], + "gamma_dfa": 0.02364537864923477, + "gamma_dfa_per_layer": [ + 0.29678860306739807, + -0.041244715452194214, + -0.08115403354167938, + -0.07980833947658539 + ], + "acc_eval": 0.169921875, + "loss_eval": 920.2720947265625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3096.798583984375, + 369599.1875, + 385129.65625, + 491132.78125, + 518903.8125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001009905245155096, + 0.0007581011741422117, + 0.0007581054233014584, + 0.0007580683450214565, + 0.0007581928512081504 + ], + "gamma_dfa": 0.003264583647251129, + "gamma_dfa_per_layer": [ + 0.2218201905488968, + -0.04958157241344452, + -0.07964619994163513, + -0.07953408360481262 + ], + "acc_eval": 0.2001953125, + "loss_eval": 1496.309814453125, + "epoch": 23 + }, + { + "hidden_norms": [ + 3268.982666015625, + 428585.28125, + 445459.5625, + 561163.625, + 592376.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001033863751217723, + 0.0007647433667443693, + 0.0007646661251783371, + 0.0007653636857867241, + 0.0007653713691979647 + ], + "gamma_dfa": -0.0003395974636077881, + "gamma_dfa_per_layer": [ + 0.2477388083934784, + -0.05594494938850403, + -0.08699506521224976, + -0.10615718364715576 + ], + "acc_eval": 0.1669921875, + "loss_eval": 1579.9014892578125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3455.88134765625, + 503646.0, + 521880.0, + 646881.0, + 681678.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001110030454583466, + 0.000788405304774642, + 0.0007884047226980329, + 0.0007886688108555973, + 0.0007884959923103452 + ], + "gamma_dfa": 0.03397770132869482, + "gamma_dfa_per_layer": [ + 0.325829416513443, + -0.034700896590948105, + -0.09419499337673187, + -0.061022721230983734 + ], + "acc_eval": 0.1572265625, + "loss_eval": 3785.62744140625, + "epoch": 25 + }, + { + "hidden_norms": [ + 3642.92626953125, + 585772.8125, + 606436.25, + 744826.125, + 783648.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014668661169707775, + 0.0007638748502358794, + 0.000763841497246176, + 0.0007643977296538651, + 0.000764367519877851 + ], + "gamma_dfa": 0.01312381774187088, + "gamma_dfa_per_layer": [ + 0.23922428488731384, + -0.0393734946846962, + -0.07718683779239655, + -0.07016868144273758 + ], + "acc_eval": 0.232421875, + "loss_eval": 4151.03466796875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3766.637939453125, + 680946.4375, + 702914.3125, + 850315.25, + 892276.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012596967862918973, + 0.0007629106985405087, + 0.0007628659950569272, + 0.0007628875900991261, + 0.0007628927705809474 + ], + "gamma_dfa": 0.034322043880820274, + "gamma_dfa_per_layer": [ + 0.2786872386932373, + -0.04257660359144211, + -0.046638332307338715, + -0.052184127271175385 + ], + "acc_eval": 0.1396484375, + "loss_eval": 3629.718017578125, + "epoch": 27 + }, + { + "hidden_norms": [ + 3968.325927734375, + 788450.875, + 812297.0625, + 972239.1875, + 1018608.3125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001368838595226407, + 0.0007680156268179417, + 0.0007679847767576575, + 0.0007678329711779952, + 0.0007678261026740074 + ], + "gamma_dfa": -0.004100106656551361, + "gamma_dfa_per_layer": [ + 0.2793079614639282, + -0.07087238132953644, + -0.09966391324996948, + -0.12517209351062775 + ], + "acc_eval": 0.0908203125, + "loss_eval": 4779.9248046875, + "epoch": 28 + }, + { + "hidden_norms": [ + 4129.07666015625, + 894723.3125, + 920476.5, + 1091407.125, + 1142044.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012168982066214085, + 0.0007647873135283589, + 0.0007647885358892381, + 0.0007647658349014819, + 0.0007648474420420825 + ], + "gamma_dfa": 0.008089051581919193, + "gamma_dfa_per_layer": [ + 0.24180662631988525, + -0.05241226777434349, + -0.08961856365203857, + -0.06741958856582642 + ], + "acc_eval": 0.2158203125, + "loss_eval": 4783.03515625, + "epoch": 29 + }, + { + "hidden_norms": [ + 4306.06396484375, + 1029326.875, + 1057140.5, + 1242169.625, + 1298018.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011723857605829835, + 0.0007771517848595977, + 0.000777057372033596, + 0.0007771223317831755, + 0.0007771406089887023 + ], + "gamma_dfa": 0.039280178025364876, + "gamma_dfa_per_layer": [ + 0.3913160562515259, + -0.04802073538303375, + -0.09416519105434418, + -0.09200941771268845 + ], + "acc_eval": 0.1298828125, + "loss_eval": 3595.0546875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4460.63916015625, + 1158344.75, + 1187641.625, + 1385118.375, + 1445341.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001693590427748859, + 0.0007734080427326262, + 0.0007734334794804454, + 0.0007733569364063442, + 0.0007734467508271337 + ], + "gamma_dfa": 0.023572785779833794, + "gamma_dfa_per_layer": [ + 0.2822916507720947, + -0.054915353655815125, + -0.06488456577062607, + -0.06820058822631836 + ], + "acc_eval": 0.1728515625, + "loss_eval": 4587.541015625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4647.95556640625, + 1300320.625, + 1331227.625, + 1539845.25, + 1603645.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012949237134307623, + 0.0007672033389098942, + 0.000767192745115608, + 0.0007670199265703559, + 0.0007670176564715803 + ], + "gamma_dfa": 0.004104164429008961, + "gamma_dfa_per_layer": [ + 0.2596903145313263, + -0.053032513707876205, + -0.0918058454990387, + -0.09843529760837555 + ], + "acc_eval": 0.236328125, + "loss_eval": 3593.60400390625, + "epoch": 32 + }, + { + "hidden_norms": [ + 4817.267578125, + 1453979.25, + 1486502.375, + 1706268.875, + 1774371.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014480708632618189, + 0.0007800625753588974, + 0.000779640453401953, + 0.0007796672289259732, + 0.000779696914833039 + ], + "gamma_dfa": 0.02201501652598381, + "gamma_dfa_per_layer": [ + 0.310447633266449, + -0.051143430173397064, + -0.08497071266174316, + -0.0862734243273735 + ], + "acc_eval": 0.1708984375, + "loss_eval": 5472.59521484375, + "epoch": 33 + }, + { + "hidden_norms": [ + 4990.40625, + 1611329.25, + 1646018.625, + 1880434.25, + 1953768.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018194144358858466, + 0.000765332777518779, + 0.0007653048378415406, + 0.0007655462250113487, + 0.0007656100788153708 + ], + "gamma_dfa": 0.033283455297350883, + "gamma_dfa_per_layer": [ + 0.3083266317844391, + -0.04947835952043533, + -0.06329820305109024, + -0.06241624802350998 + ], + "acc_eval": 0.2021484375, + "loss_eval": 4069.216796875, + "epoch": 34 + }, + { + "hidden_norms": [ + 5174.12255859375, + 1781529.0, + 1818275.25, + 2064802.5, + 2142905.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015505037736147642, + 0.0007980199297890067, + 0.0007979664951562881, + 0.0007982755196280777, + 0.000798304914496839 + ], + "gamma_dfa": 0.019624613225460052, + "gamma_dfa_per_layer": [ + 0.3409179449081421, + -0.05889412760734558, + -0.10494701564311981, + -0.09857834875583649 + ], + "acc_eval": 0.099609375, + "loss_eval": 8309.7119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5347.279296875, + 1968104.0, + 2006811.625, + 2265948.5, + 2349278.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001387596596032381, + 0.0007817883160896599, + 0.0007816275465302169, + 0.000781797047238797, + 0.0007817737059667706 + ], + "gamma_dfa": 0.000422419048845768, + "gamma_dfa_per_layer": [ + 0.25772032141685486, + -0.06083279475569725, + -0.09708747267723083, + -0.0981103777885437 + ], + "acc_eval": 0.1689453125, + "loss_eval": 4254.474609375, + "epoch": 36 + }, + { + "hidden_norms": [ + 5501.59130859375, + 2140827.0, + 2181494.0, + 2452387.75, + 2540377.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001305495505221188, + 0.0007833651034161448, + 0.0007831369293853641, + 0.0007831998518668115, + 0.0007831742987036705 + ], + "gamma_dfa": 0.019166686572134495, + "gamma_dfa_per_layer": [ + 0.3015354871749878, + -0.04834163561463356, + -0.08644455671310425, + -0.090082548558712 + ], + "acc_eval": 0.2060546875, + "loss_eval": 7909.48291015625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5605.65625, + 2338654.5, + 2381249.75, + 2662644.5, + 2754823.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001968128141015768, + 0.0008015396306291223, + 0.0008015292696654797, + 0.0008016829378902912, + 0.0008016840438358486 + ], + "gamma_dfa": 0.01810804195702076, + "gamma_dfa_per_layer": [ + 0.352972149848938, + -0.05855761468410492, + -0.11013064533472061, + -0.11185172200202942 + ], + "acc_eval": 0.091796875, + "loss_eval": 9552.5458984375, + "epoch": 38 + }, + { + "hidden_norms": [ + 5776.4921875, + 2524649.5, + 2569209.25, + 2862403.25, + 2959360.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001521907513961196, + 0.0007685177261009812, + 0.0007685192977078259, + 0.0007685712771490216, + 0.0007685913005843759 + ], + "gamma_dfa": 0.006301743909716606, + "gamma_dfa_per_layer": [ + 0.3194616436958313, + -0.07331519573926926, + -0.09753184020519257, + -0.12340763211250305 + ], + "acc_eval": 0.123046875, + "loss_eval": 9288.3515625, + "epoch": 39 + }, + { + "hidden_norms": [ + 5893.2958984375, + 2719236.25, + 2766489.0, + 3076192.25, + 3179584.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.001874743727967143, + 0.0007690778584219515, + 0.0007690794300287962, + 0.000769136706367135, + 0.000769163656514138 + ], + "gamma_dfa": -0.008455535396933556, + "gamma_dfa_per_layer": [ + 0.27458086609840393, + -0.07574597001075745, + -0.10251512378454208, + -0.13014191389083862 + ], + "acc_eval": 0.1015625, + "loss_eval": 9500.7265625, + "epoch": 40 + }, + { + "hidden_norms": [ + 6037.26904296875, + 2917167.0, + 2966218.0, + 3287947.75, + 3395999.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015074120601639152, + 0.0007870618137530982, + 0.0007870634435676038, + 0.00078706128988415, + 0.0007870564586482942 + ], + "gamma_dfa": 0.003465494140982628, + "gamma_dfa_per_layer": [ + 0.23106470704078674, + -0.04510585218667984, + -0.1033426821231842, + -0.06875419616699219 + ], + "acc_eval": 0.1484375, + "loss_eval": 13665.34375, + "epoch": 41 + }, + { + "hidden_norms": [ + 6165.3271484375, + 3150321.25, + 3201845.5, + 3537869.5, + 3651609.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0038438383489847183, + 0.0007633256609551609, + 0.0007633093046024442, + 0.0007634069188497961, + 0.0007634120993316174 + ], + "gamma_dfa": 0.05023553688079119, + "gamma_dfa_per_layer": [ + 0.36768630146980286, + -0.05948590859770775, + -0.06263985484838486, + -0.0446183905005455 + ], + "acc_eval": 0.130859375, + "loss_eval": 15518.396484375, + "epoch": 42 + }, + { + "hidden_norms": [ + 6322.185546875, + 3356179.75, + 3409150.0, + 3756998.75, + 3874858.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017886407440528274, + 0.0007953053573146462, + 0.000795268511865288, + 0.0007953139720484614, + 0.0007953820750117302 + ], + "gamma_dfa": -0.004728740081191063, + "gamma_dfa_per_layer": [ + 0.26050812005996704, + -0.07150034606456757, + -0.10889407992362976, + -0.09902865439653397 + ], + "acc_eval": 0.1474609375, + "loss_eval": 13731.47265625, + "epoch": 43 + }, + { + "hidden_norms": [ + 6455.05615234375, + 3581075.75, + 3636212.25, + 3997916.75, + 4121800.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014103130670264363, + 0.0008020435925573111, + 0.0008020424866117537, + 0.0008023462723940611, + 0.0008024003473110497 + ], + "gamma_dfa": 0.03236876800656319, + "gamma_dfa_per_layer": [ + 0.3784361481666565, + -0.05973149091005325, + -0.09747618436813354, + -0.09175340086221695 + ], + "acc_eval": 0.1396484375, + "loss_eval": 8173.1318359375, + "epoch": 44 + }, + { + "hidden_norms": [ + 6596.92529296875, + 3790696.25, + 3847633.75, + 4219067.0, + 4346740.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001376444473862648, + 0.0007939717615954578, + 0.0007933968445286155, + 0.0007933415472507477, + 0.0007934658788144588 + ], + "gamma_dfa": 0.026161080226302147, + "gamma_dfa_per_layer": [ + 0.35278040170669556, + -0.07518108189105988, + -0.09520787000656128, + -0.07774712890386581 + ], + "acc_eval": 0.158203125, + "loss_eval": 10093.57421875, + "epoch": 45 + }, + { + "hidden_norms": [ + 6752.326171875, + 4013893.75, + 4072463.0, + 4456049.5, + 4588960.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016587942373007536, + 0.000801959540694952, + 0.0008019180968403816, + 0.0008022981346584857, + 0.0008023587288334966 + ], + "gamma_dfa": 0.0014634709805250168, + "gamma_dfa_per_layer": [ + 0.26356324553489685, + -0.05649265646934509, + -0.09903856366872787, + -0.10217814147472382 + ], + "acc_eval": 0.16796875, + "loss_eval": 11805.994140625, + "epoch": 46 + }, + { + "hidden_norms": [ + 6883.87158203125, + 4249640.0, + 4310267.0, + 4705052.0, + 4842379.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017551308264955878, + 0.0007804373744875193, + 0.0007804358028806746, + 0.0007804319611750543, + 0.0007804720080457628 + ], + "gamma_dfa": -0.00971926562488079, + "gamma_dfa_per_layer": [ + 0.23957225680351257, + -0.06951768696308136, + -0.09375166893005371, + -0.11517996340990067 + ], + "acc_eval": 0.16015625, + "loss_eval": 19465.8828125, + "epoch": 47 + }, + { + "hidden_norms": [ + 7004.37841796875, + 4461495.0, + 4523850.0, + 4930553.5, + 5072236.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015129564562812448, + 0.0007847726810723543, + 0.0007845073123462498, + 0.000784386123996228, + 0.0007843819330446422 + ], + "gamma_dfa": 0.0085066519677639, + "gamma_dfa_per_layer": [ + 0.2637098431587219, + -0.05605460703372955, + -0.08905251324176788, + -0.08457611501216888 + ], + "acc_eval": 0.2021484375, + "loss_eval": 7892.26611328125, + "epoch": 48 + }, + { + "hidden_norms": [ + 7112.80078125, + 4708139.0, + 4772392.0, + 5193498.0, + 5341091.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015166979283094406, + 0.0007669071783311665, + 0.0007669082842767239, + 0.0007670924533158541, + 0.0007671677158214152 + ], + "gamma_dfa": 0.015125783160328865, + "gamma_dfa_per_layer": [ + 0.2562488615512848, + -0.046804703772068024, + -0.08796676248311996, + -0.06097426265478134 + ], + "acc_eval": 0.2333984375, + "loss_eval": 8893.0791015625, + "epoch": 49 + }, + { + "hidden_norms": [ + 7200.81201171875, + 4906775.0, + 4972128.5, + 5401281.5, + 5552169.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015469590434804559, + 0.0007871663547120988, + 0.0007869182154536247, + 0.0007867610547691584, + 0.0007867159438319504 + ], + "gamma_dfa": 0.016506953164935112, + "gamma_dfa_per_layer": [ + 0.29171258211135864, + -0.05020506680011749, + -0.09062528610229492, + -0.08485441654920578 + ], + "acc_eval": 0.2197265625, + "loss_eval": 10566.345703125, + "epoch": 50 + }, + { + "hidden_norms": [ + 7296.0625, + 5134799.0, + 5202023.5, + 5643737.5, + 5799758.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018195129232481122, + 0.0007844618521630764, + 0.0007844566716812551, + 0.000784536823630333, + 0.000784553587436676 + ], + "gamma_dfa": 0.019483929499983788, + "gamma_dfa_per_layer": [ + 0.29106640815734863, + -0.05478575825691223, + -0.07833737879991531, + -0.08000755310058594 + ], + "acc_eval": 0.1650390625, + "loss_eval": 9639.78125, + "epoch": 51 + }, + { + "hidden_norms": [ + 7403.17138671875, + 5361356.5, + 5429682.0, + 5879784.5, + 6039432.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002603700151666999, + 0.000755469489376992, + 0.0007554262992925942, + 0.0007555284537374973, + 0.0007555308402515948 + ], + "gamma_dfa": 0.05388479772955179, + "gamma_dfa_per_layer": [ + 0.3746236264705658, + -0.060121551156044006, + -0.06174459308385849, + -0.03721829131245613 + ], + "acc_eval": 0.1494140625, + "loss_eval": 12397.41015625, + "epoch": 52 + }, + { + "hidden_norms": [ + 7488.30126953125, + 5582023.0, + 5651748.5, + 6110668.5, + 6273320.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00202713580802083, + 0.0007801816100254655, + 0.000780182599555701, + 0.0007801790488883853, + 0.0007801697356626391 + ], + "gamma_dfa": 0.01045304723083973, + "gamma_dfa_per_layer": [ + 0.25068047642707825, + -0.06100655347108841, + -0.0828605443239212, + -0.06500118970870972 + ], + "acc_eval": 0.2138671875, + "loss_eval": 18765.955078125, + "epoch": 53 + }, + { + "hidden_norms": [ + 7561.47265625, + 5795100.5, + 5866105.0, + 6334896.0, + 6501444.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017575331730768085, + 0.0007978819194249809, + 0.0007978450739756227, + 0.000798230292275548, + 0.0007982761017046869 + ], + "gamma_dfa": 0.011411387473344803, + "gamma_dfa_per_layer": [ + 0.29157841205596924, + -0.05369853973388672, + -0.09859319031238556, + -0.09364113211631775 + ], + "acc_eval": 0.1875, + "loss_eval": 10589.0087890625, + "epoch": 54 + }, + { + "hidden_norms": [ + 7636.35595703125, + 6016687.0, + 6089686.0, + 6570658.5, + 6741688.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001416882500052452, + 0.0007854877039790154, + 0.0007851187838241458, + 0.0007847094675526023, + 0.0007846617372706532 + ], + "gamma_dfa": 0.004635758697986603, + "gamma_dfa_per_layer": [ + 0.2832094430923462, + -0.06018421798944473, + -0.10714054107666016, + -0.09734164923429489 + ], + "acc_eval": 0.1884765625, + "loss_eval": 11045.0107421875, + "epoch": 55 + }, + { + "hidden_norms": [ + 7700.8466796875, + 6215443.5, + 6289647.5, + 6780492.0, + 6955139.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017022350803017616, + 0.0007623002748005092, + 0.000762303126975894, + 0.000762506271712482, + 0.0007625941070728004 + ], + "gamma_dfa": 0.026831449940800667, + "gamma_dfa_per_layer": [ + 0.339847594499588, + -0.0706903263926506, + -0.0816052109003067, + -0.08022625744342804 + ], + "acc_eval": 0.154296875, + "loss_eval": 9215.373046875, + "epoch": 56 + }, + { + "hidden_norms": [ + 7773.85986328125, + 6413204.5, + 6488502.5, + 6988337.0, + 7166683.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013730988139286637, + 0.0007787180948071182, + 0.0007787116337567568, + 0.0007787745562382042, + 0.0007787866634316742 + ], + "gamma_dfa": 0.013194277882575989, + "gamma_dfa_per_layer": [ + 0.30715805292129517, + -0.0632064938545227, + -0.09261326491832733, + -0.09856118261814117 + ], + "acc_eval": 0.2236328125, + "loss_eval": 6176.3076171875, + "epoch": 57 + }, + { + "hidden_norms": [ + 7820.23388671875, + 6598801.0, + 6675650.0, + 7184845.0, + 7367520.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015506811905652285, + 0.000799653644207865, + 0.0007990750018507242, + 0.0007989082369022071, + 0.0007991326274350286 + ], + "gamma_dfa": 0.00773581862449646, + "gamma_dfa_per_layer": [ + 0.28355157375335693, + -0.054453425109386444, + -0.11499008536338806, + -0.08316478878259659 + ], + "acc_eval": 0.205078125, + "loss_eval": 7889.31005859375, + "epoch": 58 + }, + { + "hidden_norms": [ + 7864.2060546875, + 6797904.5, + 6876033.0, + 7392718.0, + 7578431.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020978215616196394, + 0.0007834822754375637, + 0.0007832171395421028, + 0.0007829645182937384, + 0.0007829380920156837 + ], + "gamma_dfa": 0.033629802986979485, + "gamma_dfa_per_layer": [ + 0.34407293796539307, + -0.05567466467618942, + -0.08536086976528168, + -0.06851819157600403 + ], + "acc_eval": 0.15625, + "loss_eval": 14391.9736328125, + "epoch": 59 + }, + { + "hidden_norms": [ + 7871.78173828125, + 7003051.0, + 7083124.0, + 7611188.0, + 7801170.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012560655595734715, + 0.0007599582313559949, + 0.0007599598611705005, + 0.0007601079414598644, + 0.0007601887919008732 + ], + "gamma_dfa": 0.004498079419136047, + "gamma_dfa_per_layer": [ + 0.32327917218208313, + -0.07260935008525848, + -0.10525670647621155, + -0.1274207979440689 + ], + "acc_eval": 0.1572265625, + "loss_eval": 7188.275390625, + "epoch": 60 + }, + { + "hidden_norms": [ + 7934.14794921875, + 7210797.0, + 7292245.5, + 7829288.0, + 8023057.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001343236886896193, + 0.0007599524687975645, + 0.0007598291267640889, + 0.0007597675430588424, + 0.0007598883821628988 + ], + "gamma_dfa": 0.02613817434757948, + "gamma_dfa_per_layer": [ + 0.3003483712673187, + -0.0427340604364872, + -0.09165668487548828, + -0.06140492856502533 + ], + "acc_eval": 0.259765625, + "loss_eval": 7055.94677734375, + "epoch": 61 + }, + { + "hidden_norms": [ + 7964.50244140625, + 7416797.0, + 7500505.0, + 8048676.5, + 8247824.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015083092730492353, + 0.0007851184927858412, + 0.0007850866531953216, + 0.0007850754773244262, + 0.0007851301343180239 + ], + "gamma_dfa": 0.027105171233415604, + "gamma_dfa_per_layer": [ + 0.37000784277915955, + -0.05895276367664337, + -0.10036876797676086, + -0.1022656261920929 + ], + "acc_eval": 0.166015625, + "loss_eval": 7052.08203125, + "epoch": 62 + }, + { + "hidden_norms": [ + 8006.1318359375, + 7588913.0, + 7673353.5, + 8229041.0, + 8431689.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014928504824638367, + 0.0007839660393074155, + 0.000783930707257241, + 0.0007839277386665344, + 0.0007839910103939474 + ], + "gamma_dfa": 0.018935419619083405, + "gamma_dfa_per_layer": [ + 0.3158775568008423, + -0.051478639245033264, + -0.09881415218114853, + -0.08984308689832687 + ], + "acc_eval": 0.2119140625, + "loss_eval": 6266.041015625, + "epoch": 63 + }, + { + "hidden_norms": [ + 8030.2109375, + 7754257.5, + 7839832.5, + 8400781.0, + 8605522.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012633835431188345, + 0.0007809567032381892, + 0.0007807457586750388, + 0.0007805972127243876, + 0.0007805809145793319 + ], + "gamma_dfa": 0.009956683963537216, + "gamma_dfa_per_layer": [ + 0.30735114216804504, + -0.06991781294345856, + -0.09387198090553284, + -0.10373461246490479 + ], + "acc_eval": 0.1806640625, + "loss_eval": 8467.8125, + "epoch": 64 + }, + { + "hidden_norms": [ + 8048.080078125, + 7913574.5, + 8000306.0, + 8567918.0, + 8775169.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001400441862642765, + 0.0007796542486175895, + 0.0007795418496243656, + 0.0007795065175741911, + 0.0007797059370204806 + ], + "gamma_dfa": 0.008816102519631386, + "gamma_dfa_per_layer": [ + 0.28880423307418823, + -0.05614739656448364, + -0.11088694632053375, + -0.0865054801106453 + ], + "acc_eval": 0.203125, + "loss_eval": 9558.021484375, + "epoch": 65 + }, + { + "hidden_norms": [ + 8067.34375, + 8070731.5, + 8158800.0, + 8733572.0, + 8943043.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014346289681270719, + 0.000756031135097146, + 0.0007560329977422953, + 0.0007561623933725059, + 0.0007562324753962457 + ], + "gamma_dfa": 0.009170351549983025, + "gamma_dfa_per_layer": [ + 0.3515056073665619, + -0.0781104564666748, + -0.10490105301141739, + -0.1318126916885376 + ], + "acc_eval": 0.1103515625, + "loss_eval": 11967.486328125, + "epoch": 66 + }, + { + "hidden_norms": [ + 8073.40283203125, + 8227977.0, + 8317204.5, + 8898513.0, + 9110756.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015745362034067512, + 0.0007811843534000218, + 0.000781158625613898, + 0.0007811560644768178, + 0.0007812076364643872 + ], + "gamma_dfa": 0.011113166809082031, + "gamma_dfa_per_layer": [ + 0.30191734433174133, + -0.05505914241075516, + -0.10382715612649918, + -0.09857837855815887 + ], + "acc_eval": 0.177734375, + "loss_eval": 7797.017578125, + "epoch": 67 + }, + { + "hidden_norms": [ + 8071.63623046875, + 8375112.0, + 8465576.0, + 9052592.0, + 9267093.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002133303554728627, + 0.0007824470521882176, + 0.0007822668994776905, + 0.0007822004845365882, + 0.0007824745844118297 + ], + "gamma_dfa": 0.03663862869143486, + "gamma_dfa_per_layer": [ + 0.34291785955429077, + -0.036236945539712906, + -0.10749906301498413, + -0.052627336233854294 + ], + "acc_eval": 0.1396484375, + "loss_eval": 11433.0302734375, + "epoch": 68 + }, + { + "hidden_norms": [ + 8084.59130859375, + 8523176.0, + 8614498.0, + 9207429.0, + 9424164.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001537870615720749, + 0.0007688916521146894, + 0.0007688923506066203, + 0.0007689034100621939, + 0.0007689160411246121 + ], + "gamma_dfa": 0.020611698739230633, + "gamma_dfa_per_layer": [ + 0.3258458971977234, + -0.053132835775613785, + -0.10754033923149109, + -0.08272592723369598 + ], + "acc_eval": 0.1787109375, + "loss_eval": 6151.634765625, + "epoch": 69 + }, + { + "hidden_norms": [ + 8098.82373046875, + 8648680.0, + 8741121.0, + 9338018.0, + 9556207.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014389777788892388, + 0.0007975181215442717, + 0.0007967942510731518, + 0.0007966712000779808, + 0.0007968792924657464 + ], + "gamma_dfa": 0.009284427389502525, + "gamma_dfa_per_layer": [ + 0.29391974210739136, + -0.058484748005867004, + -0.11177978664636612, + -0.08651749789714813 + ], + "acc_eval": 0.18359375, + "loss_eval": 5277.328125, + "epoch": 70 + }, + { + "hidden_norms": [ + 8113.7255859375, + 8773553.0, + 8866719.0, + 9469018.0, + 9689706.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00145814404822886, + 0.0007955037872307003, + 0.0007954062311910093, + 0.0007954093161970377, + 0.0007956796325743198 + ], + "gamma_dfa": 0.01389121450483799, + "gamma_dfa_per_layer": [ + 0.28217679262161255, + -0.058154717087745667, + -0.08273636549711227, + -0.08572085201740265 + ], + "acc_eval": 0.1923828125, + "loss_eval": 10207.12109375, + "epoch": 71 + }, + { + "hidden_norms": [ + 8063.9951171875, + 8889169.0, + 8984089.0, + 9593494.0, + 9817277.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011409161379560828, + 0.0007544065010733902, + 0.0007542934035882354, + 0.000754217617213726, + 0.0007543462561443448 + ], + "gamma_dfa": 0.018794666975736618, + "gamma_dfa_per_layer": [ + 0.2941493093967438, + -0.0533231720328331, + -0.09251905977725983, + -0.07312840968370438 + ], + "acc_eval": 0.2626953125, + "loss_eval": 4281.3994140625, + "epoch": 72 + }, + { + "hidden_norms": [ + 8021.80126953125, + 9019768.0, + 9115790.0, + 9730846.0, + 9956825.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012580875772982836, + 0.0007680498529225588, + 0.0007680428680032492, + 0.0007680479320697486, + 0.0007680551498197019 + ], + "gamma_dfa": 0.027317012660205364, + "gamma_dfa_per_layer": [ + 0.3265392780303955, + -0.04611017927527428, + -0.09342358261346817, + -0.0777374655008316 + ], + "acc_eval": 0.2275390625, + "loss_eval": 4907.6142578125, + "epoch": 73 + }, + { + "hidden_norms": [ + 7995.38916015625, + 9118244.0, + 9214531.0, + 9832139.0, + 10058956.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012337823864072561, + 0.0007691435748711228, + 0.000768946367315948, + 0.000768885191064328, + 0.0007689236663281918 + ], + "gamma_dfa": 0.012230871245265007, + "gamma_dfa_per_layer": [ + 0.2935040593147278, + -0.06186644732952118, + -0.09978199750185013, + -0.08293212950229645 + ], + "acc_eval": 0.2001953125, + "loss_eval": 7199.5888671875, + "epoch": 74 + }, + { + "hidden_norms": [ + 7966.3759765625, + 9213122.0, + 9310022.0, + 9931662.0, + 10160365.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011302486527711153, + 0.0007655700901523232, + 0.0007655754452571273, + 0.0007655742228962481, + 0.0007655934314243495 + ], + "gamma_dfa": 0.01679898425936699, + "gamma_dfa_per_layer": [ + 0.3025580048561096, + -0.05692540109157562, + -0.10290184617042542, + -0.07553482055664062 + ], + "acc_eval": 0.2490234375, + "loss_eval": 2667.806640625, + "epoch": 75 + }, + { + "hidden_norms": [ + 7937.92041015625, + 9292608.0, + 9390243.0, + 10015125.0, + 10244868.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011147550540044904, + 0.0007753095123916864, + 0.0007750216755084693, + 0.000774735352024436, + 0.0007747214986011386 + ], + "gamma_dfa": 0.027967805042862892, + "gamma_dfa_per_layer": [ + 0.3572651743888855, + -0.05705829709768295, + -0.09071685373783112, + -0.09761880338191986 + ], + "acc_eval": 0.1923828125, + "loss_eval": 3299.91259765625, + "epoch": 76 + }, + { + "hidden_norms": [ + 7904.56689453125, + 9393010.0, + 9491687.0, + 10122118.0, + 10354408.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00107352074701339, + 0.0007645431905984879, + 0.0007645484292879701, + 0.0007645472651347518, + 0.0007645685109309852 + ], + "gamma_dfa": 0.02625838667154312, + "gamma_dfa_per_layer": [ + 0.3598015606403351, + -0.06442467868328094, + -0.09077714383602142, + -0.09956619143486023 + ], + "acc_eval": 0.2119140625, + "loss_eval": 2758.64599609375, + "epoch": 77 + }, + { + "hidden_norms": [ + 7855.07861328125, + 9500690.0, + 9600497.0, + 10235757.0, + 10469660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001235201139934361, + 0.0007838172605261207, + 0.000783789437264204, + 0.0007840599282644689, + 0.00078408676199615 + ], + "gamma_dfa": 0.02602401003241539, + "gamma_dfa_per_layer": [ + 0.35960710048675537, + -0.06299363076686859, + -0.10128454864025116, + -0.09123288094997406 + ], + "acc_eval": 0.1689453125, + "loss_eval": 4279.3154296875, + "epoch": 78 + }, + { + "hidden_norms": [ + 7826.134765625, + 9581674.0, + 9682195.0, + 10320423.0, + 10555402.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010469084372743964, + 0.0007737708510830998, + 0.0007735842373222113, + 0.0007734137470833957, + 0.0007734144455753267 + ], + "gamma_dfa": 0.024147922173142433, + "gamma_dfa_per_layer": [ + 0.37674999237060547, + -0.07557321339845657, + -0.09047992527484894, + -0.11410516500473022 + ], + "acc_eval": 0.1669921875, + "loss_eval": 3201.240966796875, + "epoch": 79 + }, + { + "hidden_norms": [ + 7779.2138671875, + 9660604.0, + 9761859.0, + 10404086.0, + 10640750.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010143390391021967, + 0.0007633482455275953, + 0.0007633481291122735, + 0.0007633698405697942, + 0.0007633839850313962 + ], + "gamma_dfa": 0.019840596243739128, + "gamma_dfa_per_layer": [ + 0.30444687604904175, + -0.049144186079502106, + -0.09650193899869919, + -0.07943836599588394 + ], + "acc_eval": 0.2763671875, + "loss_eval": 1991.417236328125, + "epoch": 80 + }, + { + "hidden_norms": [ + 7760.08642578125, + 9716882.0, + 9818513.0, + 10462903.0, + 10700433.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00105896289460361, + 0.0007729134522378445, + 0.0007727605989202857, + 0.0007726037292741239, + 0.000772611063439399 + ], + "gamma_dfa": 0.026730000041425228, + "gamma_dfa_per_layer": [ + 0.34768593311309814, + -0.056363869458436966, + -0.09562714397907257, + -0.0887749195098877 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2112.26025390625, + "epoch": 81 + }, + { + "hidden_norms": [ + 7743.93798828125, + 9786243.0, + 9888395.0, + 10535762.0, + 10774483.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010133162140846252, + 0.0007726953481324017, + 0.0007724745664745569, + 0.0007722667651250958, + 0.0007722647860646248 + ], + "gamma_dfa": 0.019241390749812126, + "gamma_dfa_per_layer": [ + 0.3473237156867981, + -0.06556949764490128, + -0.10282130539417267, + -0.10196734964847565 + ], + "acc_eval": 0.193359375, + "loss_eval": 2962.46826171875, + "epoch": 82 + }, + { + "hidden_norms": [ + 7708.34033203125, + 9842047.0, + 9944650.0, + 10594529.0, + 10834219.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000999346375465393, + 0.0007619770476594567, + 0.0007619837997481227, + 0.0007619837415404618, + 0.0007620092947036028 + ], + "gamma_dfa": 0.019368495792150497, + "gamma_dfa_per_layer": [ + 0.3106932044029236, + -0.057876452803611755, + -0.09636038541793823, + -0.0789823830127716 + ], + "acc_eval": 0.2607421875, + "loss_eval": 1792.6400146484375, + "epoch": 83 + }, + { + "hidden_norms": [ + 7673.24560546875, + 9901470.0, + 10004649.0, + 10656950.0, + 10898699.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009565355721861124, + 0.0007485878886654973, + 0.0007484929519705474, + 0.000748424616176635, + 0.0007485424866899848 + ], + "gamma_dfa": 0.01748405210673809, + "gamma_dfa_per_layer": [ + 0.2931858003139496, + -0.05277211219072342, + -0.09270339459180832, + -0.07777408510446548 + ], + "acc_eval": 0.29296875, + "loss_eval": 974.1173095703125, + "epoch": 84 + }, + { + "hidden_norms": [ + 7628.22412109375, + 9951868.0, + 10055369.0, + 10709207.0, + 10951317.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000980330049060285, + 0.0007466387469321489, + 0.0007466417155228555, + 0.0007467885152436793, + 0.0007468488765880466 + ], + "gamma_dfa": 0.019473757594823837, + "gamma_dfa_per_layer": [ + 0.29309791326522827, + -0.05341349542140961, + -0.08986704051494598, + -0.07192234694957733 + ], + "acc_eval": 0.27734375, + "loss_eval": 1743.6519775390625, + "epoch": 85 + }, + { + "hidden_norms": [ + 7586.08837890625, + 9992418.0, + 10096238.0, + 10751557.0, + 10993641.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009816273814067245, + 0.0007609970052726567, + 0.000761001487262547, + 0.0007610011962242424, + 0.0007610262255184352 + ], + "gamma_dfa": 0.017493372783064842, + "gamma_dfa_per_layer": [ + 0.307644248008728, + -0.054675400257110596, + -0.09402725845575333, + -0.08896809816360474 + ], + "acc_eval": 0.2783203125, + "loss_eval": 986.1089477539062, + "epoch": 86 + }, + { + "hidden_norms": [ + 7546.07666015625, + 10019561.0, + 10123471.0, + 10779392.0, + 11021634.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010106659028679132, + 0.0007606986328028142, + 0.0007606985163874924, + 0.0007607255247421563, + 0.0007607414736412466 + ], + "gamma_dfa": 0.0189383989199996, + "gamma_dfa_per_layer": [ + 0.3057447671890259, + -0.05296015366911888, + -0.09528908133506775, + -0.08174193650484085 + ], + "acc_eval": 0.2412109375, + "loss_eval": 1453.539306640625, + "epoch": 87 + }, + { + "hidden_norms": [ + 7507.373046875, + 10034866.0, + 10138899.0, + 10794880.0, + 11037002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009441400761716068, + 0.0007457168539986014, + 0.0007457205792888999, + 0.0007458969485014677, + 0.0007459585904143751 + ], + "gamma_dfa": 0.016358308494091034, + "gamma_dfa_per_layer": [ + 0.29192131757736206, + -0.054730333387851715, + -0.08949868381023407, + -0.08225906640291214 + ], + "acc_eval": 0.2939453125, + "loss_eval": 889.3756103515625, + "epoch": 88 + }, + { + "hidden_norms": [ + 7475.10595703125, + 10059038.0, + 10163330.0, + 10820810.0, + 11063516.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009275015909224749, + 0.0007406340446323156, + 0.0007405761862173676, + 0.0007405940559692681, + 0.0007405842188745737 + ], + "gamma_dfa": 0.019343840889632702, + "gamma_dfa_per_layer": [ + 0.2714617848396301, + -0.049602191895246506, + -0.07989576458930969, + -0.06458846479654312 + ], + "acc_eval": 0.322265625, + "loss_eval": 778.108642578125, + "epoch": 89 + }, + { + "hidden_norms": [ + 7444.8466796875, + 10064810.0, + 10169219.0, + 10827134.0, + 11070129.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009403944713994861, + 0.000745263765566051, + 0.0007452677236869931, + 0.0007454471196979284, + 0.0007455073646269739 + ], + "gamma_dfa": 0.01310044713318348, + "gamma_dfa_per_layer": [ + 0.28572195768356323, + -0.054389551281929016, + -0.09277918189764023, + -0.08615143597126007 + ], + "acc_eval": 0.26953125, + "loss_eval": 932.53662109375, + "epoch": 90 + }, + { + "hidden_norms": [ + 7414.4970703125, + 10075394.0, + 10179775.0, + 10837778.0, + 11080979.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009539846796542406, + 0.0007622878183610737, + 0.0007622832781635225, + 0.0007622758857905865, + 0.0007622810662724078 + ], + "gamma_dfa": 0.02442830428481102, + "gamma_dfa_per_layer": [ + 0.34633398056030273, + -0.059510812163352966, + -0.09629844129085541, + -0.09281150996685028 + ], + "acc_eval": 0.228515625, + "loss_eval": 1020.4122924804688, + "epoch": 91 + }, + { + "hidden_norms": [ + 7385.740234375, + 10098198.0, + 10202575.0, + 10860396.0, + 11103300.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009258585050702095, + 0.0007462432840839028, + 0.0007461663917638361, + 0.000746095203794539, + 0.0007462148205377162 + ], + "gamma_dfa": 0.021881024353206158, + "gamma_dfa_per_layer": [ + 0.3117921054363251, + -0.0562119297683239, + -0.0811537504196167, + -0.08690232783555984 + ], + "acc_eval": 0.2783203125, + "loss_eval": 812.965576171875, + "epoch": 92 + }, + { + "hidden_norms": [ + 7372.93115234375, + 10112263.0, + 10216603.0, + 10874068.0, + 11116538.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009158457978628576, + 0.000744756544008851, + 0.0007447608513757586, + 0.0007449553813785315, + 0.0007450156263075769 + ], + "gamma_dfa": 0.018241400830447674, + "gamma_dfa_per_layer": [ + 0.27702248096466064, + -0.048618000000715256, + -0.0829005166888237, + -0.072538360953331 + ], + "acc_eval": 0.330078125, + "loss_eval": 675.6625366210938, + "epoch": 93 + }, + { + "hidden_norms": [ + 7363.2099609375, + 10119183.0, + 10223550.0, + 10881119.0, + 11123569.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009229940478689969, + 0.0007447171374224126, + 0.000744720280636102, + 0.0007448522374033928, + 0.000744906603358686 + ], + "gamma_dfa": 0.016729017719626427, + "gamma_dfa_per_layer": [ + 0.27939361333847046, + -0.048901431262493134, + -0.08870212733745575, + -0.07487398386001587 + ], + "acc_eval": 0.3251953125, + "loss_eval": 708.3804931640625, + "epoch": 94 + }, + { + "hidden_norms": [ + 7355.3544921875, + 10123197.0, + 10227558.0, + 10885026.0, + 11127411.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009278868092224002, + 0.0007445889641530812, + 0.0007445933879353106, + 0.0007447681855410337, + 0.0007448261021636426 + ], + "gamma_dfa": 0.014646172523498535, + "gamma_dfa_per_layer": [ + 0.28425437211990356, + -0.053754955530166626, + -0.08852015435695648, + -0.08339457213878632 + ], + "acc_eval": 0.310546875, + "loss_eval": 688.0819091796875, + "epoch": 95 + }, + { + "hidden_norms": [ + 7349.30078125, + 10126695.0, + 10231071.0, + 10888593.0, + 11130985.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000914200150873512, + 0.0007393965497612953, + 0.000739329494535923, + 0.0007393491105176508, + 0.0007393329287879169 + ], + "gamma_dfa": 0.01913625281304121, + "gamma_dfa_per_layer": [ + 0.26301705837249756, + -0.04846196621656418, + -0.07772514969110489, + -0.06028493121266365 + ], + "acc_eval": 0.3203125, + "loss_eval": 697.3836669921875, + "epoch": 96 + }, + { + "hidden_norms": [ + 7345.333984375, + 10127832.0, + 10232199.0, + 10889673.0, + 11132020.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009217644692398608, + 0.0007456630119122565, + 0.0007455685408785939, + 0.0007454968290403485, + 0.0007456148159690201 + ], + "gamma_dfa": 0.017519758082926273, + "gamma_dfa_per_layer": [ + 0.29056763648986816, + -0.05349243804812431, + -0.08799343556165695, + -0.0790027305483818 + ], + "acc_eval": 0.30859375, + "loss_eval": 661.5548095703125, + "epoch": 97 + }, + { + "hidden_norms": [ + 7343.10888671875, + 10128861.0, + 10233227.0, + 10890713.0, + 11133060.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009042566525749862, + 0.0007393184932880104, + 0.0007392505649477243, + 0.0007392706465907395, + 0.0007392524858005345 + ], + "gamma_dfa": 0.018206479027867317, + "gamma_dfa_per_layer": [ + 0.2680240869522095, + -0.047486238181591034, + -0.08014586567878723, + -0.06756606698036194 + ], + "acc_eval": 0.3388671875, + "loss_eval": 636.5595703125, + "epoch": 98 + }, + { + "hidden_norms": [ + 7342.0625, + 10129300.0, + 10233666.0, + 10891137.0, + 11133475.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009002314181998372, + 0.0007393373525701463, + 0.0007392485276795924, + 0.0007392755360342562, + 0.0007392438710667193 + ], + "gamma_dfa": 0.01726893801242113, + "gamma_dfa_per_layer": [ + 0.2736765742301941, + -0.05038469657301903, + -0.0817006528377533, + -0.07251547276973724 + ], + "acc_eval": 0.3330078125, + "loss_eval": 611.882080078125, + "epoch": 99 + }, + { + "hidden_norms": [ + 7341.77294921875, + 10129401.0, + 10233766.0, + 10891235.0, + 11133570.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009032402304001153, + 0.0007393273408524692, + 0.0007392435800284147, + 0.0007392680854536593, + 0.0007392411935143173 + ], + "gamma_dfa": 0.01641188934445381, + "gamma_dfa_per_layer": [ + 0.2728629410266876, + -0.05080822855234146, + -0.08297968655824661, + -0.0734274685382843 + ], + "acc_eval": 0.33203125, + "loss_eval": 625.6834106445312, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s456.json b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json new file mode 100644 index 0000000..f490ffc --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005607507191598415, + 0.0005558764678426087, + 0.0005541853606700897, + 0.0005498801474459469, + 0.0005458085797727108 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.091796875, + "loss_eval": 2.3707523345947266, + "epoch": 0 + }, + { + "hidden_norms": [ + 40.06809616088867, + 37.16851043701172, + 35.97419738769531, + 34.98802185058594, + 34.09989547729492 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013246900925878435, + 0.00013836311700288206, + 0.00014998784172348678, + 0.00017555677914060652, + 0.0002279145992361009 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4365234375, + "loss_eval": 1.5941123962402344, + "epoch": 1 + }, + { + "hidden_norms": [ + 51.32597732543945, + 46.865997314453125, + 44.336944580078125, + 42.399295806884766, + 41.083709716796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010603138071019202, + 0.00011028712469851598, + 0.00011670063395285979, + 0.00013331198715604842, + 0.00016258291725534946 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4736328125, + "loss_eval": 1.4793150424957275, + "epoch": 2 + }, + { + "hidden_norms": [ + 62.084197998046875, + 56.17497253417969, + 52.24001693725586, + 48.81613540649414, + 45.96797561645508 + ], + "bp_grad_per_sample_l2_med": [ + 9.958917507901788e-05, + 0.00010542560630710796, + 0.00011132164945593104, + 0.00012339121894910932, + 0.00014191119407769293 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.48046875, + "loss_eval": 1.4157963991165161, + "epoch": 3 + }, + { + "hidden_norms": [ + 70.11115264892578, + 62.7204704284668, + 57.0128059387207, + 52.67961883544922, + 49.0619010925293 + ], + "bp_grad_per_sample_l2_med": [ + 9.119982860283926e-05, + 9.68000604189001e-05, + 0.0001028164042509161, + 0.0001113277321564965, + 0.00012708066788036376 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.3824131488800049, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.96520233154297, + 68.33187866210938, + 62.02028274536133, + 56.785953521728516, + 52.50190734863281 + ], + "bp_grad_per_sample_l2_med": [ + 9.251978190150112e-05, + 9.91317501757294e-05, + 0.00010523655510041863, + 0.00011500742402859032, + 0.00012610112025868148 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.49609375, + "loss_eval": 1.4219003915786743, + "epoch": 5 + }, + { + "hidden_norms": [ + 84.35594940185547, + 73.65497589111328, + 65.76171875, + 59.78555679321289, + 54.72732925415039 + ], + "bp_grad_per_sample_l2_med": [ + 8.53061064844951e-05, + 9.119947208091617e-05, + 9.546471119392663e-05, + 0.00010272912186337635, + 0.00011094262299593538 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5107421875, + "loss_eval": 1.3764042854309082, + "epoch": 6 + }, + { + "hidden_norms": [ + 90.34719848632812, + 78.86559295654297, + 69.58448028564453, + 62.62751388549805, + 56.49700164794922 + ], + "bp_grad_per_sample_l2_med": [ + 8.279601024696603e-05, + 8.869311568560079e-05, + 9.525373752694577e-05, + 0.00010276824468746781, + 0.00011047293082810938 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.3063517808914185, + "epoch": 7 + }, + { + "hidden_norms": [ + 94.70899200439453, + 82.14017486572266, + 72.3757553100586, + 63.97325134277344, + 57.261043548583984 + ], + "bp_grad_per_sample_l2_med": [ + 8.42147201183252e-05, + 8.977072138804942e-05, + 9.571140253683552e-05, + 0.00010196219227509573, + 0.00010500354983378202 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.3536221981048584, + "epoch": 8 + }, + { + "hidden_norms": [ + 101.69925689697266, + 87.86920928955078, + 77.13504791259766, + 68.15769958496094, + 60.63106918334961 + ], + "bp_grad_per_sample_l2_med": [ + 8.040699322009459e-05, + 8.682452607899904e-05, + 9.194648009724915e-05, + 9.875267278403044e-05, + 0.00010358950385125354 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.517578125, + "loss_eval": 1.3398748636245728, + "epoch": 9 + }, + { + "hidden_norms": [ + 106.84738159179688, + 92.9166259765625, + 81.7030029296875, + 71.8150863647461, + 63.29521179199219 + ], + "bp_grad_per_sample_l2_med": [ + 7.807361544109881e-05, + 8.290779078379273e-05, + 8.751150744501501e-05, + 9.41800099099055e-05, + 9.622493234928697e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5595703125, + "loss_eval": 1.3021488189697266, + "epoch": 10 + }, + { + "hidden_norms": [ + 110.62977600097656, + 96.08146667480469, + 83.02938842773438, + 71.82244873046875, + 62.47097396850586 + ], + "bp_grad_per_sample_l2_med": [ + 7.582613034173846e-05, + 8.177754352800548e-05, + 8.888287266017869e-05, + 9.501135355094448e-05, + 9.754132042871788e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53125, + "loss_eval": 1.2963578701019287, + "epoch": 11 + }, + { + "hidden_norms": [ + 115.87433624267578, + 99.99412536621094, + 86.81661987304688, + 75.194580078125, + 65.24598693847656 + ], + "bp_grad_per_sample_l2_med": [ + 7.453945727320388e-05, + 7.999759691301733e-05, + 8.587146294303238e-05, + 9.281275561079383e-05, + 9.684430551715195e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.537109375, + "loss_eval": 1.300926685333252, + "epoch": 12 + }, + { + "hidden_norms": [ + 115.8588638305664, + 100.0324478149414, + 87.23123931884766, + 75.2608871459961, + 64.53407287597656 + ], + "bp_grad_per_sample_l2_med": [ + 7.783657201798633e-05, + 8.2304140960332e-05, + 8.792509470367804e-05, + 9.308305016020313e-05, + 9.498461440671235e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5302734375, + "loss_eval": 1.2952370643615723, + "epoch": 13 + }, + { + "hidden_norms": [ + 121.24994659423828, + 103.9144515991211, + 88.99864959716797, + 75.50836944580078, + 64.28103637695312 + ], + "bp_grad_per_sample_l2_med": [ + 7.956428453326225e-05, + 8.667269139550626e-05, + 9.291838068747893e-05, + 9.890568617265671e-05, + 0.00010031831334345043 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.537109375, + "loss_eval": 1.3034818172454834, + "epoch": 14 + }, + { + "hidden_norms": [ + 124.64612579345703, + 107.64379119873047, + 92.03299713134766, + 77.67626190185547, + 66.19109344482422 + ], + "bp_grad_per_sample_l2_med": [ + 7.466476381523535e-05, + 8.086472371360287e-05, + 8.857141801854596e-05, + 9.320858225692064e-05, + 9.685206168796867e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.2701925039291382, + "epoch": 15 + }, + { + "hidden_norms": [ + 128.4908905029297, + 110.93827819824219, + 95.34327697753906, + 80.90787506103516, + 68.56732940673828 + ], + "bp_grad_per_sample_l2_med": [ + 7.461471977876499e-05, + 8.18013577372767e-05, + 8.659388549858704e-05, + 9.226851398125291e-05, + 9.443429007660598e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5537109375, + "loss_eval": 1.2619553804397583, + "epoch": 16 + }, + { + "hidden_norms": [ + 130.65846252441406, + 112.31464385986328, + 95.85350036621094, + 79.80601501464844, + 67.30303192138672 + ], + "bp_grad_per_sample_l2_med": [ + 7.368716615019366e-05, + 8.01649657660164e-05, + 8.653382974443957e-05, + 9.32966941036284e-05, + 9.312365727964789e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5576171875, + "loss_eval": 1.2436624765396118, + "epoch": 17 + }, + { + "hidden_norms": [ + 133.13165283203125, + 114.61791229248047, + 97.15895080566406, + 81.40515899658203, + 69.13287353515625 + ], + "bp_grad_per_sample_l2_med": [ + 7.137899228837341e-05, + 7.771244418108836e-05, + 8.332561264978722e-05, + 8.920324762584642e-05, + 8.9491848484613e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.56640625, + "loss_eval": 1.239585518836975, + "epoch": 18 + }, + { + "hidden_norms": [ + 136.59140014648438, + 117.42953491210938, + 99.51315307617188, + 83.76544189453125, + 69.16895294189453 + ], + "bp_grad_per_sample_l2_med": [ + 7.198385719675571e-05, + 7.928090053610504e-05, + 8.52016091812402e-05, + 9.1185538622085e-05, + 9.257275087293237e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5673828125, + "loss_eval": 1.2780827283859253, + "epoch": 19 + }, + { + "hidden_norms": [ + 139.33346557617188, + 119.61570739746094, + 102.05357360839844, + 85.16582489013672, + 70.09222412109375 + ], + "bp_grad_per_sample_l2_med": [ + 7.267932232934982e-05, + 7.949839346110821e-05, + 8.610116492491215e-05, + 9.125673386733979e-05, + 9.256677003577352e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5419921875, + "loss_eval": 1.2823748588562012, + "epoch": 20 + }, + { + "hidden_norms": [ + 141.82034301757812, + 122.27132415771484, + 103.36873626708984, + 86.49518585205078, + 71.40383911132812 + ], + "bp_grad_per_sample_l2_med": [ + 7.251821807585657e-05, + 7.807672955095768e-05, + 8.464990969514474e-05, + 8.788360719336197e-05, + 8.839634392643347e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.2162373065948486, + "epoch": 21 + }, + { + "hidden_norms": [ + 144.1250762939453, + 123.32146453857422, + 105.33419036865234, + 87.95057678222656, + 71.54405975341797 + ], + "bp_grad_per_sample_l2_med": [ + 7.141266542021185e-05, + 7.827960507711396e-05, + 8.527522732038051e-05, + 9.162349306279793e-05, + 8.910013275453821e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5712890625, + "loss_eval": 1.2267348766326904, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.35816955566406, + 123.92304229736328, + 106.45323944091797, + 89.38124084472656, + 72.80756378173828 + ], + "bp_grad_per_sample_l2_med": [ + 6.914530968060717e-05, + 7.74021100369282e-05, + 8.25833558337763e-05, + 8.843685645842925e-05, + 8.765731763560325e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2464958429336548, + "epoch": 23 + }, + { + "hidden_norms": [ + 146.9630126953125, + 126.59661102294922, + 108.23934936523438, + 90.85575103759766, + 72.80107879638672 + ], + "bp_grad_per_sample_l2_med": [ + 7.045341044431552e-05, + 7.726218609604985e-05, + 8.23774971649982e-05, + 8.931937190936878e-05, + 9.00102750165388e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5556640625, + "loss_eval": 1.226228952407837, + "epoch": 24 + }, + { + "hidden_norms": [ + 150.7821044921875, + 129.61668395996094, + 108.98286437988281, + 89.68734741210938, + 72.85277557373047 + ], + "bp_grad_per_sample_l2_med": [ + 7.34334607841447e-05, + 7.900002674432471e-05, + 8.469617750961334e-05, + 8.900847751647234e-05, + 8.846351556712762e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.2140324115753174, + "epoch": 25 + }, + { + "hidden_norms": [ + 151.44703674316406, + 129.4413604736328, + 110.14541625976562, + 91.28382110595703, + 74.19001770019531 + ], + "bp_grad_per_sample_l2_med": [ + 6.830286292824894e-05, + 7.440579793183133e-05, + 8.040962711675093e-05, + 8.615498518338427e-05, + 8.749076368985698e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5771484375, + "loss_eval": 1.2101829051971436, + "epoch": 26 + }, + { + "hidden_norms": [ + 153.631591796875, + 132.0617218017578, + 110.9275894165039, + 92.176513671875, + 73.5614242553711 + ], + "bp_grad_per_sample_l2_med": [ + 7.137414650060236e-05, + 7.97546817921102e-05, + 8.503787830704823e-05, + 9.110210521612316e-05, + 9.112519910559058e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1954376697540283, + "epoch": 27 + }, + { + "hidden_norms": [ + 155.2130584716797, + 133.7564697265625, + 113.44039916992188, + 93.51616668701172, + 74.26422882080078 + ], + "bp_grad_per_sample_l2_med": [ + 7.436865416821092e-05, + 8.266629447462037e-05, + 8.722272468730807e-05, + 9.24940686672926e-05, + 9.228193084709346e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.568359375, + "loss_eval": 1.2368288040161133, + "epoch": 28 + }, + { + "hidden_norms": [ + 156.52346801757812, + 134.0899200439453, + 113.28357696533203, + 93.11508178710938, + 74.41522216796875 + ], + "bp_grad_per_sample_l2_med": [ + 7.232115603983402e-05, + 7.883219950599596e-05, + 8.385341061512008e-05, + 8.885351417120546e-05, + 8.985922613646835e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5849609375, + "loss_eval": 1.1935406923294067, + "epoch": 29 + }, + { + "hidden_norms": [ + 157.1343536376953, + 136.0911102294922, + 115.831298828125, + 94.6191177368164, + 74.93243408203125 + ], + "bp_grad_per_sample_l2_med": [ + 6.815487722633407e-05, + 7.527582783950493e-05, + 8.152059308486059e-05, + 8.597332634963095e-05, + 8.487412560498342e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1716928482055664, + "epoch": 30 + }, + { + "hidden_norms": [ + 158.87771606445312, + 136.84617614746094, + 115.38484191894531, + 95.1522445678711, + 75.46046447753906 + ], + "bp_grad_per_sample_l2_med": [ + 7.11698376107961e-05, + 7.946270488901064e-05, + 8.58406419865787e-05, + 8.943407010519877e-05, + 8.97061254363507e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1900701522827148, + "epoch": 31 + }, + { + "hidden_norms": [ + 158.57237243652344, + 135.3989715576172, + 115.39788818359375, + 94.26459503173828, + 74.65320587158203 + ], + "bp_grad_per_sample_l2_med": [ + 7.135280611691996e-05, + 7.875803567003459e-05, + 8.35385944810696e-05, + 9.056212002178654e-05, + 8.802927186479792e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58984375, + "loss_eval": 1.1936118602752686, + "epoch": 32 + }, + { + "hidden_norms": [ + 161.12164306640625, + 138.0847930908203, + 116.51541137695312, + 96.06510925292969, + 75.79708862304688 + ], + "bp_grad_per_sample_l2_med": [ + 7.089033169904724e-05, + 7.788193033775315e-05, + 8.262616029242054e-05, + 8.66727132233791e-05, + 8.98441721801646e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1777372360229492, + "epoch": 33 + }, + { + "hidden_norms": [ + 162.0608673095703, + 138.521728515625, + 117.39189147949219, + 96.19066619873047, + 75.76524353027344 + ], + "bp_grad_per_sample_l2_med": [ + 7.102260860847309e-05, + 7.727317279204726e-05, + 8.381292718695477e-05, + 8.586590411141515e-05, + 8.668057853356004e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1749277114868164, + "epoch": 34 + }, + { + "hidden_norms": [ + 161.66477966308594, + 138.45208740234375, + 118.22246551513672, + 96.99449920654297, + 76.40058135986328 + ], + "bp_grad_per_sample_l2_med": [ + 6.717143696732819e-05, + 7.219286635518074e-05, + 7.78083413024433e-05, + 8.173672540578991e-05, + 8.14773520687595e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.183088779449463, + "epoch": 35 + }, + { + "hidden_norms": [ + 163.6893310546875, + 140.37518310546875, + 119.34339904785156, + 96.78111267089844, + 75.42987823486328 + ], + "bp_grad_per_sample_l2_med": [ + 6.809990736655891e-05, + 7.472001743735746e-05, + 7.982164243003353e-05, + 8.6645879491698e-05, + 8.662666368763894e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.599609375, + "loss_eval": 1.1695549488067627, + "epoch": 36 + }, + { + "hidden_norms": [ + 164.063232421875, + 140.68441772460938, + 118.45069122314453, + 96.70316314697266, + 75.4270248413086 + ], + "bp_grad_per_sample_l2_med": [ + 7.114750769687817e-05, + 7.883143553044647e-05, + 8.33458179840818e-05, + 8.941504347603768e-05, + 8.57952400110662e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1776624917984009, + "epoch": 37 + }, + { + "hidden_norms": [ + 163.89480590820312, + 140.18966674804688, + 119.30622863769531, + 97.97473907470703, + 76.34546661376953 + ], + "bp_grad_per_sample_l2_med": [ + 6.944040069356561e-05, + 7.674084190512076e-05, + 8.196813723770902e-05, + 8.950124902185053e-05, + 8.920513209886849e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1852729320526123, + "epoch": 38 + }, + { + "hidden_norms": [ + 165.47622680664062, + 141.58221435546875, + 119.55635070800781, + 98.0240707397461, + 76.13150787353516 + ], + "bp_grad_per_sample_l2_med": [ + 7.238827674882486e-05, + 7.85816737334244e-05, + 8.403261745115742e-05, + 8.998374687507749e-05, + 8.897150837583467e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1676307916641235, + "epoch": 39 + }, + { + "hidden_norms": [ + 164.69053649902344, + 142.07537841796875, + 121.09794616699219, + 99.6556396484375, + 77.98886108398438 + ], + "bp_grad_per_sample_l2_med": [ + 7.123505201889202e-05, + 7.861913036322221e-05, + 8.443401020485908e-05, + 8.940586121752858e-05, + 8.976398385129869e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1959164142608643, + "epoch": 40 + }, + { + "hidden_norms": [ + 164.97906494140625, + 141.9008026123047, + 120.19933319091797, + 98.47044372558594, + 76.0770263671875 + ], + "bp_grad_per_sample_l2_med": [ + 7.325963088078424e-05, + 8.044692367548123e-05, + 8.460321987513453e-05, + 9.052005771081895e-05, + 8.883728878572583e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1650420427322388, + "epoch": 41 + }, + { + "hidden_norms": [ + 167.11508178710938, + 144.4076690673828, + 121.90902709960938, + 99.70268249511719, + 77.1493911743164 + ], + "bp_grad_per_sample_l2_med": [ + 6.938715523574501e-05, + 7.598697993671522e-05, + 8.122843428282067e-05, + 8.419268124271184e-05, + 8.758077456150204e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.1334974765777588, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.23953247070312, + 143.8128662109375, + 121.41165924072266, + 99.37804412841797, + 76.86026763916016 + ], + "bp_grad_per_sample_l2_med": [ + 7.253287185449153e-05, + 7.92228602222167e-05, + 8.514960791217163e-05, + 9.06435088836588e-05, + 8.896931103663519e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1443839073181152, + "epoch": 43 + }, + { + "hidden_norms": [ + 167.02175903320312, + 143.56179809570312, + 121.07357025146484, + 98.59805297851562, + 76.59933471679688 + ], + "bp_grad_per_sample_l2_med": [ + 7.202434790087864e-05, + 7.884378283051774e-05, + 8.405950211454183e-05, + 8.979378617368639e-05, + 8.789195271674544e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1233543157577515, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.8506622314453, + 144.7351531982422, + 122.07427978515625, + 100.25342559814453, + 77.3443832397461 + ], + "bp_grad_per_sample_l2_med": [ + 6.906851194798946e-05, + 7.469953561667353e-05, + 7.91402708273381e-05, + 8.30625431262888e-05, + 8.482224802719429e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1078553199768066, + "epoch": 45 + }, + { + "hidden_norms": [ + 167.80520629882812, + 145.0210418701172, + 123.11544036865234, + 101.08995056152344, + 77.6504898071289 + ], + "bp_grad_per_sample_l2_med": [ + 6.715168274240568e-05, + 7.365776400547475e-05, + 7.808832015143707e-05, + 8.405041444348171e-05, + 8.283500210382044e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1213364601135254, + "epoch": 46 + }, + { + "hidden_norms": [ + 168.5064697265625, + 144.57977294921875, + 122.67310333251953, + 100.03209686279297, + 76.30200958251953 + ], + "bp_grad_per_sample_l2_med": [ + 7.193082274170592e-05, + 7.761332381051034e-05, + 8.224599878303707e-05, + 8.772317232796922e-05, + 8.76585254445672e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1593999862670898, + "epoch": 47 + }, + { + "hidden_norms": [ + 168.2687225341797, + 145.1931610107422, + 123.04153442382812, + 100.33060455322266, + 77.3511734008789 + ], + "bp_grad_per_sample_l2_med": [ + 7.396154978778213e-05, + 8.14273880678229e-05, + 8.724145300220698e-05, + 9.166308882413432e-05, + 9.03390027815476e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1506351232528687, + "epoch": 48 + }, + { + "hidden_norms": [ + 169.19711303710938, + 145.7348175048828, + 122.21668243408203, + 100.78398895263672, + 77.85338592529297 + ], + "bp_grad_per_sample_l2_med": [ + 7.148115400923416e-05, + 7.858182652853429e-05, + 8.472947956761345e-05, + 8.831475861370564e-05, + 9.002227307064459e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1426208019256592, + "epoch": 49 + }, + { + "hidden_norms": [ + 169.87611389160156, + 144.65980529785156, + 122.2470932006836, + 99.39762115478516, + 76.66820526123047 + ], + "bp_grad_per_sample_l2_med": [ + 7.574502524221316e-05, + 8.358684863196686e-05, + 8.949989569373429e-05, + 9.581056656315923e-05, + 9.291989408666268e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.599609375, + "loss_eval": 1.146412968635559, + "epoch": 50 + }, + { + "hidden_norms": [ + 167.4952850341797, + 143.16302490234375, + 119.86161804199219, + 97.8775863647461, + 75.75617980957031 + ], + "bp_grad_per_sample_l2_med": [ + 7.487049151677638e-05, + 8.140889985952526e-05, + 8.958375110523775e-05, + 9.491044329479337e-05, + 9.230020805262029e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6064453125, + "loss_eval": 1.1555390357971191, + "epoch": 51 + }, + { + "hidden_norms": [ + 169.03530883789062, + 144.57913208007812, + 122.20657348632812, + 100.42291259765625, + 77.34142303466797 + ], + "bp_grad_per_sample_l2_med": [ + 7.283290324267e-05, + 8.043479465413839e-05, + 8.612027886556461e-05, + 9.16399949346669e-05, + 9.119778405874968e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.145568609237671, + "epoch": 52 + }, + { + "hidden_norms": [ + 168.97242736816406, + 144.64987182617188, + 121.88980865478516, + 99.5838394165039, + 76.98419952392578 + ], + "bp_grad_per_sample_l2_med": [ + 7.706385804340243e-05, + 8.52798912092112e-05, + 9.141799091594294e-05, + 9.48576707742177e-05, + 9.280487574869767e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.173735499382019, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.5861053466797, + 145.18853759765625, + 123.36368560791016, + 100.5948257446289, + 77.515380859375 + ], + "bp_grad_per_sample_l2_med": [ + 7.197257218649611e-05, + 7.774284313200042e-05, + 8.511826308676973e-05, + 9.136695007327944e-05, + 8.776389586273581e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.125669240951538, + "epoch": 54 + }, + { + "hidden_norms": [ + 168.54624938964844, + 144.20028686523438, + 120.96566009521484, + 98.61659240722656, + 75.90725708007812 + ], + "bp_grad_per_sample_l2_med": [ + 7.784854824421927e-05, + 8.512740896549076e-05, + 9.021186269819736e-05, + 9.572209819452837e-05, + 9.406798199051991e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.143272042274475, + "epoch": 55 + }, + { + "hidden_norms": [ + 167.1956024169922, + 144.33364868164062, + 121.39191436767578, + 99.15605926513672, + 76.89862060546875 + ], + "bp_grad_per_sample_l2_med": [ + 7.683308649575338e-05, + 8.338083716807887e-05, + 9.210927237290889e-05, + 9.760970715433359e-05, + 9.435461106477305e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1492671966552734, + "epoch": 56 + }, + { + "hidden_norms": [ + 168.5964813232422, + 144.6849365234375, + 122.38106536865234, + 99.73613739013672, + 77.72384643554688 + ], + "bp_grad_per_sample_l2_med": [ + 7.762440509395674e-05, + 8.45814065542072e-05, + 9.048492211150005e-05, + 9.445888281334192e-05, + 9.163413778878748e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.1285452842712402, + "epoch": 57 + }, + { + "hidden_norms": [ + 169.4349365234375, + 145.3781280517578, + 122.81243896484375, + 100.45063781738281, + 77.73384094238281 + ], + "bp_grad_per_sample_l2_med": [ + 7.32980333850719e-05, + 8.07973847258836e-05, + 8.676065772306174e-05, + 8.88932918314822e-05, + 8.98713551578112e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1177959442138672, + "epoch": 58 + }, + { + "hidden_norms": [ + 167.85089111328125, + 143.60365295410156, + 120.23004913330078, + 98.14772033691406, + 76.00984191894531 + ], + "bp_grad_per_sample_l2_med": [ + 7.664797885809094e-05, + 8.470165630569682e-05, + 9.283467807108536e-05, + 9.794873039936647e-05, + 9.169583063339815e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.1301027536392212, + "epoch": 59 + }, + { + "hidden_norms": [ + 167.4250946044922, + 144.43685913085938, + 120.5447769165039, + 98.6132583618164, + 76.67144775390625 + ], + "bp_grad_per_sample_l2_med": [ + 7.264616579050198e-05, + 8.033386984607205e-05, + 8.730305125936866e-05, + 9.157789463642985e-05, + 9.014589886646718e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1262563467025757, + "epoch": 60 + }, + { + "hidden_norms": [ + 167.57273864746094, + 143.9201202392578, + 120.18034362792969, + 99.7088851928711, + 77.43472290039062 + ], + "bp_grad_per_sample_l2_med": [ + 7.527784327976406e-05, + 8.20689310785383e-05, + 8.86347406776622e-05, + 9.488592331763357e-05, + 9.351663175038993e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1255381107330322, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.32432556152344, + 143.3669891357422, + 120.5047378540039, + 98.29914093017578, + 76.91972351074219 + ], + "bp_grad_per_sample_l2_med": [ + 8.1095946370624e-05, + 9.126035001827404e-05, + 9.773251076694578e-05, + 0.00010036173625849187, + 9.892736852634698e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.625, + "loss_eval": 1.121397614479065, + "epoch": 62 + }, + { + "hidden_norms": [ + 167.19789123535156, + 143.76556396484375, + 120.66227722167969, + 98.42743682861328, + 76.89801788330078 + ], + "bp_grad_per_sample_l2_med": [ + 7.633089262526482e-05, + 8.335815800819546e-05, + 9.061676246346906e-05, + 9.574641444487497e-05, + 9.495441918261349e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62109375, + "loss_eval": 1.1192781925201416, + "epoch": 63 + }, + { + "hidden_norms": [ + 166.93948364257812, + 142.26893615722656, + 119.55793762207031, + 97.94837951660156, + 76.42357635498047 + ], + "bp_grad_per_sample_l2_med": [ + 7.782453758409247e-05, + 8.425768464803696e-05, + 9.212247096002102e-05, + 9.447304182685912e-05, + 9.302303078584373e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1216533184051514, + "epoch": 64 + }, + { + "hidden_norms": [ + 166.6027069091797, + 143.06201171875, + 120.18063354492188, + 98.2688217163086, + 76.29009246826172 + ], + "bp_grad_per_sample_l2_med": [ + 8.051560871535912e-05, + 8.871743193594739e-05, + 9.67002852121368e-05, + 0.00010364756599301472, + 9.896839765133336e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1287095546722412, + "epoch": 65 + }, + { + "hidden_norms": [ + 167.1055908203125, + 142.63758850097656, + 119.64879608154297, + 97.64229583740234, + 76.44933319091797 + ], + "bp_grad_per_sample_l2_med": [ + 7.66752491472289e-05, + 8.481083932565525e-05, + 9.087422949960455e-05, + 9.747539297677577e-05, + 9.831935312831774e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62109375, + "loss_eval": 1.1142747402191162, + "epoch": 66 + }, + { + "hidden_norms": [ + 165.7790985107422, + 141.932861328125, + 119.308349609375, + 97.3916244506836, + 76.28073120117188 + ], + "bp_grad_per_sample_l2_med": [ + 8.054008503677323e-05, + 8.828196587273851e-05, + 9.400352428201586e-05, + 0.0001006148086162284, + 9.63730999501422e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.1091513633728027, + "epoch": 67 + }, + { + "hidden_norms": [ + 166.0056915283203, + 142.36737060546875, + 119.14185333251953, + 97.59127044677734, + 76.91047668457031 + ], + "bp_grad_per_sample_l2_med": [ + 7.921652286313474e-05, + 8.842039096634835e-05, + 9.518962178844959e-05, + 9.989101090468466e-05, + 9.532425610814244e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.109208106994629, + "epoch": 68 + }, + { + "hidden_norms": [ + 165.06881713867188, + 141.9323272705078, + 119.31546783447266, + 97.39105987548828, + 76.88532257080078 + ], + "bp_grad_per_sample_l2_med": [ + 7.891654968261719e-05, + 8.609334327047691e-05, + 9.276948549086228e-05, + 9.923002653522417e-05, + 9.674452303443104e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.102659821510315, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.70677185058594, + 141.7493896484375, + 119.19147491455078, + 97.61845397949219, + 76.11932373046875 + ], + "bp_grad_per_sample_l2_med": [ + 8.021068788366392e-05, + 8.757255272939801e-05, + 9.637014591135085e-05, + 0.00010106353875016794, + 9.785306610865518e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1182312965393066, + "epoch": 70 + }, + { + "hidden_norms": [ + 164.398193359375, + 141.26121520996094, + 118.28160095214844, + 96.55244445800781, + 75.79473876953125 + ], + "bp_grad_per_sample_l2_med": [ + 8.341020293300971e-05, + 9.248757123714313e-05, + 9.663405944593251e-05, + 0.00010157335054827854, + 9.801337728276849e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.1038966178894043, + "epoch": 71 + }, + { + "hidden_norms": [ + 164.95956420898438, + 141.71456909179688, + 118.70948028564453, + 96.87312316894531, + 76.1374740600586 + ], + "bp_grad_per_sample_l2_med": [ + 8.227327634813264e-05, + 9.05249617062509e-05, + 9.777413652045652e-05, + 0.00010368443327024579, + 9.96799353742972e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1255979537963867, + "epoch": 72 + }, + { + "hidden_norms": [ + 164.7284393310547, + 140.8751678466797, + 118.047607421875, + 96.35321044921875, + 75.17439270019531 + ], + "bp_grad_per_sample_l2_med": [ + 7.813700358383358e-05, + 8.510561019647866e-05, + 9.316992509411648e-05, + 9.944752673618495e-05, + 9.348603634862229e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6298828125, + "loss_eval": 1.1074620485305786, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.93450927734375, + 140.53248596191406, + 117.69375610351562, + 96.16271209716797, + 75.15106201171875 + ], + "bp_grad_per_sample_l2_med": [ + 8.089678158285096e-05, + 9.048588981386274e-05, + 9.746959403855726e-05, + 0.00010185279097640887, + 9.633745503379032e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.118239164352417, + "epoch": 74 + }, + { + "hidden_norms": [ + 164.21043395996094, + 139.88815307617188, + 117.45735931396484, + 95.94420623779297, + 75.4442138671875 + ], + "bp_grad_per_sample_l2_med": [ + 8.050485485000536e-05, + 8.884233102435246e-05, + 9.638822666602209e-05, + 9.927270002663136e-05, + 9.542587213218212e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1022429466247559, + "epoch": 75 + }, + { + "hidden_norms": [ + 163.64498901367188, + 139.56788635253906, + 117.33267974853516, + 95.80303192138672, + 75.07954406738281 + ], + "bp_grad_per_sample_l2_med": [ + 8.35943064885214e-05, + 9.346263686893508e-05, + 0.0001004879450192675, + 0.00010487801773706451, + 0.0001030422281473875 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.101865530014038, + "epoch": 76 + }, + { + "hidden_norms": [ + 163.15895080566406, + 139.2528533935547, + 116.07748413085938, + 94.62651824951172, + 74.8349380493164 + ], + "bp_grad_per_sample_l2_med": [ + 8.33335579955019e-05, + 9.210313146468252e-05, + 9.823974687606096e-05, + 0.00010392737749498338, + 9.883133316179737e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.107062816619873, + "epoch": 77 + }, + { + "hidden_norms": [ + 162.9849090576172, + 138.823974609375, + 116.6355972290039, + 95.05895233154297, + 74.80722045898438 + ], + "bp_grad_per_sample_l2_med": [ + 8.333245204994455e-05, + 9.167871758108959e-05, + 9.739672532305121e-05, + 0.00010222326818620786, + 9.918824798660353e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.1088743209838867, + "epoch": 78 + }, + { + "hidden_norms": [ + 162.9673614501953, + 138.89553833007812, + 116.67662811279297, + 94.80388641357422, + 74.41240692138672 + ], + "bp_grad_per_sample_l2_med": [ + 8.250313112512231e-05, + 9.097345173358917e-05, + 9.694542677607387e-05, + 0.00010250341438222677, + 9.611865971237421e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1069759130477905, + "epoch": 79 + }, + { + "hidden_norms": [ + 163.01101684570312, + 138.9472198486328, + 116.52082824707031, + 94.81626892089844, + 74.34078216552734 + ], + "bp_grad_per_sample_l2_med": [ + 8.468546730000526e-05, + 9.535141725791618e-05, + 9.998930181609467e-05, + 0.00010477996693225577, + 0.00010350123920943588 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.11004638671875, + "epoch": 80 + }, + { + "hidden_norms": [ + 162.48593139648438, + 138.60171508789062, + 116.15435028076172, + 94.63046264648438, + 74.77122497558594 + ], + "bp_grad_per_sample_l2_med": [ + 8.888062438927591e-05, + 9.835455421125516e-05, + 0.00010451052366988733, + 0.00010972235031658784, + 0.00010192779154749587 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1166486740112305, + "epoch": 81 + }, + { + "hidden_norms": [ + 162.33985900878906, + 138.57908630371094, + 115.86516571044922, + 94.62572479248047, + 74.61656951904297 + ], + "bp_grad_per_sample_l2_med": [ + 8.704938227310777e-05, + 9.788614988792688e-05, + 0.00010670957271941006, + 0.00011224307672819123, + 0.00010563644173089415 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1027870178222656, + "epoch": 82 + }, + { + "hidden_norms": [ + 162.28363037109375, + 137.98855590820312, + 115.68619537353516, + 94.57305145263672, + 74.67822265625 + ], + "bp_grad_per_sample_l2_med": [ + 8.545320451958105e-05, + 9.513215627521276e-05, + 0.00010359021689509973, + 0.00010905940871452913, + 0.00010360238957218826 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1074315309524536, + "epoch": 83 + }, + { + "hidden_norms": [ + 161.65008544921875, + 138.2888946533203, + 115.37015533447266, + 94.0649185180664, + 74.40010070800781 + ], + "bp_grad_per_sample_l2_med": [ + 8.725856605451554e-05, + 9.554363350616768e-05, + 0.00010503961675567552, + 0.00011096282105427235, + 0.00010341637971578166 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.104964017868042, + "epoch": 84 + }, + { + "hidden_norms": [ + 162.56822204589844, + 138.35604858398438, + 115.56212615966797, + 93.74854278564453, + 74.29190826416016 + ], + "bp_grad_per_sample_l2_med": [ + 8.511068881489336e-05, + 9.339748066850007e-05, + 0.00010132823081221431, + 0.00010685007873689756, + 0.00010203333658864722 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.110845923423767, + "epoch": 85 + }, + { + "hidden_norms": [ + 161.8057861328125, + 137.9845733642578, + 115.51632690429688, + 94.12870788574219, + 74.2806167602539 + ], + "bp_grad_per_sample_l2_med": [ + 8.701891783857718e-05, + 9.453850361751392e-05, + 0.00010162424587178975, + 0.00010690372437238693, + 0.0001028447222779505 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.108534574508667, + "epoch": 86 + }, + { + "hidden_norms": [ + 161.5404815673828, + 137.67727661132812, + 115.56287384033203, + 94.2837142944336, + 74.19786834716797 + ], + "bp_grad_per_sample_l2_med": [ + 8.555947715649381e-05, + 9.61149125942029e-05, + 0.00010081662185257301, + 0.00010581265814835206, + 0.00010205370926996693 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.1068053245544434, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.6155242919922, + 137.77752685546875, + 115.26612854003906, + 93.79004669189453, + 74.01652526855469 + ], + "bp_grad_per_sample_l2_med": [ + 8.888345473678783e-05, + 9.766507719177753e-05, + 0.00010646588634699583, + 0.0001093660102924332, + 0.0001023485092446208 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.112060308456421, + "epoch": 88 + }, + { + "hidden_norms": [ + 161.4155731201172, + 137.4070281982422, + 114.93219757080078, + 93.83850860595703, + 74.04694366455078 + ], + "bp_grad_per_sample_l2_med": [ + 8.62668312038295e-05, + 9.635779133532196e-05, + 0.00010364993795519695, + 0.00010628051677485928, + 0.00010416742588859051 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.1054459810256958, + "epoch": 89 + }, + { + "hidden_norms": [ + 161.10385131835938, + 137.37892150878906, + 114.876953125, + 93.37522888183594, + 73.81317901611328 + ], + "bp_grad_per_sample_l2_med": [ + 8.967578469309956e-05, + 9.864033199846745e-05, + 0.00010763857426354662, + 0.00011277131852693856, + 0.0001057170593412593 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1104364395141602, + "epoch": 90 + }, + { + "hidden_norms": [ + 160.9930419921875, + 137.13717651367188, + 114.8873062133789, + 93.33486938476562, + 74.0313949584961 + ], + "bp_grad_per_sample_l2_med": [ + 8.793028973741457e-05, + 9.762586705619469e-05, + 0.00010612032929202542, + 0.00010882189963012934, + 0.00010218457464361563 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.107926607131958, + "epoch": 91 + }, + { + "hidden_norms": [ + 161.131103515625, + 136.96864318847656, + 114.8429183959961, + 93.4638442993164, + 74.06806945800781 + ], + "bp_grad_per_sample_l2_med": [ + 8.899801468942314e-05, + 9.761646651895717e-05, + 0.00010549664148129523, + 0.00011210257798666134, + 0.000105380589957349 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1014349460601807, + "epoch": 92 + }, + { + "hidden_norms": [ + 160.92770385742188, + 137.00291442871094, + 114.67124938964844, + 93.55059051513672, + 73.94056701660156 + ], + "bp_grad_per_sample_l2_med": [ + 8.758921467233449e-05, + 9.86124505288899e-05, + 0.0001072377126547508, + 0.00011291914415778592, + 0.00010492445289855823 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1031121015548706, + "epoch": 93 + }, + { + "hidden_norms": [ + 160.88087463378906, + 136.80621337890625, + 114.49836730957031, + 93.34219360351562, + 73.85013580322266 + ], + "bp_grad_per_sample_l2_med": [ + 8.935505320550874e-05, + 9.829271584749222e-05, + 0.00010722390288719907, + 0.00011369076673872769, + 0.0001048692429321818 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.64453125, + "loss_eval": 1.105837106704712, + "epoch": 94 + }, + { + "hidden_norms": [ + 160.87530517578125, + 136.97203063964844, + 114.57328033447266, + 93.34746551513672, + 73.79950714111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.837936184136197e-05, + 9.732619946589693e-05, + 0.00010843550262507051, + 0.00011282044579274952, + 0.00010489222768228501 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1061646938323975, + "epoch": 95 + }, + { + "hidden_norms": [ + 160.83152770996094, + 136.82012939453125, + 114.41039276123047, + 93.26609802246094, + 73.75130462646484 + ], + "bp_grad_per_sample_l2_med": [ + 8.924134453991428e-05, + 9.699882502900437e-05, + 0.00010844215285032988, + 0.00011508698662510142, + 0.00010382343316450715 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1083133220672607, + "epoch": 96 + }, + { + "hidden_norms": [ + 160.8388214111328, + 136.79220581054688, + 114.45349884033203, + 93.23229217529297, + 73.71869659423828 + ], + "bp_grad_per_sample_l2_med": [ + 8.902873378247023e-05, + 9.731733007356524e-05, + 0.0001077003325917758, + 0.00011335347517160699, + 0.00010528459824854508 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1074192523956299, + "epoch": 97 + }, + { + "hidden_norms": [ + 160.82676696777344, + 136.7546844482422, + 114.41687774658203, + 93.24365234375, + 73.72588348388672 + ], + "bp_grad_per_sample_l2_med": [ + 8.967860048869625e-05, + 9.900779696181417e-05, + 0.00010877639579121023, + 0.00011359385825926438, + 0.0001041799841914326 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1075721979141235, + "epoch": 98 + }, + { + "hidden_norms": [ + 160.8055419921875, + 136.8428955078125, + 114.41191864013672, + 93.23294067382812, + 73.72472381591797 + ], + "bp_grad_per_sample_l2_med": [ + 8.870402962202206e-05, + 9.879077697405592e-05, + 0.00010879703768296167, + 0.00011367550177965313, + 0.00010426441440358758 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.107743263244629, + "epoch": 99 + }, + { + "hidden_norms": [ + 160.795166015625, + 136.82778930664062, + 114.41122436523438, + 93.22368621826172, + 73.72713470458984 + ], + "bp_grad_per_sample_l2_med": [ + 8.868239092407748e-05, + 9.911284723784775e-05, + 0.00010880655463552102, + 0.00011359110794728622, + 0.00010424658830743283 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1077194213867188, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005607507191598415, + 0.0005558764678426087, + 0.0005541853606700897, + 0.0005498801474459469, + 0.0005458085797727108 + ], + "gamma_dfa": 0.002593531389720738, + "gamma_dfa_per_layer": [ + 0.011040969751775265, + 0.0018278355710208416, + -0.019951725378632545, + 0.01745704561471939 + ], + "acc_eval": 0.091796875, + "loss_eval": 2.3707523345947266, + "epoch": 0 + }, + { + "hidden_norms": [ + 543.6214599609375, + 970.167724609375, + 1128.5582275390625, + 1385.4898681640625, + 1506.6824951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006441785371862352, + 0.0006426527979783714, + 0.0006424304447136819, + 0.000642389350105077, + 0.0006423307931981981 + ], + "gamma_dfa": 0.013619338162243366, + "gamma_dfa_per_layer": [ + 0.044537801295518875, + 0.008280456066131592, + -0.026753954589366913, + 0.02841304987668991 + ], + "acc_eval": 0.224609375, + "loss_eval": 7.057413101196289, + "epoch": 1 + }, + { + "hidden_norms": [ + 877.8099365234375, + 2093.12060546875, + 2686.85400390625, + 3536.0849609375, + 3998.738037109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007192303892225027, + 0.000718857510946691, + 0.0007187117007561028, + 0.0007188154268078506, + 0.0007185889990068972 + ], + "gamma_dfa": -0.0027784015983343124, + "gamma_dfa_per_layer": [ + 0.04956255108118057, + -0.024007968604564667, + -0.02988382987678051, + -0.006784358993172646 + ], + "acc_eval": 0.2197265625, + "loss_eval": 11.82400131225586, + "epoch": 2 + }, + { + "hidden_norms": [ + 1082.57763671875, + 3122.52001953125, + 4171.595703125, + 5502.81494140625, + 6367.2392578125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007569500594399869, + 0.0007553253090009093, + 0.0007550596492365003, + 0.0007549565634690225, + 0.0007544843829236925 + ], + "gamma_dfa": -0.004858810920268297, + "gamma_dfa_per_layer": [ + 0.06696394830942154, + -0.024477044120430946, + -0.04227307811379433, + -0.019649069756269455 + ], + "acc_eval": 0.18359375, + "loss_eval": 24.264713287353516, + "epoch": 3 + }, + { + "hidden_norms": [ + 1244.07275390625, + 4114.89111328125, + 5548.310546875, + 7262.12744140625, + 8410.1474609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007311897934414446, + 0.0007286664913408458, + 0.0007287323824129999, + 0.0007287483895197511, + 0.0007287858170457184 + ], + "gamma_dfa": -0.003940413473173976, + "gamma_dfa_per_layer": [ + 0.06546925008296967, + -0.03793267905712128, + -0.03520221635699272, + -0.008096008561551571 + ], + "acc_eval": 0.197265625, + "loss_eval": 21.850379943847656, + "epoch": 4 + }, + { + "hidden_norms": [ + 1357.7320556640625, + 5130.4609375, + 7149.40380859375, + 9744.58984375, + 11396.052734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000750180275645107, + 0.0007480062777176499, + 0.0007475404418073595, + 0.0007476753671653569, + 0.0007474455051124096 + ], + "gamma_dfa": -6.745467544533312e-06, + "gamma_dfa_per_layer": [ + 0.08006488531827927, + -0.0292807687073946, + -0.04997118189930916, + -0.0008399165817536414 + ], + "acc_eval": 0.2314453125, + "loss_eval": 30.650737762451172, + "epoch": 5 + }, + { + "hidden_norms": [ + 1438.5594482421875, + 5736.68994140625, + 8271.92578125, + 11658.373046875, + 13768.2861328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000744938850402832, + 0.0007369474042207003, + 0.0007347911596298218, + 0.0007346841157414019, + 0.000734883826225996 + ], + "gamma_dfa": -0.0024929028004407883, + "gamma_dfa_per_layer": [ + 0.08933529257774353, + -0.03695790469646454, + -0.04257381707429886, + -0.019775182008743286 + ], + "acc_eval": 0.23046875, + "loss_eval": 42.61720275878906, + "epoch": 6 + }, + { + "hidden_norms": [ + 1512.00244140625, + 6517.73779296875, + 9229.724609375, + 13440.5166015625, + 16669.212890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007609400781802833, + 0.0007555288611911237, + 0.0007558621582575142, + 0.0007557112840004265, + 0.0007554451585747302 + ], + "gamma_dfa": -0.007545993197709322, + "gamma_dfa_per_layer": [ + 0.08795229345560074, + -0.03476891666650772, + -0.06410981714725494, + -0.01925753243267536 + ], + "acc_eval": 0.208984375, + "loss_eval": 50.873321533203125, + "epoch": 7 + }, + { + "hidden_norms": [ + 1582.1080322265625, + 7188.6318359375, + 9899.5947265625, + 15346.5009765625, + 19886.591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007456639432348311, + 0.0007417471497319639, + 0.0007396289147436619, + 0.0007396984728984535, + 0.0007395402644760907 + ], + "gamma_dfa": -0.009718619287014008, + "gamma_dfa_per_layer": [ + 0.09109380096197128, + -0.042414966970682144, + -0.04605134204030037, + -0.0415019690990448 + ], + "acc_eval": 0.189453125, + "loss_eval": 54.14390182495117, + "epoch": 8 + }, + { + "hidden_norms": [ + 1618.51708984375, + 7916.01416015625, + 10608.3408203125, + 17416.95703125, + 24058.658203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007598118390887976, + 0.0007534913602285087, + 0.0007532819290645421, + 0.0007532560266554356, + 0.0007529302965849638 + ], + "gamma_dfa": 0.0011779842898249626, + "gamma_dfa_per_layer": [ + 0.10601411014795303, + -0.0355507917702198, + -0.04322661831974983, + -0.022524762898683548 + ], + "acc_eval": 0.169921875, + "loss_eval": 79.9201889038086, + "epoch": 9 + }, + { + "hidden_norms": [ + 1708.6558837890625, + 8872.5908203125, + 11589.568359375, + 19666.24609375, + 28447.203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000754358887206763, + 0.0007440761546604335, + 0.0007443547365255654, + 0.0007444044458679855, + 0.0007447295938618481 + ], + "gamma_dfa": -0.006681790575385094, + "gamma_dfa_per_layer": [ + 0.12310357391834259, + -0.054726000875234604, + -0.061426255851984024, + -0.03367847949266434 + ], + "acc_eval": 0.189453125, + "loss_eval": 117.76714324951172, + "epoch": 10 + }, + { + "hidden_norms": [ + 1757.5994873046875, + 10265.8017578125, + 13090.66796875, + 22099.814453125, + 34584.30078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000756443478167057, + 0.0007464477675966918, + 0.000743720680475235, + 0.0007434834260493517, + 0.0007420994224958122 + ], + "gamma_dfa": -0.01398628018796444, + "gamma_dfa_per_layer": [ + 0.12564796209335327, + -0.05404478684067726, + -0.07238315045833588, + -0.05516514554619789 + ], + "acc_eval": 0.189453125, + "loss_eval": 103.90010070800781, + "epoch": 11 + }, + { + "hidden_norms": [ + 1799.9754638671875, + 11735.4208984375, + 14739.4091796875, + 24244.48828125, + 40467.53125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007648739847354591, + 0.0007477994076907635, + 0.0007476488244719803, + 0.0007475496386177838, + 0.0007478601182810962 + ], + "gamma_dfa": -0.005489904433488846, + "gamma_dfa_per_layer": [ + 0.1469549834728241, + -0.04884009808301926, + -0.05759190022945404, + -0.06248260289430618 + ], + "acc_eval": 0.2041015625, + "loss_eval": 124.61287689208984, + "epoch": 12 + }, + { + "hidden_norms": [ + 1851.51123046875, + 13681.8662109375, + 17609.712890625, + 27533.84375, + 52049.0703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007830688264220953, + 0.0007742528687231243, + 0.0007744400063529611, + 0.0007723497110418975, + 0.0007720965659245849 + ], + "gamma_dfa": -0.0014207642525434494, + "gamma_dfa_per_layer": [ + 0.18515333533287048, + -0.04434240236878395, + -0.09712066501379013, + -0.0493733249604702 + ], + "acc_eval": 0.142578125, + "loss_eval": 212.8883056640625, + "epoch": 13 + }, + { + "hidden_norms": [ + 1899.2525634765625, + 16269.4736328125, + 21580.724609375, + 31947.771484375, + 66851.5703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000794055697042495, + 0.0007606232538819313, + 0.0007601877441629767, + 0.0007598533411510289, + 0.000759296934120357 + ], + "gamma_dfa": 0.012796862982213497, + "gamma_dfa_per_layer": [ + 0.206809401512146, + -0.04797299578785896, + -0.0716182291507721, + -0.03603072464466095 + ], + "acc_eval": 0.1591796875, + "loss_eval": 268.9534912109375, + "epoch": 14 + }, + { + "hidden_norms": [ + 1988.337890625, + 20679.96484375, + 27719.126953125, + 37757.640625, + 86759.0234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007827074150554836, + 0.0007373052649199963, + 0.0007380677270703018, + 0.000736265501473099, + 0.0007371739484369755 + ], + "gamma_dfa": 0.003913283348083496, + "gamma_dfa_per_layer": [ + 0.18332748115062714, + -0.05311701446771622, + -0.06076449155807495, + -0.053792841732501984 + ], + "acc_eval": 0.2548828125, + "loss_eval": 367.0162048339844, + "epoch": 15 + }, + { + "hidden_norms": [ + 2074.877685546875, + 25397.2421875, + 35934.484375, + 45723.14453125, + 111497.4296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008315286249853671, + 0.0007900919299572706, + 0.0007844009087421, + 0.0007838390883989632, + 0.0007860813639126718 + ], + "gamma_dfa": -0.002616437152028084, + "gamma_dfa_per_layer": [ + 0.21044191718101501, + -0.05741831660270691, + -0.1141648143529892, + -0.049324534833431244 + ], + "acc_eval": 0.1220703125, + "loss_eval": 449.4093322753906, + "epoch": 16 + }, + { + "hidden_norms": [ + 2160.0703125, + 30060.396484375, + 43998.6953125, + 54128.03515625, + 137197.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007943993550725281, + 0.0007568124565295875, + 0.0007565468549728394, + 0.0007549119181931019, + 0.0007542246603406966 + ], + "gamma_dfa": 0.005578489974141121, + "gamma_dfa_per_layer": [ + 0.21836650371551514, + -0.057003527879714966, + -0.08258379250764847, + -0.05646522343158722 + ], + "acc_eval": 0.2099609375, + "loss_eval": 505.51385498046875, + "epoch": 17 + }, + { + "hidden_norms": [ + 2261.926025390625, + 35914.08203125, + 53701.83203125, + 65022.0234375, + 174995.234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008322449866682291, + 0.0007640637923032045, + 0.0007639409159310162, + 0.000764198659453541, + 0.0007642150158062577 + ], + "gamma_dfa": 0.017949961125850677, + "gamma_dfa_per_layer": [ + 0.23718158900737762, + -0.05374513193964958, + -0.062201935797929764, + -0.04943467676639557 + ], + "acc_eval": 0.2109375, + "loss_eval": 610.7471923828125, + "epoch": 18 + }, + { + "hidden_norms": [ + 2326.78271484375, + 42755.171875, + 66353.453125, + 77731.328125, + 221615.828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008451915346086025, + 0.0007553622708655894, + 0.0007553161703981459, + 0.0007546090637333691, + 0.0007550025475211442 + ], + "gamma_dfa": 0.029257358983159065, + "gamma_dfa_per_layer": [ + 0.26171058416366577, + -0.04214981198310852, + -0.06413372606039047, + -0.03839761018753052 + ], + "acc_eval": 0.19921875, + "loss_eval": 652.3941650390625, + "epoch": 19 + }, + { + "hidden_norms": [ + 2443.6630859375, + 48300.12109375, + 77390.1015625, + 91484.09375, + 270700.96875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009103405755013227, + 0.0007761572487652302, + 0.0007760545704513788, + 0.0007730794604867697, + 0.0007728201453574002 + ], + "gamma_dfa": 0.017114468850195408, + "gamma_dfa_per_layer": [ + 0.26115190982818604, + -0.050561077892780304, + -0.08694136142730713, + -0.05519159510731697 + ], + "acc_eval": 0.1669921875, + "loss_eval": 1354.747314453125, + "epoch": 20 + }, + { + "hidden_norms": [ + 2499.429931640625, + 57379.33203125, + 93242.0859375, + 111601.9921875, + 332709.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010016581509262323, + 0.0007549687870778143, + 0.0007551733287982643, + 0.0007543734973296523, + 0.0007547553977929056 + ], + "gamma_dfa": 0.047867871820926666, + "gamma_dfa_per_layer": [ + 0.3270750641822815, + -0.037589848041534424, + -0.06097441166639328, + -0.037039317190647125 + ], + "acc_eval": 0.2041015625, + "loss_eval": 1818.91650390625, + "epoch": 21 + }, + { + "hidden_norms": [ + 2615.140625, + 75715.7109375, + 109683.390625, + 132553.84375, + 406621.46875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008831259910948575, + 0.0007625823491252959, + 0.0007627239683642983, + 0.0007604075944982469, + 0.0007611791370436549 + ], + "gamma_dfa": 0.022762255743145943, + "gamma_dfa_per_layer": [ + 0.27839380502700806, + -0.05395745486021042, + -0.07682197540998459, + -0.05656535178422928 + ], + "acc_eval": 0.2119140625, + "loss_eval": 1167.954833984375, + "epoch": 22 + }, + { + "hidden_norms": [ + 2742.37353515625, + 97227.28125, + 131140.8125, + 155048.3125, + 481929.84375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001124670379795134, + 0.0007696108077652752, + 0.0007702686125412583, + 0.0007697975379414856, + 0.0007697619148530066 + ], + "gamma_dfa": 0.03202100656926632, + "gamma_dfa_per_layer": [ + 0.300557404756546, + -0.04680653661489487, + -0.052118271589279175, + -0.0735485702753067 + ], + "acc_eval": 0.240234375, + "loss_eval": 2470.89453125, + "epoch": 23 + }, + { + "hidden_norms": [ + 2858.224609375, + 126260.15625, + 160387.703125, + 186178.890625, + 564007.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001086456119082868, + 0.0007698858971707523, + 0.0007706494652666152, + 0.0007701858412474394, + 0.0007703170995227993 + ], + "gamma_dfa": 0.03411092050373554, + "gamma_dfa_per_layer": [ + 0.3229827582836151, + -0.03976103663444519, + -0.05624774843454361, + -0.09053029119968414 + ], + "acc_eval": 0.2080078125, + "loss_eval": 1589.14599609375, + "epoch": 24 + }, + { + "hidden_norms": [ + 3010.89697265625, + 156964.375, + 194623.5, + 223223.875, + 662826.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010667620226740837, + 0.0007900846539996564, + 0.0007894287118688226, + 0.0007884356309659779, + 0.0007912488654255867 + ], + "gamma_dfa": 0.03901553526520729, + "gamma_dfa_per_layer": [ + 0.34151530265808105, + -0.04678330570459366, + -0.06850147247314453, + -0.0701683834195137 + ], + "acc_eval": 0.19921875, + "loss_eval": 1886.69091796875, + "epoch": 25 + }, + { + "hidden_norms": [ + 3121.8056640625, + 191038.40625, + 232148.296875, + 265744.1875, + 761219.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011186219053342938, + 0.0007986227865330875, + 0.0007986134733073413, + 0.0007980577065609396, + 0.0007973008905537426 + ], + "gamma_dfa": 0.027425863780081272, + "gamma_dfa_per_layer": [ + 0.35862213373184204, + -0.061674464493989944, + -0.0841888040304184, + -0.10305541008710861 + ], + "acc_eval": 0.185546875, + "loss_eval": 1700.765869140625, + "epoch": 26 + }, + { + "hidden_norms": [ + 3283.62646484375, + 232390.3125, + 279218.25, + 315312.8125, + 875470.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001439103507436812, + 0.0007854723371565342, + 0.0007857424207031727, + 0.0007855244330130517, + 0.0007853199495002627 + ], + "gamma_dfa": 0.03129031043499708, + "gamma_dfa_per_layer": [ + 0.33073610067367554, + -0.058702368289232254, + -0.06629009544849396, + -0.080582395195961 + ], + "acc_eval": 0.201171875, + "loss_eval": 3809.69873046875, + "epoch": 27 + }, + { + "hidden_norms": [ + 3407.8984375, + 272082.28125, + 324674.25, + 365055.125, + 983575.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.001244095852598548, + 0.0008176793926395476, + 0.0008168797940015793, + 0.000815192295704037, + 0.0008157575502991676 + ], + "gamma_dfa": 0.02919871360063553, + "gamma_dfa_per_layer": [ + 0.3321998715400696, + -0.048228584229946136, + -0.057734884321689606, + -0.10944154858589172 + ], + "acc_eval": 0.1650390625, + "loss_eval": 5145.80615234375, + "epoch": 28 + }, + { + "hidden_norms": [ + 3570.579833984375, + 325919.34375, + 383859.84375, + 429527.59375, + 1121656.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013903328217566013, + 0.0008181754965335131, + 0.0008133396040648222, + 0.0008111604838632047, + 0.0008120551356114447 + ], + "gamma_dfa": 0.04902177257463336, + "gamma_dfa_per_layer": [ + 0.33004581928253174, + -0.017712868750095367, + -0.016218842938542366, + -0.10002701729536057 + ], + "acc_eval": 0.1220703125, + "loss_eval": 4755.40869140625, + "epoch": 29 + }, + { + "hidden_norms": [ + 3675.836181640625, + 381066.84375, + 446664.84375, + 495540.4375, + 1244910.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013685236917808652, + 0.0007945130346342921, + 0.0007943777018226683, + 0.0007925048121251166, + 0.0007924467790871859 + ], + "gamma_dfa": 0.01623274479061365, + "gamma_dfa_per_layer": [ + 0.27984413504600525, + -0.06000320240855217, + -0.06209240108728409, + -0.09281755238771439 + ], + "acc_eval": 0.1962890625, + "loss_eval": 3555.3525390625, + "epoch": 30 + }, + { + "hidden_norms": [ + 3779.81103515625, + 443408.34375, + 515845.65625, + 568047.125, + 1396404.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001294015790335834, + 0.0007740295841358602, + 0.0007753889658488333, + 0.0007745815673843026, + 0.000773973239120096 + ], + "gamma_dfa": 0.048758171033114195, + "gamma_dfa_per_layer": [ + 0.3447470963001251, + -0.05413726717233658, + -0.0899808406829834, + -0.005596304312348366 + ], + "acc_eval": 0.1103515625, + "loss_eval": 8851.5302734375, + "epoch": 31 + }, + { + "hidden_norms": [ + 3920.750732421875, + 517289.40625, + 595296.5625, + 655510.1875, + 1569922.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001448597526177764, + 0.0008134506642818451, + 0.0008149920613504946, + 0.0008116801618598402, + 0.0008117944234982133 + ], + "gamma_dfa": 0.016455436125397682, + "gamma_dfa_per_layer": [ + 0.28803595900535583, + -0.048596471548080444, + -0.07654894888401031, + -0.09706879407167435 + ], + "acc_eval": 0.1767578125, + "loss_eval": 4626.505859375, + "epoch": 32 + }, + { + "hidden_norms": [ + 4035.357666015625, + 605458.75, + 691596.8125, + 758344.75, + 1762235.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013269236078485847, + 0.0007732360390946269, + 0.0007741436711512506, + 0.000773612700868398, + 0.0007734647369943559 + ], + "gamma_dfa": 0.029436825774610043, + "gamma_dfa_per_layer": [ + 0.2940990924835205, + -0.04052134230732918, + -0.05536778271198273, + -0.08046266436576843 + ], + "acc_eval": 0.2578125, + "loss_eval": 2423.88037109375, + "epoch": 33 + }, + { + "hidden_norms": [ + 4180.47998046875, + 680883.875, + 781089.375, + 856024.9375, + 1949442.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015648282133042812, + 0.0007914449088275433, + 0.0007915649330243468, + 0.0007914216257631779, + 0.0007914576563052833 + ], + "gamma_dfa": 0.019646714441478252, + "gamma_dfa_per_layer": [ + 0.2821764647960663, + -0.0451091043651104, + -0.08556324988603592, + -0.07291725277900696 + ], + "acc_eval": 0.2314453125, + "loss_eval": 3942.80810546875, + "epoch": 34 + }, + { + "hidden_norms": [ + 4309.49462890625, + 763385.4375, + 877493.9375, + 964321.4375, + 2131046.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001357953529804945, + 0.0008006176794879138, + 0.000801383052021265, + 0.0008009205921553075, + 0.0008007651194930077 + ], + "gamma_dfa": 0.012816952541470528, + "gamma_dfa_per_layer": [ + 0.3179120421409607, + -0.07943161576986313, + -0.08064424991607666, + -0.1065683662891388 + ], + "acc_eval": 0.1904296875, + "loss_eval": 4230.3056640625, + "epoch": 35 + }, + { + "hidden_norms": [ + 4492.82568359375, + 851087.875, + 976163.875, + 1072469.125, + 2314147.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001730966498143971, + 0.000772459723521024, + 0.0007729437202215195, + 0.0007728235796093941, + 0.0007726353942416608 + ], + "gamma_dfa": 0.03693788964301348, + "gamma_dfa_per_layer": [ + 0.29988259077072144, + -0.0496492013335228, + -0.08479931950569153, + -0.0176825113594532 + ], + "acc_eval": 0.1484375, + "loss_eval": 8231.34765625, + "epoch": 36 + }, + { + "hidden_norms": [ + 4624.63720703125, + 951948.25, + 1092683.875, + 1196542.75, + 2542183.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002538386033847928, + 0.0007714434177614748, + 0.0007710265927016735, + 0.0007713963277637959, + 0.0007713483064435422 + ], + "gamma_dfa": 0.04740711580961943, + "gamma_dfa_per_layer": [ + 0.33979880809783936, + -0.04041346162557602, + -0.07300114631652832, + -0.03675573691725731 + ], + "acc_eval": 0.1923828125, + "loss_eval": 8949.130859375, + "epoch": 37 + }, + { + "hidden_norms": [ + 4807.11767578125, + 1054507.625, + 1214753.0, + 1323814.0, + 2764538.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0027727719862014055, + 0.000796200183685869, + 0.0007976335473358631, + 0.0007973454194143414, + 0.0007971985614858568 + ], + "gamma_dfa": 0.08554775826632977, + "gamma_dfa_per_layer": [ + 0.5049943923950195, + -0.037710923701524734, + -0.07092456519603729, + -0.05416787043213844 + ], + "acc_eval": 0.1162109375, + "loss_eval": 12713.4443359375, + "epoch": 38 + }, + { + "hidden_norms": [ + 4955.41943359375, + 1174053.875, + 1354818.125, + 1476400.375, + 3014463.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020058690570294857, + 0.0008079316467046738, + 0.0008077211095951498, + 0.0008079909021034837, + 0.000808066048193723 + ], + "gamma_dfa": -0.01097937673330307, + "gamma_dfa_per_layer": [ + 0.23371317982673645, + -0.07769355922937393, + -0.08009498566389084, + -0.11984214186668396 + ], + "acc_eval": 0.169921875, + "loss_eval": 5398.2822265625, + "epoch": 39 + }, + { + "hidden_norms": [ + 5098.02978515625, + 1282560.25, + 1488493.125, + 1621443.25, + 3242451.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017661951715126634, + 0.0007956374902278185, + 0.0007964695687405765, + 0.0007961427327245474, + 0.0007956251502037048 + ], + "gamma_dfa": 0.022673148661851883, + "gamma_dfa_per_layer": [ + 0.3096145689487457, + -0.05532063543796539, + -0.08393190801143646, + -0.07966943085193634 + ], + "acc_eval": 0.185546875, + "loss_eval": 4639.80908203125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5239.9326171875, + 1391390.625, + 1615340.375, + 1765558.375, + 3480115.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020867532584816217, + 0.0007667955360375345, + 0.0007673996733501554, + 0.0007673778454773128, + 0.0007672442006878555 + ], + "gamma_dfa": 0.0395392719656229, + "gamma_dfa_per_layer": [ + 0.33367329835891724, + -0.043648943305015564, + -0.055444151163101196, + -0.07642311602830887 + ], + "acc_eval": 0.234375, + "loss_eval": 9990.30859375, + "epoch": 41 + }, + { + "hidden_norms": [ + 5359.44677734375, + 1521280.0, + 1767789.625, + 1930907.75, + 3750866.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017118212999776006, + 0.0007934573804959655, + 0.0007942463853396475, + 0.000793949409853667, + 0.0007934118038974702 + ], + "gamma_dfa": 0.03361810464411974, + "gamma_dfa_per_layer": [ + 0.3103788495063782, + -0.03702692314982414, + -0.055835530161857605, + -0.08304397761821747 + ], + "acc_eval": 0.216796875, + "loss_eval": 9768.205078125, + "epoch": 42 + }, + { + "hidden_norms": [ + 5546.62451171875, + 1660698.625, + 1925789.375, + 2096456.25, + 4028953.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017267497023567557, + 0.000821329711470753, + 0.0008239842718467116, + 0.0008229895029217005, + 0.0008229521918110549 + ], + "gamma_dfa": 0.029660841450095177, + "gamma_dfa_per_layer": [ + 0.35288333892822266, + -0.043948374688625336, + -0.0895853042602539, + -0.10070629417896271 + ], + "acc_eval": 0.1884765625, + "loss_eval": 8935.0380859375, + "epoch": 43 + }, + { + "hidden_norms": [ + 5664.30810546875, + 1784317.875, + 2078188.375, + 2264432.75, + 4288914.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022900900803506374, + 0.0007636325899511576, + 0.0007642185082659125, + 0.0007641956908628345, + 0.0007639650139026344 + ], + "gamma_dfa": 0.06175872636958957, + "gamma_dfa_per_layer": [ + 0.4067830443382263, + -0.03052734024822712, + -0.06545087695121765, + -0.06376992166042328 + ], + "acc_eval": 0.2197265625, + "loss_eval": 8287.39453125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5794.2666015625, + 1915382.125, + 2237977.75, + 2434797.75, + 4568056.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001793600502423942, + 0.0008144167950376868, + 0.0008172079687938094, + 0.0008157116826623678, + 0.0008155000978149474 + ], + "gamma_dfa": 0.034024693071842194, + "gamma_dfa_per_layer": [ + 0.35199591517448425, + -0.03579515218734741, + -0.09812411665916443, + -0.08197787404060364 + ], + "acc_eval": 0.1806640625, + "loss_eval": 8560.4384765625, + "epoch": 45 + }, + { + "hidden_norms": [ + 5928.12158203125, + 2057562.625, + 2403872.5, + 2624509.5, + 4865204.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001855076989158988, + 0.0007629086030647159, + 0.0007635788642801344, + 0.0007633934146724641, + 0.0007630206528119743 + ], + "gamma_dfa": 0.023082666099071503, + "gamma_dfa_per_layer": [ + 0.27648454904556274, + -0.05024096742272377, + -0.0845799595117569, + -0.049332957714796066 + ], + "acc_eval": 0.197265625, + "loss_eval": 10714.77734375, + "epoch": 46 + }, + { + "hidden_norms": [ + 6079.8232421875, + 2190046.5, + 2564464.5, + 2797927.0, + 5132383.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015576905570924282, + 0.0007896191673353314, + 0.0007904896046966314, + 0.0007902018842287362, + 0.0007895485614426434 + ], + "gamma_dfa": 0.03866780921816826, + "gamma_dfa_per_layer": [ + 0.37201371788978577, + -0.049719154834747314, + -0.07755836844444275, + -0.09006495773792267 + ], + "acc_eval": 0.19140625, + "loss_eval": 7322.5205078125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6184.03369140625, + 2339567.0, + 2744136.25, + 2990721.25, + 5426845.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020522314589470625, + 0.0007883926737122238, + 0.0007893759175203741, + 0.0007890417473390698, + 0.0007883401704020798 + ], + "gamma_dfa": 0.021758251823484898, + "gamma_dfa_per_layer": [ + 0.2855323553085327, + -0.04375234618782997, + -0.07049872726202011, + -0.08424827456474304 + ], + "acc_eval": 0.2080078125, + "loss_eval": 13975.05859375, + "epoch": 48 + }, + { + "hidden_norms": [ + 6295.5458984375, + 2477445.75, + 2917469.0, + 3179694.0, + 5727252.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002105356426909566, + 0.0008074102224782109, + 0.0008063287241384387, + 0.000806407246273011, + 0.0008067074231803417 + ], + "gamma_dfa": 0.0267162024974823, + "gamma_dfa_per_layer": [ + 0.30986034870147705, + -0.05209521949291229, + -0.09783680737018585, + -0.05306351184844971 + ], + "acc_eval": 0.1435546875, + "loss_eval": 9590.544921875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6367.55029296875, + 2638468.75, + 3095811.75, + 3362978.75, + 6030941.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015475827967748046, + 0.0008064319263212383, + 0.0008070095209404826, + 0.0008065010770224035, + 0.0008065410074777901 + ], + "gamma_dfa": 0.00636688619852066, + "gamma_dfa_per_layer": [ + 0.29843205213546753, + -0.03980886936187744, + -0.06682014465332031, + -0.16633549332618713 + ], + "acc_eval": 0.11328125, + "loss_eval": 12254.064453125, + "epoch": 50 + }, + { + "hidden_norms": [ + 6482.18798828125, + 2769282.5, + 3257572.75, + 3548043.5, + 6284645.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022430147510021925, + 0.0008079760009422898, + 0.000807179429102689, + 0.0008071344927884638, + 0.0008072732598520815 + ], + "gamma_dfa": 0.04464401211589575, + "gamma_dfa_per_layer": [ + 0.3536185026168823, + -0.02255946770310402, + -0.07369404286146164, + -0.07878894358873367 + ], + "acc_eval": 0.181640625, + "loss_eval": 10079.115234375, + "epoch": 51 + }, + { + "hidden_norms": [ + 6566.8623046875, + 2899506.0, + 3420720.5, + 3728966.75, + 6555012.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001695870072580874, + 0.000820032088086009, + 0.0008200806332752109, + 0.0008201819728128612, + 0.0008201953023672104 + ], + "gamma_dfa": 0.034856872633099556, + "gamma_dfa_per_layer": [ + 0.3895777463912964, + -0.057720690965652466, + -0.08937396109104156, + -0.10305560380220413 + ], + "acc_eval": 0.1181640625, + "loss_eval": 10401.4013671875, + "epoch": 52 + }, + { + "hidden_norms": [ + 6618.705078125, + 3056073.5, + 3608076.25, + 3938206.0, + 6870646.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014620226575061679, + 0.000811390345916152, + 0.0008111409260891378, + 0.000811099074780941, + 0.000811324454843998 + ], + "gamma_dfa": 0.002492595463991165, + "gamma_dfa_per_layer": [ + 0.2934489846229553, + -0.07660828530788422, + -0.0814061164855957, + -0.12546420097351074 + ], + "acc_eval": 0.16796875, + "loss_eval": 11906.7060546875, + "epoch": 53 + }, + { + "hidden_norms": [ + 6674.03759765625, + 3201735.0, + 3787927.75, + 4133561.75, + 7173546.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015491953818127513, + 0.0007825249340385199, + 0.0007832346600480378, + 0.0007830507238395512, + 0.0007823925698176026 + ], + "gamma_dfa": 0.054443607572466135, + "gamma_dfa_per_layer": [ + 0.38785266876220703, + -0.022086789831519127, + -0.062120988965034485, + -0.08587045967578888 + ], + "acc_eval": 0.2373046875, + "loss_eval": 9465.3525390625, + "epoch": 54 + }, + { + "hidden_norms": [ + 6740.52392578125, + 3338670.5, + 3953341.75, + 4315309.5, + 7447204.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015645271632820368, + 0.0007820724858902395, + 0.0007820809260010719, + 0.0007819690508767962, + 0.0007819557213224471 + ], + "gamma_dfa": 0.027317455038428307, + "gamma_dfa_per_layer": [ + 0.3320838212966919, + -0.06272841989994049, + -0.06253603100776672, + -0.09754955023527145 + ], + "acc_eval": 0.1923828125, + "loss_eval": 9605.2587890625, + "epoch": 55 + }, + { + "hidden_norms": [ + 6826.42578125, + 3488233.5, + 4125392.0, + 4514242.0, + 7747655.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018625661032274365, + 0.0008403572137467563, + 0.0008396300836466253, + 0.0008392629097215831, + 0.000840048654936254 + ], + "gamma_dfa": 0.018042685464024544, + "gamma_dfa_per_layer": [ + 0.34575170278549194, + -0.061284519731998444, + -0.08629278838634491, + -0.12600365281105042 + ], + "acc_eval": 0.1494140625, + "loss_eval": 13453.193359375, + "epoch": 56 + }, + { + "hidden_norms": [ + 6878.60009765625, + 3647417.5, + 4303500.5, + 4707215.0, + 8039602.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001495232223533094, + 0.0008112883078865707, + 0.0008119228295981884, + 0.0008115706732496619, + 0.0008112648501992226 + ], + "gamma_dfa": 0.025581182446330786, + "gamma_dfa_per_layer": [ + 0.301077663898468, + -0.015085713937878609, + -0.07233025878667831, + -0.11133696138858795 + ], + "acc_eval": 0.1513671875, + "loss_eval": 10446.5498046875, + "epoch": 57 + }, + { + "hidden_norms": [ + 6956.30126953125, + 3782040.0, + 4474453.5, + 4889139.0, + 8311892.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001576881273649633, + 0.0008043631678447127, + 0.0008050674805417657, + 0.0008046348229981959, + 0.0008046681759878993 + ], + "gamma_dfa": 0.005857756361365318, + "gamma_dfa_per_layer": [ + 0.28321602940559387, + -0.03702875226736069, + -0.06707675755023956, + -0.15567949414253235 + ], + "acc_eval": 0.1484375, + "loss_eval": 6591.0849609375, + "epoch": 58 + }, + { + "hidden_norms": [ + 7021.955078125, + 3911149.5, + 4636672.0, + 5064123.0, + 8571758.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002099651610478759, + 0.0008183405152522027, + 0.0008207465871237218, + 0.0008196401176974177, + 0.000819449604023248 + ], + "gamma_dfa": 0.006074780598282814, + "gamma_dfa_per_layer": [ + 0.2577749490737915, + -0.05066239833831787, + -0.06501314789056778, + -0.1178002804517746 + ], + "acc_eval": 0.2109375, + "loss_eval": 7962.04443359375, + "epoch": 59 + }, + { + "hidden_norms": [ + 7101.7373046875, + 4061103.5, + 4820611.0, + 5257086.0, + 8861818.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018932655220851302, + 0.0008025900460779667, + 0.0008032865589484572, + 0.000802954426035285, + 0.0008029173477552831 + ], + "gamma_dfa": 0.020984639413654804, + "gamma_dfa_per_layer": [ + 0.3329803943634033, + -0.03559138998389244, + -0.06842450797557831, + -0.14502593874931335 + ], + "acc_eval": 0.1650390625, + "loss_eval": 8638.353515625, + "epoch": 60 + }, + { + "hidden_norms": [ + 7120.71240234375, + 4194965.0, + 4982087.0, + 5430094.5, + 9121286.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015255591133609414, + 0.0007772985845804214, + 0.0007780406740494072, + 0.0007778139552101493, + 0.000777201319579035 + ], + "gamma_dfa": 0.0210345396772027, + "gamma_dfa_per_layer": [ + 0.3191820979118347, + -0.05588069185614586, + -0.0712573379278183, + -0.10790590941905975 + ], + "acc_eval": 0.22265625, + "loss_eval": 8870.3212890625, + "epoch": 61 + }, + { + "hidden_norms": [ + 7166.24462890625, + 4326872.0, + 5144769.0, + 5605003.0, + 9390572.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019027154194191098, + 0.000822498113848269, + 0.0008225358324125409, + 0.0008226112113334239, + 0.0008225055644288659 + ], + "gamma_dfa": 0.01758619397878647, + "gamma_dfa_per_layer": [ + 0.29208946228027344, + -0.046764522790908813, + -0.10779638588428497, + -0.06718377768993378 + ], + "acc_eval": 0.154296875, + "loss_eval": 18607.9921875, + "epoch": 62 + }, + { + "hidden_norms": [ + 7173.86865234375, + 4454190.5, + 5300661.5, + 5764316.0, + 9633685.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017527258023619652, + 0.0008042250410653651, + 0.0008040837710723281, + 0.0008041510009206831, + 0.0008041784167289734 + ], + "gamma_dfa": 0.04197401413694024, + "gamma_dfa_per_layer": [ + 0.31714165210723877, + -0.025468191131949425, + -0.05378583073616028, + -0.0699915736913681 + ], + "acc_eval": 0.1826171875, + "loss_eval": 10768.23046875, + "epoch": 63 + }, + { + "hidden_norms": [ + 7200.1064453125, + 4569527.5, + 5448454.0, + 5924151.0, + 9865530.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016467028763145208, + 0.0007759482250548899, + 0.0007759520667605102, + 0.0007758319843560457, + 0.0007757880375720561 + ], + "gamma_dfa": 0.019114631228148937, + "gamma_dfa_per_layer": [ + 0.3342781364917755, + -0.05670151486992836, + -0.0891423374414444, + -0.111975759267807 + ], + "acc_eval": 0.1865234375, + "loss_eval": 9049.12109375, + "epoch": 64 + }, + { + "hidden_norms": [ + 7198.30419921875, + 4679779.5, + 5583911.5, + 6073903.5, + 10075961.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015529918018728495, + 0.0008276477456092834, + 0.0008274043793790042, + 0.0008273764979094267, + 0.00082727539120242 + ], + "gamma_dfa": 0.012379471212625504, + "gamma_dfa_per_layer": [ + 0.33610183000564575, + -0.0668979212641716, + -0.09369023889303207, + -0.12599578499794006 + ], + "acc_eval": 0.1533203125, + "loss_eval": 9929.3125, + "epoch": 65 + }, + { + "hidden_norms": [ + 7191.220703125, + 4787683.5, + 5730170.5, + 6223255.0, + 10287596.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002624395303428173, + 0.0008026033756323159, + 0.0008024688577279449, + 0.0008025110582821071, + 0.000802531314548105 + ], + "gamma_dfa": 0.041071049869060516, + "gamma_dfa_per_layer": [ + 0.3911614418029785, + -0.03441564738750458, + -0.07384517788887024, + -0.11861641705036163 + ], + "acc_eval": 0.1669921875, + "loss_eval": 9811.68359375, + "epoch": 66 + }, + { + "hidden_norms": [ + 7184.458984375, + 4895536.0, + 5864442.5, + 6369317.5, + 10509902.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016685851151123643, + 0.0007737133419141173, + 0.0007737109554000199, + 0.0007736092084087431, + 0.0007735762046650052 + ], + "gamma_dfa": 0.03856207150965929, + "gamma_dfa_per_layer": [ + 0.3347627520561218, + -0.05478603392839432, + -0.09395486861467361, + -0.03177356347441673 + ], + "acc_eval": 0.15625, + "loss_eval": 7798.90283203125, + "epoch": 67 + }, + { + "hidden_norms": [ + 7166.86083984375, + 4995598.0, + 5984263.5, + 6498221.0, + 10708319.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013723000884056091, + 0.0008002148242667317, + 0.0007998319924809039, + 0.0007997409556992352, + 0.0008000954985618591 + ], + "gamma_dfa": 0.024815326556563377, + "gamma_dfa_per_layer": [ + 0.3238403797149658, + -0.05496574938297272, + -0.0969959944486618, + -0.07261732965707779 + ], + "acc_eval": 0.1552734375, + "loss_eval": 6333.236328125, + "epoch": 68 + }, + { + "hidden_norms": [ + 7156.17236328125, + 5093715.5, + 6108802.5, + 6629623.5, + 10896864.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001458030310459435, + 0.0007727351039648056, + 0.0007727306219749153, + 0.0007726310286670923, + 0.0007726071053184569 + ], + "gamma_dfa": 0.018785862252116203, + "gamma_dfa_per_layer": [ + 0.31862637400627136, + -0.06633786112070084, + -0.07025538384914398, + -0.10688968002796173 + ], + "acc_eval": 0.2060546875, + "loss_eval": 5966.35400390625, + "epoch": 69 + }, + { + "hidden_norms": [ + 7127.96875, + 5203388.5, + 6229672.5, + 6756540.5, + 11105730.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018821367993950844, + 0.000799131637904793, + 0.0007999413646757603, + 0.0007995158084668219, + 0.0007994744228199124 + ], + "gamma_dfa": 0.033654400147497654, + "gamma_dfa_per_layer": [ + 0.3480244278907776, + -0.0470522977411747, + -0.08066973835229874, + -0.08568479120731354 + ], + "acc_eval": 0.21484375, + "loss_eval": 8679.373046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 7127.84326171875, + 5291613.5, + 6343081.5, + 6873492.5, + 11283083.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013305873144418001, + 0.0008001387468539178, + 0.0007999925292097032, + 0.0008000367670319974, + 0.0008000454981811345 + ], + "gamma_dfa": 0.026681816205382347, + "gamma_dfa_per_layer": [ + 0.33079925179481506, + -0.04635504633188248, + -0.060725681483745575, + -0.11699125915765762 + ], + "acc_eval": 0.2001953125, + "loss_eval": 7321.45654296875, + "epoch": 71 + }, + { + "hidden_norms": [ + 7118.43115234375, + 5399320.5, + 6461637.5, + 6995765.0, + 11479911.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0027539313305169344, + 0.0007441912894137204, + 0.000744749209843576, + 0.0007447105017490685, + 0.0007443142239935696 + ], + "gamma_dfa": 0.0691906102001667, + "gamma_dfa_per_layer": [ + 0.4505346715450287, + -0.03461931645870209, + -0.07136575877666473, + -0.06778715550899506 + ], + "acc_eval": 0.16015625, + "loss_eval": 10899.68359375, + "epoch": 72 + }, + { + "hidden_norms": [ + 7104.958984375, + 5484605.5, + 6570873.0, + 7105816.5, + 11646348.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011745812371373177, + 0.000797195709310472, + 0.0007963370881043375, + 0.0007962601375766098, + 0.0007965530967339873 + ], + "gamma_dfa": 0.016523053869605064, + "gamma_dfa_per_layer": [ + 0.3157949447631836, + -0.05805324763059616, + -0.0915503203868866, + -0.10009916126728058 + ], + "acc_eval": 0.185546875, + "loss_eval": 4549.11328125, + "epoch": 73 + }, + { + "hidden_norms": [ + 7046.66552734375, + 5575192.0, + 6682143.0, + 7216392.5, + 11814821.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014973932411521673, + 0.0007987518329173326, + 0.000798598921392113, + 0.0007986334967426956, + 0.00079863186692819 + ], + "gamma_dfa": 0.006323261186480522, + "gamma_dfa_per_layer": [ + 0.3186365067958832, + -0.07689585536718369, + -0.08955803513526917, + -0.12688957154750824 + ], + "acc_eval": 0.1845703125, + "loss_eval": 5873.4677734375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6997.1630859375, + 5656117.0, + 6779526.0, + 7314913.5, + 11969090.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014266286743804812, + 0.0007692458457313478, + 0.0007703236187808216, + 0.0007699450361542404, + 0.0007692069630138576 + ], + "gamma_dfa": 0.04031236469745636, + "gamma_dfa_per_layer": [ + 0.3853839635848999, + -0.054634347558021545, + -0.08128909766674042, + -0.0882110595703125 + ], + "acc_eval": 0.1953125, + "loss_eval": 4200.4296875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6970.02099609375, + 5731178.0, + 6870747.5, + 7405309.0, + 12120166.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013568063732236624, + 0.0007682641153223813, + 0.000768258236348629, + 0.0007681549177505076, + 0.0007681125425733626 + ], + "gamma_dfa": 0.04615131672471762, + "gamma_dfa_per_layer": [ + 0.3717971444129944, + -0.05474664270877838, + -0.05301285162568092, + -0.07943238317966461 + ], + "acc_eval": 0.1943359375, + "loss_eval": 3897.47607421875, + "epoch": 76 + }, + { + "hidden_norms": [ + 6942.25, + 5793439.5, + 6946580.5, + 7481325.5, + 12242140.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011983924778178334, + 0.0007509839488193393, + 0.0007508245762437582, + 0.0007505225948989391, + 0.0007505776011385024 + ], + "gamma_dfa": 0.03128352388739586, + "gamma_dfa_per_layer": [ + 0.31842517852783203, + -0.03316807746887207, + -0.06335921585559845, + -0.09676378965377808 + ], + "acc_eval": 0.2685546875, + "loss_eval": 3095.559814453125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6881.80810546875, + 5850806.5, + 7011394.5, + 7546550.5, + 12350002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011590005597099662, + 0.0007501945947296917, + 0.0007500603678636253, + 0.0007497719489037991, + 0.0007498189806938171 + ], + "gamma_dfa": 0.01806825865060091, + "gamma_dfa_per_layer": [ + 0.313739538192749, + -0.047393035143613815, + -0.07615944743156433, + -0.11791402101516724 + ], + "acc_eval": 0.205078125, + "loss_eval": 3942.599853515625, + "epoch": 78 + }, + { + "hidden_norms": [ + 6837.1533203125, + 5897771.5, + 7073526.0, + 7607611.5, + 12444407.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001163899782113731, + 0.0007416060543619096, + 0.0007419964531436563, + 0.0007419841131195426, + 0.0007417319575324655 + ], + "gamma_dfa": 0.03044590726494789, + "gamma_dfa_per_layer": [ + 0.30829477310180664, + -0.03881052881479263, + -0.07340054214000702, + -0.07430007308721542 + ], + "acc_eval": 0.2939453125, + "loss_eval": 2950.356689453125, + "epoch": 79 + }, + { + "hidden_norms": [ + 6806.5322265625, + 5963679.5, + 7147126.0, + 7679290.5, + 12557362.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012401024578139186, + 0.0007945983088575304, + 0.0007953918538987637, + 0.0007950742146931589, + 0.0007950655417516828 + ], + "gamma_dfa": -0.007623729296028614, + "gamma_dfa_per_layer": [ + 0.24250081181526184, + -0.04293825104832649, + -0.07043637335300446, + -0.15962110459804535 + ], + "acc_eval": 0.14453125, + "loss_eval": 3910.8994140625, + "epoch": 80 + }, + { + "hidden_norms": [ + 6782.47607421875, + 5997089.0, + 7185317.5, + 7719894.5, + 12633342.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012797614326700568, + 0.0007944905664771795, + 0.0007951240986585617, + 0.0007947491831146181, + 0.0007947032572701573 + ], + "gamma_dfa": 0.03983990382403135, + "gamma_dfa_per_layer": [ + 0.35600101947784424, + -0.023466136306524277, + -0.07362768054008484, + -0.09954758733510971 + ], + "acc_eval": 0.193359375, + "loss_eval": 3587.8212890625, + "epoch": 81 + }, + { + "hidden_norms": [ + 6723.70654296875, + 6042461.0, + 7238613.0, + 7771656.5, + 12718382.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012927292846143246, + 0.000765398726798594, + 0.0007653928478248417, + 0.0007653140346519649, + 0.0007652752683497965 + ], + "gamma_dfa": 0.03482971154153347, + "gamma_dfa_per_layer": [ + 0.34003761410713196, + -0.05069781839847565, + -0.05738937109708786, + -0.09263157844543457 + ], + "acc_eval": 0.23046875, + "loss_eval": 2805.9716796875, + "epoch": 82 + }, + { + "hidden_norms": [ + 6669.96435546875, + 6085424.0, + 7288909.5, + 7821635.0, + 12799732.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011438996298238635, + 0.000740286021027714, + 0.0007406995864585042, + 0.0007406825898215175, + 0.0007403898634947836 + ], + "gamma_dfa": 0.03725961223244667, + "gamma_dfa_per_layer": [ + 0.32540398836135864, + -0.04895278066396713, + -0.07243393361568451, + -0.05497882515192032 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2089.305908203125, + "epoch": 83 + }, + { + "hidden_norms": [ + 6611.064453125, + 6121666.0, + 7328789.5, + 7859580.5, + 12864450.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010610584868118167, + 0.0007183317793533206, + 0.0007201047264970839, + 0.0007199530373327434, + 0.0007199217798188329 + ], + "gamma_dfa": 0.03143393341451883, + "gamma_dfa_per_layer": [ + 0.2940787076950073, + -0.035069357603788376, + -0.0604243278503418, + -0.07284928858280182 + ], + "acc_eval": 0.3076171875, + "loss_eval": 1459.638916015625, + "epoch": 84 + }, + { + "hidden_norms": [ + 6564.220703125, + 6147971.0, + 7358806.5, + 7888597.5, + 12918884.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001103258109651506, + 0.0007199789397418499, + 0.0007205012370832264, + 0.0007201395928859711, + 0.000719686911907047 + ], + "gamma_dfa": 0.02568601444363594, + "gamma_dfa_per_layer": [ + 0.3047623038291931, + -0.05378233641386032, + -0.07432089745998383, + -0.0739150121808052 + ], + "acc_eval": 0.2607421875, + "loss_eval": 1398.54931640625, + "epoch": 85 + }, + { + "hidden_norms": [ + 6523.052734375, + 6163991.5, + 7377848.0, + 7906464.0, + 12959929.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010483200894668698, + 0.0007394760614261031, + 0.0007398684392683208, + 0.0007398549350909889, + 0.0007395940483547747 + ], + "gamma_dfa": 0.028113607317209244, + "gamma_dfa_per_layer": [ + 0.2919086515903473, + -0.04769399017095566, + -0.06982402503490448, + -0.06193620711565018 + ], + "acc_eval": 0.294921875, + "loss_eval": 1247.0958251953125, + "epoch": 86 + }, + { + "hidden_norms": [ + 6480.38134765625, + 6177022.5, + 7396143.5, + 7924145.0, + 12992374.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011187344789505005, + 0.0007568535511381924, + 0.0007568564033135772, + 0.0007567762513644993, + 0.0007568445871584117 + ], + "gamma_dfa": 0.029856184497475624, + "gamma_dfa_per_layer": [ + 0.32282522320747375, + -0.05086465924978256, + -0.06785817444324493, + -0.08467765152454376 + ], + "acc_eval": 0.267578125, + "loss_eval": 1623.752197265625, + "epoch": 87 + }, + { + "hidden_norms": [ + 6430.5322265625, + 6198352.0, + 7419959.0, + 7946585.0, + 13023161.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010678176768124104, + 0.0007456489838659763, + 0.0007455460145138204, + 0.0007452794816344976, + 0.000745359982829541 + ], + "gamma_dfa": 0.019207272678613663, + "gamma_dfa_per_layer": [ + 0.28421786427497864, + -0.04965135455131531, + -0.07151313126087189, + -0.08622428774833679 + ], + "acc_eval": 0.291015625, + "loss_eval": 1205.84716796875, + "epoch": 88 + }, + { + "hidden_norms": [ + 6396.35009765625, + 6216262.0, + 7436144.0, + 7961794.0, + 13045224.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010295198298990726, + 0.0007388790836557746, + 0.0007392680854536593, + 0.000739254173822701, + 0.000738998525775969 + ], + "gamma_dfa": 0.02955447882413864, + "gamma_dfa_per_layer": [ + 0.2954120337963104, + -0.046598292887210846, + -0.069032222032547, + -0.061563603579998016 + ], + "acc_eval": 0.298828125, + "loss_eval": 1123.675048828125, + "epoch": 89 + }, + { + "hidden_norms": [ + 6366.1259765625, + 6230148.5, + 7451647.0, + 7975150.0, + 13064555.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010110137518495321, + 0.0007565211853943765, + 0.0007565242704004049, + 0.0007563806138932705, + 0.0007564250845462084 + ], + "gamma_dfa": 0.011881772428750992, + "gamma_dfa_per_layer": [ + 0.2693521976470947, + -0.04482053220272064, + -0.07126723229885101, + -0.1057373434305191 + ], + "acc_eval": 0.240234375, + "loss_eval": 1118.5343017578125, + "epoch": 90 + }, + { + "hidden_norms": [ + 6341.41796875, + 6233793.0, + 7457683.5, + 7981064.5, + 13074395.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010112811578437686, + 0.0007385196513496339, + 0.0007389356032945216, + 0.000738917791750282, + 0.0007386352517642081 + ], + "gamma_dfa": 0.0292903920635581, + "gamma_dfa_per_layer": [ + 0.28946253657341003, + -0.033900823444128036, + -0.06436440348625183, + -0.07403574138879776 + ], + "acc_eval": 0.306640625, + "loss_eval": 1028.103515625, + "epoch": 91 + }, + { + "hidden_norms": [ + 6319.90185546875, + 6241203.5, + 7463285.5, + 7986068.5, + 13084655.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010045261587947607, + 0.0007187838782556355, + 0.0007187584415078163, + 0.0007185733411461115, + 0.0007185345166362822 + ], + "gamma_dfa": 0.02470484748482704, + "gamma_dfa_per_layer": [ + 0.2734910249710083, + -0.0429413765668869, + -0.06623440980911255, + -0.06549584865570068 + ], + "acc_eval": 0.3271484375, + "loss_eval": 879.8018798828125, + "epoch": 92 + }, + { + "hidden_norms": [ + 6299.453125, + 6240490.0, + 7464953.0, + 7988364.0, + 13086769.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010041827335953712, + 0.0007186768343672156, + 0.0007186515722423792, + 0.0007184677524492145, + 0.0007184296264313161 + ], + "gamma_dfa": 0.022233721800148487, + "gamma_dfa_per_layer": [ + 0.2633175849914551, + -0.04053181782364845, + -0.06492872536182404, + -0.06892215460538864 + ], + "acc_eval": 0.322265625, + "loss_eval": 871.9059448242188, + "epoch": 93 + }, + { + "hidden_norms": [ + 6280.70068359375, + 6248322.5, + 7472246.5, + 7994814.0, + 13094255.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000998231815174222, + 0.0007185792201198637, + 0.0007185565191321075, + 0.0007183970883488655, + 0.0007183645502664149 + ], + "gamma_dfa": 0.02329079993069172, + "gamma_dfa_per_layer": [ + 0.27325427532196045, + -0.04209248721599579, + -0.0645713210105896, + -0.07342726737260818 + ], + "acc_eval": 0.326171875, + "loss_eval": 876.770263671875, + "epoch": 94 + }, + { + "hidden_norms": [ + 6259.79541015625, + 6251884.0, + 7473855.0, + 7995730.5, + 13095582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001000022399239242, + 0.0007185632712207735, + 0.0007185383583419025, + 0.0007183536072261631, + 0.0007183143752627075 + ], + "gamma_dfa": 0.01565107237547636, + "gamma_dfa_per_layer": [ + 0.26019614934921265, + -0.042762644588947296, + -0.06100854650139809, + -0.09382066875696182 + ], + "acc_eval": 0.31640625, + "loss_eval": 847.3887939453125, + "epoch": 95 + }, + { + "hidden_norms": [ + 6250.6630859375, + 6252472.0, + 7474356.5, + 7996154.0, + 13096382.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009951539104804397, + 0.000718452560249716, + 0.0007184353889897466, + 0.0007182956906035542, + 0.0007182672270573676 + ], + "gamma_dfa": 0.01607441157102585, + "gamma_dfa_per_layer": [ + 0.2622864246368408, + -0.04606177657842636, + -0.06511188298463821, + -0.08681511878967285 + ], + "acc_eval": 0.3125, + "loss_eval": 820.6640625, + "epoch": 96 + }, + { + "hidden_norms": [ + 6245.84228515625, + 6252136.5, + 7473891.5, + 7995642.0, + 13095543.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009887836640700698, + 0.0007184472633525729, + 0.0007184235146269202, + 0.0007182589615695179, + 0.0007182253757491708 + ], + "gamma_dfa": 0.01632563304156065, + "gamma_dfa_per_layer": [ + 0.2587689757347107, + -0.041752640157938004, + -0.06282168626785278, + -0.08889211714267731 + ], + "acc_eval": 0.3271484375, + "loss_eval": 794.9835815429688, + "epoch": 97 + }, + { + "hidden_norms": [ + 6243.275390625, + 6252353.5, + 7474147.5, + 7995911.0, + 13095907.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010000880574807525, + 0.0007184495334513485, + 0.0007184281130321324, + 0.0007182535482570529, + 0.0007182166446000338 + ], + "gamma_dfa": 0.01966456975787878, + "gamma_dfa_per_layer": [ + 0.26670968532562256, + -0.04189712926745415, + -0.06575733423233032, + -0.08039694279432297 + ], + "acc_eval": 0.3173828125, + "loss_eval": 809.9351196289062, + "epoch": 98 + }, + { + "hidden_norms": [ + 6242.01708984375, + 6252447.5, + 7474218.0, + 7995986.5, + 13096086.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009963318007066846, + 0.000718410883564502, + 0.000718392024282366, + 0.0007182427798397839, + 0.0007182121044024825 + ], + "gamma_dfa": 0.017472295090556145, + "gamma_dfa_per_layer": [ + 0.26097655296325684, + -0.042458876967430115, + -0.06487732380628586, + -0.08375117182731628 + ], + "acc_eval": 0.326171875, + "loss_eval": 790.8746337890625, + "epoch": 99 + }, + { + "hidden_norms": [ + 6241.6884765625, + 6252462.0, + 7474227.5, + 7995996.0, + 13096118.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009859646670520306, + 0.0007156162173487246, + 0.0007178352097980678, + 0.0007174411439336836, + 0.0007168283336795866 + ], + "gamma_dfa": 0.01725842524319887, + "gamma_dfa_per_layer": [ + 0.25597745180130005, + -0.041728582233190536, + -0.06328003108501434, + -0.08193513751029968 + ], + "acc_eval": 0.3359375, + "loss_eval": 790.8336181640625, + "epoch": 100 + } + ] +} \ No newline at end of file -- cgit v1.2.3