diff options
Diffstat (limited to 'results/snapshot_no_outln_v1/run_s456.log')
| -rw-r--r-- | results/snapshot_no_outln_v1/run_s456.log | 51 |
1 files changed, 51 insertions, 0 deletions
diff --git a/results/snapshot_no_outln_v1/run_s456.log b/results/snapshot_no_outln_v1/run_s456.log new file mode 100644 index 0000000..a0a3bd0 --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s456.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=456 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [BP-noLN] Ep 1: ||h_L||=3.410e+01 ||g||=1.500e-04 acc=0.4365 + [BP-noLN] Ep 5: ||h_L||=5.250e+01 ||g||=1.052e-04 acc=0.4961 + [BP-noLN] Ep 10: ||h_L||=6.330e+01 ||g||=8.751e-05 acc=0.5596 + [BP-noLN] Ep 15: ||h_L||=6.619e+01 ||g||=8.857e-05 acc=0.5215 + [BP-noLN] Ep 20: ||h_L||=7.009e+01 ||g||=8.610e-05 acc=0.5420 + [BP-noLN] Ep 25: ||h_L||=7.285e+01 ||g||=8.470e-05 acc=0.5723 + [BP-noLN] Ep 30: ||h_L||=7.493e+01 ||g||=8.152e-05 acc=0.5938 + [BP-noLN] Ep 35: ||h_L||=7.640e+01 ||g||=7.781e-05 acc=0.6074 + [BP-noLN] Ep 40: ||h_L||=7.799e+01 ||g||=8.443e-05 acc=0.5938 + [BP-noLN] Ep 45: ||h_L||=7.734e+01 ||g||=7.914e-05 acc=0.6143 + [BP-noLN] Ep 50: ||h_L||=7.667e+01 ||g||=8.950e-05 acc=0.5996 + [BP-noLN] Ep 55: ||h_L||=7.591e+01 ||g||=9.021e-05 acc=0.6201 + [BP-noLN] Ep 60: ||h_L||=7.667e+01 ||g||=8.730e-05 acc=0.6338 + [BP-noLN] Ep 65: ||h_L||=7.629e+01 ||g||=9.670e-05 acc=0.6230 + [BP-noLN] Ep 70: ||h_L||=7.612e+01 ||g||=9.637e-05 acc=0.6260 + [BP-noLN] Ep 75: ||h_L||=7.544e+01 ||g||=9.639e-05 acc=0.6338 + [BP-noLN] Ep 80: ||h_L||=7.434e+01 ||g||=9.999e-05 acc=0.6455 + [BP-noLN] Ep 85: ||h_L||=7.429e+01 ||g||=1.013e-04 acc=0.6348 + [BP-noLN] Ep 90: ||h_L||=7.381e+01 ||g||=1.076e-04 acc=0.6348 + [BP-noLN] Ep 95: ||h_L||=7.380e+01 ||g||=1.084e-04 acc=0.6436 + [BP-noLN] Ep 100: ||h_L||=7.373e+01 ||g||=1.088e-04 acc=0.6465 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [DFA-noLN] Ep 1: ||h_L||=1.507e+03 ||g||=6.424e-04 acc=0.2246 γ=0.0136 + [DFA-noLN] Ep 5: ||h_L||=1.140e+04 ||g||=7.475e-04 acc=0.2314 γ=-0.0000 + [DFA-noLN] Ep 10: ||h_L||=2.845e+04 ||g||=7.444e-04 acc=0.1895 γ=-0.0067 + [DFA-noLN] Ep 15: ||h_L||=8.676e+04 ||g||=7.381e-04 acc=0.2549 γ=0.0039 + [DFA-noLN] Ep 20: ||h_L||=2.707e+05 ||g||=7.761e-04 acc=0.1670 γ=0.0171 + [DFA-noLN] Ep 25: ||h_L||=6.628e+05 ||g||=7.894e-04 acc=0.1992 γ=0.0390 + [DFA-noLN] Ep 30: ||h_L||=1.245e+06 ||g||=7.944e-04 acc=0.1963 γ=0.0162 + [DFA-noLN] Ep 35: ||h_L||=2.131e+06 ||g||=8.014e-04 acc=0.1904 γ=0.0128 + [DFA-noLN] Ep 40: ||h_L||=3.242e+06 ||g||=7.965e-04 acc=0.1855 γ=0.0227 + [DFA-noLN] Ep 45: ||h_L||=4.568e+06 ||g||=8.172e-04 acc=0.1807 γ=0.0340 + [DFA-noLN] Ep 50: ||h_L||=6.031e+06 ||g||=8.070e-04 acc=0.1133 γ=0.0064 + [DFA-noLN] Ep 55: ||h_L||=7.447e+06 ||g||=7.821e-04 acc=0.1924 γ=0.0273 + [DFA-noLN] Ep 60: ||h_L||=8.862e+06 ||g||=8.033e-04 acc=0.1650 γ=0.0210 + [DFA-noLN] Ep 65: ||h_L||=1.008e+07 ||g||=8.274e-04 acc=0.1533 γ=0.0124 + [DFA-noLN] Ep 70: ||h_L||=1.111e+07 ||g||=7.999e-04 acc=0.2148 γ=0.0337 + [DFA-noLN] Ep 75: ||h_L||=1.197e+07 ||g||=7.703e-04 acc=0.1953 γ=0.0403 + [DFA-noLN] Ep 80: ||h_L||=1.256e+07 ||g||=7.954e-04 acc=0.1445 γ=-0.0076 + [DFA-noLN] Ep 85: ||h_L||=1.292e+07 ||g||=7.205e-04 acc=0.2607 γ=0.0257 + [DFA-noLN] Ep 90: ||h_L||=1.306e+07 ||g||=7.565e-04 acc=0.2402 γ=0.0119 + [DFA-noLN] Ep 95: ||h_L||=1.310e+07 ||g||=7.185e-04 acc=0.3164 γ=0.0157 + [DFA-noLN] Ep 100: ||h_L||=1.310e+07 ||g||=7.178e-04 acc=0.3359 γ=0.0173 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s456.json |
