blob: a0a3bd0840697ad8329518da66743dd46f255097 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
|
NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=456
=== BP training (NO out_ln) ===
[BP-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918
[BP-noLN] Ep 1: ||h_L||=3.410e+01 ||g||=1.500e-04 acc=0.4365
[BP-noLN] Ep 5: ||h_L||=5.250e+01 ||g||=1.052e-04 acc=0.4961
[BP-noLN] Ep 10: ||h_L||=6.330e+01 ||g||=8.751e-05 acc=0.5596
[BP-noLN] Ep 15: ||h_L||=6.619e+01 ||g||=8.857e-05 acc=0.5215
[BP-noLN] Ep 20: ||h_L||=7.009e+01 ||g||=8.610e-05 acc=0.5420
[BP-noLN] Ep 25: ||h_L||=7.285e+01 ||g||=8.470e-05 acc=0.5723
[BP-noLN] Ep 30: ||h_L||=7.493e+01 ||g||=8.152e-05 acc=0.5938
[BP-noLN] Ep 35: ||h_L||=7.640e+01 ||g||=7.781e-05 acc=0.6074
[BP-noLN] Ep 40: ||h_L||=7.799e+01 ||g||=8.443e-05 acc=0.5938
[BP-noLN] Ep 45: ||h_L||=7.734e+01 ||g||=7.914e-05 acc=0.6143
[BP-noLN] Ep 50: ||h_L||=7.667e+01 ||g||=8.950e-05 acc=0.5996
[BP-noLN] Ep 55: ||h_L||=7.591e+01 ||g||=9.021e-05 acc=0.6201
[BP-noLN] Ep 60: ||h_L||=7.667e+01 ||g||=8.730e-05 acc=0.6338
[BP-noLN] Ep 65: ||h_L||=7.629e+01 ||g||=9.670e-05 acc=0.6230
[BP-noLN] Ep 70: ||h_L||=7.612e+01 ||g||=9.637e-05 acc=0.6260
[BP-noLN] Ep 75: ||h_L||=7.544e+01 ||g||=9.639e-05 acc=0.6338
[BP-noLN] Ep 80: ||h_L||=7.434e+01 ||g||=9.999e-05 acc=0.6455
[BP-noLN] Ep 85: ||h_L||=7.429e+01 ||g||=1.013e-04 acc=0.6348
[BP-noLN] Ep 90: ||h_L||=7.381e+01 ||g||=1.076e-04 acc=0.6348
[BP-noLN] Ep 95: ||h_L||=7.380e+01 ||g||=1.084e-04 acc=0.6436
[BP-noLN] Ep 100: ||h_L||=7.373e+01 ||g||=1.088e-04 acc=0.6465
=== DFA training (NO out_ln) ===
[DFA-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918
[DFA-noLN] Ep 1: ||h_L||=1.507e+03 ||g||=6.424e-04 acc=0.2246 γ=0.0136
[DFA-noLN] Ep 5: ||h_L||=1.140e+04 ||g||=7.475e-04 acc=0.2314 γ=-0.0000
[DFA-noLN] Ep 10: ||h_L||=2.845e+04 ||g||=7.444e-04 acc=0.1895 γ=-0.0067
[DFA-noLN] Ep 15: ||h_L||=8.676e+04 ||g||=7.381e-04 acc=0.2549 γ=0.0039
[DFA-noLN] Ep 20: ||h_L||=2.707e+05 ||g||=7.761e-04 acc=0.1670 γ=0.0171
[DFA-noLN] Ep 25: ||h_L||=6.628e+05 ||g||=7.894e-04 acc=0.1992 γ=0.0390
[DFA-noLN] Ep 30: ||h_L||=1.245e+06 ||g||=7.944e-04 acc=0.1963 γ=0.0162
[DFA-noLN] Ep 35: ||h_L||=2.131e+06 ||g||=8.014e-04 acc=0.1904 γ=0.0128
[DFA-noLN] Ep 40: ||h_L||=3.242e+06 ||g||=7.965e-04 acc=0.1855 γ=0.0227
[DFA-noLN] Ep 45: ||h_L||=4.568e+06 ||g||=8.172e-04 acc=0.1807 γ=0.0340
[DFA-noLN] Ep 50: ||h_L||=6.031e+06 ||g||=8.070e-04 acc=0.1133 γ=0.0064
[DFA-noLN] Ep 55: ||h_L||=7.447e+06 ||g||=7.821e-04 acc=0.1924 γ=0.0273
[DFA-noLN] Ep 60: ||h_L||=8.862e+06 ||g||=8.033e-04 acc=0.1650 γ=0.0210
[DFA-noLN] Ep 65: ||h_L||=1.008e+07 ||g||=8.274e-04 acc=0.1533 γ=0.0124
[DFA-noLN] Ep 70: ||h_L||=1.111e+07 ||g||=7.999e-04 acc=0.2148 γ=0.0337
[DFA-noLN] Ep 75: ||h_L||=1.197e+07 ||g||=7.703e-04 acc=0.1953 γ=0.0403
[DFA-noLN] Ep 80: ||h_L||=1.256e+07 ||g||=7.954e-04 acc=0.1445 γ=-0.0076
[DFA-noLN] Ep 85: ||h_L||=1.292e+07 ||g||=7.205e-04 acc=0.2607 γ=0.0257
[DFA-noLN] Ep 90: ||h_L||=1.306e+07 ||g||=7.565e-04 acc=0.2402 γ=0.0119
[DFA-noLN] Ep 95: ||h_L||=1.310e+07 ||g||=7.185e-04 acc=0.3164 γ=0.0157
[DFA-noLN] Ep 100: ||h_L||=1.310e+07 ||g||=7.178e-04 acc=0.3359 γ=0.0173
Saved results/snapshot_no_outln_v1/snapshot_noLN_s456.json
|