1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
|
device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=456
eval buffer: torch.Size([1024, 3072])
=== DFA training ===
[DFA] Ep 0: ||h||_med=[8.696551322937012, 42.47159957885742, 42.67432403564453, 45.272701263427734, 43.449092864990234] ||g||_med=[0.0011182057205587626, 0.00021166827355045825, 0.00014748115791007876, 0.00011803740198956802, 0.00010102539090439677] acc=0.1143
[DFA] Ep 1: ||h_L||=9.975e+03 ||g_2||=4.843e-07 acc=0.1113 gamma_dfa=0.0185
[DFA] Ep 2: ||h_L||=4.258e+04 ||g_2||=8.536e-08 acc=0.1006 gamma_dfa=0.0173
[DFA] Ep 3: ||h_L||=9.508e+04 ||g_2||=3.481e-08 acc=0.0801 gamma_dfa=0.0150
[DFA] Ep 4: ||h_L||=1.685e+05 ||g_2||=1.968e-08 acc=0.0654 gamma_dfa=0.0208
[DFA] Ep 5: ||h_L||=2.704e+05 ||g_2||=1.294e-08 acc=0.0732 gamma_dfa=0.0239
[DFA] Ep 6: ||h_L||=4.002e+05 ||g_2||=9.634e-09 acc=0.1064 gamma_dfa=0.0241
[DFA] Ep 7: ||h_L||=5.563e+05 ||g_2||=7.954e-09 acc=0.1123 gamma_dfa=0.0292
[DFA] Ep 8: ||h_L||=7.605e+05 ||g_2||=6.522e-09 acc=0.1152 gamma_dfa=0.0312
[DFA] Ep 9: ||h_L||=1.011e+06 ||g_2||=5.556e-09 acc=0.1162 gamma_dfa=0.0348
[DFA] Ep 10: ||h_L||=1.307e+06 ||g_2||=4.731e-09 acc=0.1152 gamma_dfa=0.0403
[DFA] Ep 11: ||h_L||=1.643e+06 ||g_2||=4.127e-09 acc=0.1162 gamma_dfa=0.0408
[DFA] Ep 12: ||h_L||=2.047e+06 ||g_2||=3.521e-09 acc=0.1123 gamma_dfa=0.0411
[DFA] Ep 13: ||h_L||=2.529e+06 ||g_2||=3.068e-09 acc=0.1143 gamma_dfa=0.0436
[DFA] Ep 14: ||h_L||=3.069e+06 ||g_2||=2.661e-09 acc=0.1152 gamma_dfa=0.0434
[DFA] Ep 15: ||h_L||=3.672e+06 ||g_2||=2.340e-09 acc=0.1123 gamma_dfa=0.0459
[DFA] Ep 16: ||h_L||=4.363e+06 ||g_2||=2.085e-09 acc=0.1104 gamma_dfa=0.0443
[DFA] Ep 17: ||h_L||=5.116e+06 ||g_2||=1.862e-09 acc=0.1035 gamma_dfa=0.0453
[DFA] Ep 18: ||h_L||=5.947e+06 ||g_2||=1.664e-09 acc=0.0859 gamma_dfa=0.0454
[DFA] Ep 19: ||h_L||=6.799e+06 ||g_2||=1.496e-09 acc=0.0762 gamma_dfa=0.0448
[DFA] Ep 20: ||h_L||=7.803e+06 ||g_2||=1.355e-09 acc=0.0801 gamma_dfa=0.0458
[DFA] Ep 21: ||h_L||=8.837e+06 ||g_2||=1.236e-09 acc=0.0928 gamma_dfa=0.0458
[DFA] Ep 22: ||h_L||=9.928e+06 ||g_2||=1.132e-09 acc=0.1045 gamma_dfa=0.0462
[DFA] Ep 23: ||h_L||=1.110e+07 ||g_2||=1.038e-09 acc=0.1055 gamma_dfa=0.0465
[DFA] Ep 24: ||h_L||=1.236e+07 ||g_2||=9.618e-10 acc=0.1055 gamma_dfa=0.0462
[DFA] Ep 25: ||h_L||=1.366e+07 ||g_2||=8.898e-10 acc=0.1055 gamma_dfa=0.0468
[DFA] Ep 26: ||h_L||=1.500e+07 ||g_2||=8.268e-10 acc=0.1055 gamma_dfa=0.0475
[DFA] Ep 27: ||h_L||=1.650e+07 ||g_2||=7.703e-10 acc=0.1064 gamma_dfa=0.0474
[DFA] Ep 28: ||h_L||=1.811e+07 ||g_2||=7.228e-10 acc=0.1055 gamma_dfa=0.0473
[DFA] Ep 29: ||h_L||=1.965e+07 ||g_2||=6.773e-10 acc=0.1055 gamma_dfa=0.0472
[DFA] Ep 30: ||h_L||=2.139e+07 ||g_2||=6.385e-10 acc=0.1055 gamma_dfa=0.0478
[DFA] Ep 31: ||h_L||=2.306e+07 ||g_2||=6.001e-10 acc=0.1055 gamma_dfa=0.0481
[DFA] Ep 32: ||h_L||=2.490e+07 ||g_2||=5.676e-10 acc=0.1064 gamma_dfa=0.0476
[DFA] Ep 33: ||h_L||=2.693e+07 ||g_2||=5.345e-10 acc=0.1055 gamma_dfa=0.0476
[DFA] Ep 34: ||h_L||=2.880e+07 ||g_2||=5.057e-10 acc=0.1055 gamma_dfa=0.0481
[DFA] Ep 35: ||h_L||=3.075e+07 ||g_2||=4.826e-10 acc=0.1055 gamma_dfa=0.0478
[DFA] Ep 36: ||h_L||=3.269e+07 ||g_2||=4.582e-10 acc=0.1055 gamma_dfa=0.0478
[DFA] Ep 37: ||h_L||=3.458e+07 ||g_2||=4.370e-10 acc=0.1055 gamma_dfa=0.0480
[DFA] Ep 38: ||h_L||=3.663e+07 ||g_2||=4.178e-10 acc=0.1055 gamma_dfa=0.0481
[DFA] Ep 39: ||h_L||=3.877e+07 ||g_2||=4.003e-10 acc=0.1055 gamma_dfa=0.0479
[DFA] Ep 40: ||h_L||=4.085e+07 ||g_2||=3.838e-10 acc=0.1055 gamma_dfa=0.0483
[DFA] Ep 41: ||h_L||=4.301e+07 ||g_2||=3.697e-10 acc=0.1055 gamma_dfa=0.0488
[DFA] Ep 42: ||h_L||=4.527e+07 ||g_2||=3.547e-10 acc=0.1055 gamma_dfa=0.0488
[DFA] Ep 43: ||h_L||=4.735e+07 ||g_2||=3.417e-10 acc=0.1055 gamma_dfa=0.0487
[DFA] Ep 44: ||h_L||=4.957e+07 ||g_2||=3.287e-10 acc=0.1055 gamma_dfa=0.0491
[DFA] Ep 45: ||h_L||=5.152e+07 ||g_2||=3.176e-10 acc=0.1055 gamma_dfa=0.0493
[DFA] Ep 46: ||h_L||=5.370e+07 ||g_2||=3.079e-10 acc=0.1055 gamma_dfa=0.0490
[DFA] Ep 47: ||h_L||=5.579e+07 ||g_2||=2.985e-10 acc=0.1055 gamma_dfa=0.0497
[DFA] Ep 48: ||h_L||=5.788e+07 ||g_2||=2.902e-10 acc=0.1055 gamma_dfa=0.0495
[DFA] Ep 49: ||h_L||=6.001e+07 ||g_2||=2.819e-10 acc=0.1055 gamma_dfa=0.0495
[DFA] Ep 50: ||h_L||=6.212e+07 ||g_2||=2.740e-10 acc=0.1055 gamma_dfa=0.0500
[DFA] Ep 51: ||h_L||=6.409e+07 ||g_2||=2.676e-10 acc=0.1055 gamma_dfa=0.0503
[DFA] Ep 52: ||h_L||=6.611e+07 ||g_2||=2.606e-10 acc=0.1055 gamma_dfa=0.0498
[DFA] Ep 53: ||h_L||=6.824e+07 ||g_2||=2.535e-10 acc=0.1055 gamma_dfa=0.0503
[DFA] Ep 54: ||h_L||=7.033e+07 ||g_2||=2.483e-10 acc=0.1055 gamma_dfa=0.0506
[DFA] Ep 55: ||h_L||=7.230e+07 ||g_2||=2.428e-10 acc=0.1055 gamma_dfa=0.0507
[DFA] Ep 56: ||h_L||=7.415e+07 ||g_2||=2.379e-10 acc=0.1055 gamma_dfa=0.0508
[DFA] Ep 57: ||h_L||=7.599e+07 ||g_2||=2.338e-10 acc=0.1055 gamma_dfa=0.0508
[DFA] Ep 58: ||h_L||=7.792e+07 ||g_2||=2.293e-10 acc=0.1055 gamma_dfa=0.0510
[DFA] Ep 59: ||h_L||=7.974e+07 ||g_2||=2.247e-10 acc=0.1055 gamma_dfa=0.0511
[DFA] Ep 60: ||h_L||=8.161e+07 ||g_2||=2.218e-10 acc=0.1055 gamma_dfa=0.0513
[DFA] Ep 61: ||h_L||=8.329e+07 ||g_2||=2.178e-10 acc=0.1055 gamma_dfa=0.0515
[DFA] Ep 62: ||h_L||=8.490e+07 ||g_2||=2.139e-10 acc=0.1055 gamma_dfa=0.0518
[DFA] Ep 63: ||h_L||=8.655e+07 ||g_2||=2.119e-10 acc=0.1055 gamma_dfa=0.0518
[DFA] Ep 64: ||h_L||=8.808e+07 ||g_2||=2.085e-10 acc=0.1055 gamma_dfa=0.0519
[DFA] Ep 65: ||h_L||=8.967e+07 ||g_2||=2.067e-10 acc=0.1055 gamma_dfa=0.0517
[DFA] Ep 66: ||h_L||=9.106e+07 ||g_2||=2.040e-10 acc=0.1055 gamma_dfa=0.0519
[DFA] Ep 67: ||h_L||=9.243e+07 ||g_2||=2.017e-10 acc=0.1055 gamma_dfa=0.0520
[DFA] Ep 68: ||h_L||=9.373e+07 ||g_2||=1.995e-10 acc=0.1055 gamma_dfa=0.0521
[DFA] Ep 69: ||h_L||=9.486e+07 ||g_2||=1.975e-10 acc=0.1055 gamma_dfa=0.0522
[DFA] Ep 70: ||h_L||=9.607e+07 ||g_2||=1.956e-10 acc=0.1055 gamma_dfa=0.0521
[DFA] Ep 71: ||h_L||=9.723e+07 ||g_2||=1.938e-10 acc=0.1055 gamma_dfa=0.0521
[DFA] Ep 72: ||h_L||=9.818e+07 ||g_2||=1.921e-10 acc=0.1055 gamma_dfa=0.0522
[DFA] Ep 73: ||h_L||=9.925e+07 ||g_2||=1.908e-10 acc=0.1055 gamma_dfa=0.0523
[DFA] Ep 74: ||h_L||=1.003e+08 ||g_2||=1.891e-10 acc=0.1055 gamma_dfa=0.0523
[DFA] Ep 75: ||h_L||=1.012e+08 ||g_2||=1.877e-10 acc=0.1055 gamma_dfa=0.0524
[DFA] Ep 76: ||h_L||=1.020e+08 ||g_2||=1.867e-10 acc=0.1055 gamma_dfa=0.0523
[DFA] Ep 77: ||h_L||=1.028e+08 ||g_2||=1.857e-10 acc=0.1055 gamma_dfa=0.0524
[DFA] Ep 78: ||h_L||=1.035e+08 ||g_2||=1.846e-10 acc=0.1055 gamma_dfa=0.0524
[DFA] Ep 79: ||h_L||=1.041e+08 ||g_2||=1.838e-10 acc=0.1055 gamma_dfa=0.0525
[DFA] Ep 80: ||h_L||=1.047e+08 ||g_2||=1.829e-10 acc=0.1055 gamma_dfa=0.0526
[DFA] Ep 81: ||h_L||=1.052e+08 ||g_2||=1.821e-10 acc=0.1055 gamma_dfa=0.0527
[DFA] Ep 82: ||h_L||=1.057e+08 ||g_2||=1.815e-10 acc=0.1055 gamma_dfa=0.0527
[DFA] Ep 83: ||h_L||=1.062e+08 ||g_2||=1.808e-10 acc=0.1055 gamma_dfa=0.0526
[DFA] Ep 84: ||h_L||=1.066e+08 ||g_2||=1.802e-10 acc=0.1055 gamma_dfa=0.0527
[DFA] Ep 85: ||h_L||=1.070e+08 ||g_2||=1.797e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 86: ||h_L||=1.073e+08 ||g_2||=1.794e-10 acc=0.1055 gamma_dfa=0.0527
[DFA] Ep 87: ||h_L||=1.076e+08 ||g_2||=1.790e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 88: ||h_L||=1.079e+08 ||g_2||=1.787e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 89: ||h_L||=1.081e+08 ||g_2||=1.784e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 90: ||h_L||=1.082e+08 ||g_2||=1.782e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 91: ||h_L||=1.084e+08 ||g_2||=1.780e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 92: ||h_L||=1.085e+08 ||g_2||=1.778e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 93: ||h_L||=1.086e+08 ||g_2||=1.777e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 94: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 95: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 96: ||h_L||=1.087e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 97: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 98: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 99: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528
[DFA] Ep 100: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528
Saved results/h2_no_residual_full_s456/snapshot_evolution_s456.json
|