1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
|
{
"config": {
"seed": 42,
"max_epoch": 5,
"lr": 0.001,
"wd": 0.01,
"save_at": [
1,
2,
3,
4,
5
],
"output_dir": "results/vanilla_dfa_early_ckpts"
},
"log": [
{
"epoch": 0,
"h_norms": [
8.718070030212402,
8.780964851379395,
8.812002182006836,
8.828720092773438,
8.893179893493652
],
"g_norms": [
0.0010068593546748161,
0.000997236929833889,
0.0009934091940522194,
0.0009870644425973296,
0.0009829498594626784
]
},
{
"epoch": 1,
"h_norms": [
802.1658935546875,
3058.3173828125,
4910.8408203125,
6491.31494140625,
7304.1533203125
],
"g_norms": [
2.526000798752648e-06,
1.3625027577290894e-06,
1.3747999219049234e-06,
1.378283172925876e-06,
1.3869492931917193e-06
]
},
{
"epoch": 2,
"h_norms": [
1580.3233642578125,
13323.4609375,
22799.7890625,
32449.083984375,
37769.375
],
"g_norms": [
1.142504174822534e-06,
3.0893900770934124e-07,
3.109949489044084e-07,
3.1369876296594157e-07,
3.1714918691250205e-07
]
},
{
"epoch": 3,
"h_norms": [
2344.037841796875,
32468.109375,
58174.1328125,
87268.390625,
104689.5234375
],
"g_norms": [
8.221624625548429e-07,
1.3046170010966307e-07,
1.2744629884764436e-07,
1.2940536464611796e-07,
1.2926365400289797e-07
]
},
{
"epoch": 4,
"h_norms": [
3132.316162109375,
62912.65234375,
117831.9375,
183012.40625,
223974.890625
],
"g_norms": [
6.481430432359048e-07,
7.028656057173066e-08,
6.718681078154987e-08,
6.803762175877637e-08,
6.805611008076085e-08
]
},
{
"epoch": 5,
"h_norms": [
3947.822998046875,
109389.84375,
203877.265625,
330289.25,
405665.21875
],
"g_norms": [
5.139339123161335e-07,
4.3603474608744364e-08,
4.2005297018476995e-08,
4.2576637326874334e-08,
4.249179852422458e-08
]
}
]
}
|