1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
|
[
{
"method": "dfa",
"L": 4,
"d_hidden": 256,
"seed": 456,
"warmup_ratio": 0.2,
"term_grad_weight": 1.0,
"test_acc": 0.297,
"mean_gamma": 0.09892195643624291,
"mean_rho": -0.004888533148914576,
"mean_nudge": -3.1944364309310913e-07,
"per_layer_gamma": [
0.3969520926475525,
-0.0020016406197100878,
-0.0031630932353436947,
0.003900466952472925
],
"per_layer_rho": [
-0.019554132595658302,
0.0,
0.0,
0.0
],
"per_layer_nudge": [
-1.2777745723724365e-06,
0.0,
0.0,
0.0
]
},
{
"method": "cb_eT",
"L": 4,
"d_hidden": 256,
"seed": 456,
"warmup_ratio": 0.2,
"term_grad_weight": 1.0,
"test_acc": 0.2893,
"mean_gamma": 0.23417379707098007,
"mean_rho": -0.002338360995054245,
"mean_nudge": -5.409820005297661e-07,
"per_layer_gamma": [
0.41382449865341187,
0.12546014785766602,
0.1961553394794464,
0.201255202293396
],
"per_layer_rho": [
-0.00935344398021698,
0.0,
0.0,
0.0
],
"per_layer_nudge": [
-2.1639280021190643e-06,
0.0,
0.0,
0.0
]
}
]
|