1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
|
[
{
"method": "dfa",
"L": 4,
"d_hidden": 256,
"seed": 42,
"warmup_ratio": 0.2,
"term_grad_weight": 1.0,
"test_acc": 0.3116,
"mean_gamma": 0.10076353600015864,
"mean_rho": -0.00476757250726223,
"mean_nudge": -3.260793164372444e-07,
"per_layer_gamma": [
0.42987197637557983,
0.002452872460708022,
-0.014306485652923584,
-0.014964219182729721
],
"per_layer_rho": [
-0.01907029002904892,
0.0,
0.0,
0.0
],
"per_layer_nudge": [
-1.3024546205997467e-06,
-1.862645149230957e-09,
0.0,
0.0
]
},
{
"method": "cb_eT",
"L": 4,
"d_hidden": 256,
"seed": 42,
"warmup_ratio": 0.2,
"term_grad_weight": 1.0,
"test_acc": 0.283,
"mean_gamma": 0.17921950668096542,
"mean_rho": 0.008699589408934116,
"mean_nudge": -8.21426510810852e-07,
"per_layer_gamma": [
0.5069771409034729,
0.05348020792007446,
0.07490736246109009,
0.08151331543922424
],
"per_layer_rho": [
0.034798357635736465,
0.0,
0.0,
0.0
],
"per_layer_nudge": [
-3.285706043243408e-06,
0.0,
0.0,
0.0
]
}
]
|