1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
|
{
"config": {
"output_dir": "results/h2_smoketest",
"epochs": 1,
"lr": 0.001,
"wd": 0.01,
"seed": 42,
"depth": 4,
"d_hidden": 256,
"log_every": 1,
"no_residual_add": true,
"w2_std": 0.05
},
"depth": 4,
"d_hidden": 256,
"num_classes": 10,
"bp_log": [
{
"hidden_norms": [
8.718070030212402,
4.280222415924072,
4.422238349914551,
4.604765892028809,
4.6893696784973145
],
"bp_grad_norms_per_sample_med": [
0.0010339331347495317,
0.0009070215164683759,
0.0008196940761990845,
0.000755702203605324,
0.0006969328387640417
],
"bp_grad_norms_F": [
0.036222200840711594,
0.030558692291378975,
0.027158580720424652,
0.02468229830265045,
0.022657815366983414
],
"gamma_dfa": NaN,
"acc_eval": 0.1123046875,
"loss_eval": 2.414133310317993,
"epoch": 0
},
{
"hidden_norms": [
85.9231185913086,
17.862314224243164,
18.3341064453125,
20.362960815429688,
26.587692260742188
],
"bp_grad_norms_per_sample_med": [
8.575361425755545e-05,
8.537247049389407e-05,
8.530700870323926e-05,
8.512997737852857e-05,
8.473115303786471e-05
],
"bp_grad_norms_F": [
0.0030727137345820665,
0.003054599277675152,
0.0030425451695919037,
0.0030279208440333605,
0.0030008067842572927
],
"gamma_dfa": NaN,
"acc_eval": 0.0576171875,
"loss_eval": 2.5138001441955566,
"epoch": 1
}
],
"dfa_log": [
{
"hidden_norms": [
8.718070030212402,
4.280222415924072,
4.422238349914551,
4.604765892028809,
4.6893696784973145
],
"bp_grad_norms_per_sample_med": [
0.0010339331347495317,
0.0009070215164683759,
0.0008196940761990845,
0.000755702203605324,
0.0006969328387640417
],
"bp_grad_norms_F": [
0.036222200840711594,
0.030558692291378975,
0.027158580720424652,
0.02468229830265045,
0.022657815366983414
],
"gamma_dfa": 0.004694993258453906,
"acc_eval": 0.1123046875,
"loss_eval": 2.414133310317993,
"epoch": 0
},
{
"hidden_norms": [
1363.396484375,
5623.7373046875,
6282.16259765625,
6187.54150390625,
3601.992919921875
],
"bp_grad_norms_per_sample_med": [
1.0316066436644178e-06,
8.392997301598371e-07,
8.332735319527274e-07,
8.32648026971583e-07,
8.310838666147902e-07
],
"bp_grad_norms_F": [
7.324694888666272e-05,
4.777986396220513e-05,
4.688410263042897e-05,
4.647139576263726e-05,
4.622975757229142e-05
],
"gamma_dfa": 0.029530375730246305,
"acc_eval": 0.1015625,
"loss_eval": 2.2971253395080566,
"epoch": 1
}
]
}
|