1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
|
{
"config": {
"output_dir": "results/optionA_smoke",
"epochs": 3,
"lr": 0.001,
"wd": 0.01,
"seed": 42,
"depth": 4,
"d_hidden": 256,
"log_every": 1,
"no_residual_add": false,
"w2_std": 0.01,
"random_targets": true,
"skip_bp": true
},
"depth": 4,
"d_hidden": 256,
"num_classes": 10,
"bp_log": null,
"dfa_log": [
{
"hidden_norms": [
8.718070030212402,
8.780964851379395,
8.812002182006836,
8.828720092773438,
8.893179893493652
],
"bp_grad_norms_per_sample_med": [
0.0010068593546748161,
0.000997236929833889,
0.0009934091940522194,
0.0009870644425973296,
0.0009829498594626784
],
"bp_grad_norms_F": [
0.03544403985142708,
0.03507080301642418,
0.03477022796869278,
0.03443896397948265,
0.03407429903745651
],
"gamma_dfa": 0.007406219025142491,
"acc_eval": 0.115234375,
"loss_eval": 2.383650302886963,
"epoch": 0
},
{
"hidden_norms": [
290.9817199707031,
627.6629028320312,
1287.7171630859375,
1459.1513671875,
1616.4718017578125
],
"bp_grad_norms_per_sample_med": [
5.262210834189318e-06,
5.14477824253845e-06,
5.1224119488324504e-06,
5.1222677939222194e-06,
5.123215942148818e-06
],
"bp_grad_norms_F": [
0.0008317740284837782,
0.0008041572291404009,
0.0007967103738337755,
0.0007942747906781733,
0.0007939037750475109
],
"gamma_dfa": -0.01952565903775394,
"acc_eval": 0.078125,
"loss_eval": 2.3129711151123047,
"epoch": 1
},
{
"hidden_norms": [
467.1022644042969,
3057.49267578125,
7424.37353515625,
8857.5537109375,
9767.6162109375
],
"bp_grad_norms_per_sample_med": [
9.694709888208308e-07,
8.50241519856354e-07,
8.498120678268606e-07,
8.498261649947381e-07,
8.499836781084014e-07
],
"bp_grad_norms_F": [
0.0005667012883350253,
0.0005514815566129982,
0.0005513231735676527,
0.0005382975214160979,
0.0005368698039092124
],
"gamma_dfa": -0.02370089991018176,
"acc_eval": 0.0810546875,
"loss_eval": 2.320453643798828,
"epoch": 2
},
{
"hidden_norms": [
524.08203125,
4883.1953125,
11064.0263671875,
13177.29296875,
14508.083984375
],
"bp_grad_norms_per_sample_med": [
6.069666369512561e-07,
5.623286938316596e-07,
5.621984087156306e-07,
5.621164973490522e-07,
5.620748311230273e-07
],
"bp_grad_norms_F": [
0.0005193821853026748,
0.0004981618840247393,
0.0004926337860524654,
0.0004888861440122128,
0.0004883570945821702
],
"gamma_dfa": -0.024675255175679922,
"acc_eval": 0.0712890625,
"loss_eval": 2.3067145347595215,
"epoch": 3
}
]
}
|