1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
|
{
"config": {
"num_blocks": 6,
"d_hidden": 256,
"seed": 42,
"bp_epochs": 100,
"estimator_epochs": 100,
"lr_fb": 0.001,
"lam": 0.1,
"K": 4,
"sigma_bridge": 0.05,
"ema_momentum": 0.995,
"term_grad_weight": 1.0
},
"bp_acc": 0.6172,
"summary": {
"dfa": {
"mean_gamma": 0.008224744617473334,
"mean_rho": -0.007729481750478347,
"mean_nudge": -1.4484473164581383e-05
},
"sb_eT": {
"mean_gamma": 0.28419415106376006,
"mean_rho": 0.24331255008776984,
"mean_nudge": -0.0010212107930177201
},
"cb_eT": {
"mean_gamma": 0.1356087997245292,
"mean_rho": 0.11836575530469418,
"mean_nudge": -0.000398846738486706
},
"cb_deltaL": {
"mean_gamma": 0.06269844393245876,
"mean_rho": 0.07167995596925418,
"mean_nudge": -0.000200468028197065
}
},
"per_layer": {
"dfa": {
"bp_cosine": [
-0.010780696198344231,
-0.0024464363697916268,
0.006427376973442733,
0.023271656595170498,
0.017338427528738976,
0.015538139175623656
],
"perturbation_rho": [
-0.018140554428100586,
0.003606993705034256,
-0.045406848192214966,
0.023949457332491875,
-0.016462121158838272,
0.00607618223875761
],
"nudging_0.001": [
3.0692412110511214e-05,
7.64157812227495e-06,
-9.760969987837598e-08,
-3.085116622969508e-05,
-1.6509711713297293e-05,
-1.9992370653199032e-05
],
"nudging_0.003": [
9.20678285183385e-05,
2.31226204050472e-05,
-2.7300666260998696e-07,
-9.241211228072643e-05,
-4.9478214350529015e-05,
-5.993395461700857e-05
],
"nudging_0.01": [
0.0003075606073252857,
7.720924622844905e-05,
-5.05835487274453e-07,
-0.0003076052526012063,
-0.00016470525588374585,
-0.00019945789244957268
]
},
"sb_eT": {
"bp_cosine": [
0.1685526818037033,
0.23167533278465272,
0.2697907418012619,
0.30822172164916994,
0.3446090370416641,
0.3823153913021088
],
"perturbation_rho": [
0.07154904305934906,
0.19288617372512817,
0.2876003682613373,
0.27649810910224915,
0.3115084767341614,
0.3198331296443939
],
"nudging_0.001": [
-0.00018972528050653636,
-0.0002750377752818167,
-0.00032653682865202427,
-0.00039390879101119936,
-0.00042474071960896254,
-0.00043361991993151605
],
"nudging_0.003": [
-0.0005688090459443629,
-0.0008246920770034194,
-0.0009791019838303328,
-0.00118098477832973,
-0.001273483969271183,
-0.001300192903727293
],
"nudging_0.01": [
-0.0018940127920359373,
-0.0027450949419289827,
-0.0032586848828941584,
-0.003929748199880123,
-0.004237486980855465,
-0.004327159374952316
]
},
"cb_eT": {
"bp_cosine": [
0.045225401408970356,
0.053792066499590875,
0.08010791838169098,
0.12435948699712754,
0.19471128135919571,
0.31545664370059967
],
"perturbation_rho": [
0.024685420095920563,
-0.01572572812438011,
0.08793376386165619,
0.11664978414773941,
0.1602637767791748,
0.3363875150680542
],
"nudging_0.001": [
-2.2263082428253256e-05,
-5.150778451934457e-05,
-7.369300146820024e-05,
-0.00012175041774753481,
-0.00019730909843929112,
-0.000331797928083688
],
"nudging_0.003": [
-6.678207137156278e-05,
-0.00015438658010680228,
-0.0002208092628279701,
-0.00036489206831902266,
-0.0005915500223636627,
-0.0009946604259312153
],
"nudging_0.01": [
-0.00022176679340191185,
-0.0005135145038366318,
-0.0007348398794420063,
-0.0012142673367634416,
-0.0019682790152728558,
-0.0033080100547522306
]
},
"cb_deltaL": {
"bp_cosine": [
0.01903119832277298,
0.03658499242737889,
0.04136112704873085,
0.05426537357270718,
0.07572877742350101,
0.14921919479966164
],
"perturbation_rho": [
-0.004729617387056351,
0.06955375522375107,
0.07996401935815811,
0.11149539798498154,
0.055956777185201645,
0.11783940345048904
],
"nudging_0.001": [
-3.080447640968487e-05,
-4.9154667067341506e-05,
-5.3297979320632294e-05,
-5.973243969492614e-05,
-7.465035014320165e-05,
-0.00013362003664951771
],
"nudging_0.003": [
-9.23606421565637e-05,
-0.00014715960423927754,
-0.00015975572750903666,
-0.00017912944895215333,
-0.00022374786203727126,
-0.0004006548842880875
],
"nudging_0.01": [
-0.00030725268879905343,
-0.0004887805553153157,
-0.0005310464184731245,
-0.0005952278152108192,
-0.0007444550283253193,
-0.0013336975825950503
]
}
},
"sb_pred_error": [
8914.44174921875,
5038.8783640625,
4058.455402734375,
3433.17113046875,
2884.829894921875,
2573.41313515625
]
}
|