1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
|
{
"config": {
"num_blocks": 4,
"d_hidden": 256,
"seed": 42,
"bp_epochs": 100,
"estimator_epochs": 100,
"lr_fb": 0.001,
"lam": 0.1,
"K": 4,
"sigma_bridge": 0.05,
"ema_momentum": 0.995,
"term_grad_weight": 1.0
},
"bp_acc": 0.6173,
"summary": {
"dfa": {
"mean_gamma": 0.005605479117366485,
"mean_rho": 0.005194449331611395,
"mean_nudge": -2.151036460418254e-05
},
"sb_eT": {
"mean_gamma": 0.2866372682154179,
"mean_rho": 0.24588057771325111,
"mean_nudge": -0.0009568915702402592
},
"cb_eT": {
"mean_gamma": 0.11484479499049485,
"mean_rho": 0.125152001157403,
"mean_nudge": -0.00036998098585172556
},
"cb_deltaL": {
"mean_gamma": 0.06995358848944307,
"mean_rho": 0.06243711616843939,
"mean_nudge": -0.00015994706336641684
}
},
"per_layer": {
"dfa": {
"bp_cosine": [
0.01097307917661965,
-0.00982702277833596,
0.004532583430409432,
0.016743276640772818
],
"perturbation_rho": [
0.0032103070989251137,
-0.030966611579060555,
0.06208299845457077,
-0.01354889664798975
],
"nudging_0.001": [
-3.2122152333613485e-06,
7.709997589699924e-06,
-2.053854950645473e-05,
-1.2655042155529372e-05
],
"nudging_0.003": [
-9.568146197125316e-06,
2.312526703462936e-05,
-6.160693010315299e-05,
-3.799164915108122e-05
],
"nudging_0.01": [
-3.1933166610542685e-05,
7.745913171675056e-05,
-0.0002052279596682638,
-0.00012646839604713023
]
},
"sb_eT": {
"bp_cosine": [
0.19993784725666047,
0.2704531639814377,
0.3183140277862549,
0.35784403383731844
],
"perturbation_rho": [
0.14796550571918488,
0.23224923014640808,
0.27324193716049194,
0.33006563782691956
],
"nudging_0.001": [
-0.00020024771220050752,
-0.00030526291811838746,
-0.0003735219652298838,
-0.0003972915874328464
],
"nudging_0.003": [
-0.0006005102768540382,
-0.0009154834551736712,
-0.001120006782002747,
-0.0011915657669305801
],
"nudging_0.01": [
-0.002000064356252551,
-0.0030484027229249477,
-0.0037288377061486244,
-0.0039670998230576515
]
},
"cb_eT": {
"bp_cosine": [
0.045131212659180166,
0.06221269443631172,
0.1209193505346775,
0.23111592233181
],
"perturbation_rho": [
0.05690425634384155,
0.10793692618608475,
0.10616493225097656,
0.2296018898487091
],
"nudging_0.001": [
-5.6506225519115105e-05,
-8.837308996589854e-05,
-0.00011208542855456471,
-0.00023653265088796616
],
"nudging_0.003": [
-0.00016947659605648369,
-0.00026502960827201605,
-0.0003360719420015812,
-0.0007093457970768213
],
"nudging_0.01": [
-0.0005644541233778,
-0.0008825073018670082,
-0.0011192080564796925,
-0.0023615544196218252
]
},
"cb_deltaL": {
"bp_cosine": [
0.03819061610847711,
0.05208469983190298,
0.06935825981199742,
0.12018077820539474
],
"perturbation_rho": [
0.047517478466033936,
0.013643201440572739,
0.04729664325714111,
0.14129114151000977
],
"nudging_0.001": [
-2.239555396954529e-05,
-2.458264680171851e-05,
-4.0700091631151736e-05,
-0.0001256012765225023
],
"nudging_0.003": [
-6.710628804285079e-05,
-7.37799855414778e-05,
-0.00012205714301671833,
-0.00037684483686462045
],
"nudging_0.01": [
-0.0002235029242001474,
-0.00024507055059075356,
-0.00040636284393258393,
-0.0012548293452709913
]
}
},
"sb_pred_error": [
9093.49886875,
3872.840365234375,
2899.67371015625,
2407.756592578125
]
}
|