1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
|
{
"config": {
"num_blocks": 4,
"d_hidden": 512,
"seed": 42,
"bp_epochs": 100,
"estimator_epochs": 100,
"lr_fb": 0.001,
"lam": 0.1,
"K": 4,
"sigma_bridge": 0.05,
"ema_momentum": 0.995,
"term_grad_weight": 1.0
},
"bp_acc": 0.6046,
"summary": {
"dfa": {
"mean_gamma": 0.00014940524997655283,
"mean_rho": 0.0021846434101462364,
"mean_nudge": 9.80043569143163e-06
},
"sb_eT": {
"mean_gamma": 0.16364388447254896,
"mean_rho": 0.1367498729377985,
"mean_nudge": -0.0008324724767589942
},
"cb_eT": {
"mean_gamma": 0.05695507084019482,
"mean_rho": 0.10538733564317226,
"mean_nudge": -0.00041578355740057305
},
"cb_deltaL": {
"mean_gamma": 0.03857357995584607,
"mean_rho": 0.02690578391775489,
"mean_nudge": -0.00015572691336274147
}
},
"per_layer": {
"dfa": {
"bp_cosine": [
0.0003761224914342165,
0.0014630826306529343,
0.0025856316089630125,
-0.0038272157311439515
],
"perturbation_rho": [
0.041057292371988297,
0.04760625958442688,
-0.04939739778637886,
-0.03052758052945137
],
"nudging_0.001": [
-6.823556759627536e-07,
5.570012035605032e-06,
7.243079380714335e-07,
7.61153205530718e-06
],
"nudging_0.003": [
-2.2219755919650197e-06,
1.6406695067416877e-05,
2.2961030481383204e-06,
2.2720920242136344e-05
],
"nudging_0.01": [
-7.2418697527609766e-06,
5.4833959438838065e-05,
7.364731573034078e-06,
7.559901860076934e-05
]
},
"sb_eT": {
"bp_cosine": [
0.11779971644282342,
0.15058264434337615,
0.1757924109697342,
0.2104007661342621
],
"perturbation_rho": [
0.05106552690267563,
0.14929687976837158,
0.1366019994020462,
0.21003508567810059
],
"nudging_0.001": [
-0.00020435426267795265,
-0.000274428486591205,
-0.0003065963101107627,
-0.0003246065170969814
],
"nudging_0.003": [
-0.0006134338327683508,
-0.0008232325781136751,
-0.0009195499587804079,
-0.0009736735373735428
],
"nudging_0.01": [
-0.0020439010113477707,
-0.0027431542985141277,
-0.0030633914284408092,
-0.003243957180529833
]
},
"cb_eT": {
"bp_cosine": [
0.028400307334959508,
0.030753960087895393,
0.04988271631300449,
0.11878329962491989
],
"perturbation_rho": [
0.06698533892631531,
0.07322317361831665,
0.11097840219736099,
0.1703624278306961
],
"nudging_0.001": [
-8.199035073630512e-05,
-9.967104415409267e-05,
-0.00014070692122913897,
-0.00023186377075035125
],
"nudging_0.003": [
-0.000246370182139799,
-0.000298988597933203,
-0.0004220257396809757,
-0.0006957497098483145
],
"nudging_0.01": [
-0.0008211369859054685,
-0.0009962331969290972,
-0.0014064292190596461,
-0.0023175508249551058
]
},
"cb_deltaL": {
"bp_cosine": [
0.019338275119662286,
0.03327283784747124,
0.040172213315963747,
0.061510993540287016
],
"perturbation_rho": [
-0.0003883522003889084,
0.029364485293626785,
0.04492279514670372,
0.03372420743107796
],
"nudging_0.001": [
-2.7410198526922613e-05,
-5.19197310495656e-05,
-6.934596603969112e-05,
-5.898199015064165e-05
],
"nudging_0.003": [
-8.237811562139541e-05,
-0.00015559815801680088,
-0.00020809093257412314,
-0.00017684044723864645
],
"nudging_0.01": [
-0.00027475334354676306,
-0.000518541899509728,
-0.0006934736738912761,
-0.0005893784109503031
]
}
},
"sb_pred_error": [
32627.8307125,
17715.490584375,
13710.30735,
10994.33838125
]
}
|