1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
|
{
"config": {
"num_blocks": 4,
"d_hidden": 256,
"seed": 42,
"bp_acc": 0.6173,
"estimator_epochs": 100
},
"summary": {
"dfa": {
"mean_gamma": 0.004863154428312555,
"mean_rho": 0.0046705943532288074,
"mean_nudge": -5.86726059736975e-06
},
"sb_eT": {
"mean_gamma": 0.2866372682154179,
"mean_rho": 0.2637173905968666,
"mean_nudge": -0.0009568915702402592
},
"cb_eT": {
"mean_gamma": 0.11484479499049485,
"mean_rho": 0.1202746294438839,
"mean_nudge": -0.00036998098585172556
},
"cb_deltaL": {
"mean_gamma": 0.06995358848944307,
"mean_rho": 0.034168413607403636,
"mean_nudge": -0.00015994706336641684
},
"vec_eT_M4": {
"mean_gamma": 0.3634969729930162,
"mean_rho": 0.42595484107732773,
"mean_nudge": -0.0014062844711588696
},
"vec_eT_M8": {
"mean_gamma": 0.3636624652892351,
"mean_rho": 0.3955033980309963,
"mean_nudge": -0.0013793499529128894
},
"vec_eT_M16": {
"mean_gamma": 0.3677208840847015,
"mean_rho": 0.42224912345409393,
"mean_nudge": -0.001392927297274582
}
},
"per_layer": {
"dfa": {
"bp_cosine": [
0.0033329044468700885,
-0.007507461798377335,
0.022020796407014133,
0.0016063786577433347
],
"perturbation_rho": [
-0.0401616208255291,
-0.018128124997019768,
0.04789097607135773,
0.02908114716410637
],
"nudging_0.003": [
4.354264819994569e-05,
3.3159449230879545e-05,
-9.052902169059962e-05,
-9.642118129704613e-06
]
},
"sb_eT": {
"bp_cosine": [
0.19993784725666047,
0.2704531639814377,
0.3183140277862549,
0.35784403383731844
],
"perturbation_rho": [
0.1395200788974762,
0.2829156517982483,
0.2831076979637146,
0.34932613372802734
],
"nudging_0.003": [
-0.0006005102768540382,
-0.0009154834551736712,
-0.001120006782002747,
-0.0011915657669305801
]
},
"cb_eT": {
"bp_cosine": [
0.045131212659180166,
0.06221269443631172,
0.1209193505346775,
0.23111592233181
],
"perturbation_rho": [
0.03551628440618515,
0.11640645563602448,
0.07594657689332962,
0.25322920083999634
],
"nudging_0.003": [
-0.00016947659605648369,
-0.00026502960827201605,
-0.0003360719420015812,
-0.0007093457970768213
]
},
"cb_deltaL": {
"bp_cosine": [
0.03819061610847711,
0.05208469983190298,
0.06935825981199742,
0.12018077820539474
],
"perturbation_rho": [
-0.01345862727612257,
-0.014757020398974419,
0.03974407538771629,
0.12514522671699524
],
"nudging_0.003": [
-6.710628804285079e-05,
-7.37799855414778e-05,
-0.00012205714301671833,
-0.00037684483686462045
]
},
"vec_eT_M4": {
"bp_cosine": [
0.16388139724731446,
0.26098581701517104,
0.41548662185668944,
0.61363405585289
],
"perturbation_rho": [
0.22898420691490173,
0.339008092880249,
0.4533805847167969,
0.6824464797973633
],
"nudging_0.003": [
-0.0007082110387273133,
-0.0010581386741250753,
-0.0016506186220794916,
-0.002208169549703598
]
},
"vec_eT_M8": {
"bp_cosine": [
0.17386804670095443,
0.268336746096611,
0.406103777885437,
0.606341290473938
],
"perturbation_rho": [
0.19708333909511566,
0.2918933629989624,
0.4379217028617859,
0.6551151871681213
],
"nudging_0.003": [
-0.0007086814730428159,
-0.0010243982542306185,
-0.0016026028897613287,
-0.0021817171946167946
]
},
"vec_eT_M16": {
"bp_cosine": [
0.17664430439472198,
0.27206156253814695,
0.41649516522884367,
0.6056825041770935
],
"perturbation_rho": [
0.20988652110099792,
0.3382995128631592,
0.469192236661911,
0.6716182231903076
],
"nudging_0.003": [
-0.0007140585803426802,
-0.0010502493241801858,
-0.0016202025581151247,
-0.0021871987264603376
]
}
}
}
|