summaryrefslogtreecommitdiff
path: root/results/h2_smoke_w0.1/snapshot_evolution_s42.json
blob: d085d3c902de2ac74a61dcabf00a2c3e18dd0971 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
{
  "config": {
    "output_dir": "results/h2_smoke_w0.1",
    "epochs": 3,
    "lr": 0.001,
    "wd": 0.01,
    "seed": 42,
    "depth": 4,
    "d_hidden": 256,
    "log_every": 1,
    "no_residual_add": true,
    "w2_std": 0.1
  },
  "depth": 4,
  "d_hidden": 256,
  "num_classes": 10,
  "bp_log": [
    {
      "hidden_norms": [
        8.718070030212402,
        8.560444831848145,
        8.845171928405762,
        9.21005916595459,
        9.379204750061035
      ],
      "bp_grad_norms_per_sample_med": [
        0.001055641332641244,
        0.0007215326768346131,
        0.0005827629356645048,
        0.0004979022196494043,
        0.00043998067849315703
      ],
      "bp_grad_norms_F": [
        0.036981210112571716,
        0.023669881746172905,
        0.018871067091822624,
        0.016073165461421013,
        0.014115042984485626
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.09375,
      "loss_eval": 2.4311001300811768,
      "epoch": 0
    },
    {
      "hidden_norms": [
        85.71797180175781,
        28.746126174926758,
        27.666101455688477,
        31.958999633789062,
        39.62472915649414
      ],
      "bp_grad_norms_per_sample_med": [
        8.686084765940905e-05,
        8.580532448831946e-05,
        8.54266545502469e-05,
        8.48824274726212e-05,
        8.353861630894244e-05
      ],
      "bp_grad_norms_F": [
        0.003033322049304843,
        0.002979709068313241,
        0.0029494145419448614,
        0.002918587066233158,
        0.0028573593590408564
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.05859375,
      "loss_eval": 2.529827356338501,
      "epoch": 1
    },
    {
      "hidden_norms": [
        103.60254669189453,
        33.103458404541016,
        32.14752197265625,
        38.19721984863281,
        48.121864318847656
      ],
      "bp_grad_norms_per_sample_med": [
        7.112277671694756e-05,
        7.050936983432621e-05,
        7.047054532449692e-05,
        6.984646461205557e-05,
        6.839916750323027e-05
      ],
      "bp_grad_norms_F": [
        0.002462180098518729,
        0.0024272387381643057,
        0.002406709361821413,
        0.002380331512540579,
        0.0023274135310202837
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.0703125,
      "loss_eval": 2.518604278564453,
      "epoch": 2
    },
    {
      "hidden_norms": [
        99.88206481933594,
        32.27016830444336,
        29.376516342163086,
        35.85775375366211,
        44.175907135009766
      ],
      "bp_grad_norms_per_sample_med": [
        7.549120346084237e-05,
        7.506681140512228e-05,
        7.482277578674257e-05,
        7.426074444083497e-05,
        7.269046182045713e-05
      ],
      "bp_grad_norms_F": [
        0.002598837483674288,
        0.00256195105612278,
        0.002536388346925378,
        0.0025058977771550417,
        0.002439383417367935
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.072265625,
      "loss_eval": 2.5117571353912354,
      "epoch": 3
    }
  ],
  "dfa_log": [
    {
      "hidden_norms": [
        8.718070030212402,
        8.560444831848145,
        8.845171928405762,
        9.21005916595459,
        9.379204750061035
      ],
      "bp_grad_norms_per_sample_med": [
        0.001055641332641244,
        0.0007215326768346131,
        0.0005827629356645048,
        0.0004979022196494043,
        0.00043998067849315703
      ],
      "bp_grad_norms_F": [
        0.036981210112571716,
        0.023669881746172905,
        0.018871067091822624,
        0.016073165461421013,
        0.014115042984485626
      ],
      "gamma_dfa": 0.0034602322848513722,
      "acc_eval": 0.09375,
      "loss_eval": 2.4311001300811768,
      "epoch": 0
    },
    {
      "hidden_norms": [
        1321.57177734375,
        5876.37109375,
        5211.20947265625,
        5922.93798828125,
        3697.69580078125
      ],
      "bp_grad_norms_per_sample_med": [
        1.0980336355714826e-06,
        8.924058079173847e-07,
        8.845478305374854e-07,
        8.81322591794742e-07,
        8.844919534567453e-07
      ],
      "bp_grad_norms_F": [
        7.150410965550691e-05,
        5.026865619583987e-05,
        4.9243793910136446e-05,
        4.888495459454134e-05,
        4.859357068198733e-05
      ],
      "gamma_dfa": 0.03524830285459757,
      "acc_eval": 0.1181640625,
      "loss_eval": 2.2935099601745605,
      "epoch": 1
    },
    {
      "hidden_norms": [
        2543.9384765625,
        26885.123046875,
        22657.53515625,
        23760.638671875,
        13455.5205078125
      ],
      "bp_grad_norms_per_sample_med": [
        3.232785559248441e-07,
        2.0931234701038193e-07,
        2.086635788600688e-07,
        2.0885721596641815e-07,
        2.086642325593857e-07
      ],
      "bp_grad_norms_F": [
        3.009554711752571e-05,
        1.4969685253163334e-05,
        1.4619089597545099e-05,
        1.4558195289282594e-05,
        1.4452642062678933e-05
      ],
      "gamma_dfa": 0.03537877253256738,
      "acc_eval": 0.1201171875,
      "loss_eval": 2.3101487159729004,
      "epoch": 2
    },
    {
      "hidden_norms": [
        2961.771484375,
        39258.7265625,
        31789.115234375,
        32956.20703125,
        18197.2578125
      ],
      "bp_grad_norms_per_sample_med": [
        2.570918979927228e-07,
        1.4994434138770885e-07,
        1.4976241402564483e-07,
        1.4952657068079134e-07,
        1.4944804149763513e-07
      ],
      "bp_grad_norms_F": [
        2.3238537323777564e-05,
        1.1003003237419762e-05,
        1.0661849046300631e-05,
        1.0592500984785147e-05,
        1.0497028597455937e-05
      ],
      "gamma_dfa": 0.03636467596516013,
      "acc_eval": 0.12109375,
      "loss_eval": 2.3122406005859375,
      "epoch": 3
    }
  ]
}