summaryrefslogtreecommitdiff
path: root/results/h2_smoke_w0.5/snapshot_evolution_s42.json
blob: 8c75ebdda37e39a1e96a8a6ca416551ee26876f5 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
{
  "config": {
    "output_dir": "results/h2_smoke_w0.5",
    "epochs": 3,
    "lr": 0.001,
    "wd": 0.01,
    "seed": 42,
    "depth": 4,
    "d_hidden": 256,
    "log_every": 1,
    "no_residual_add": true,
    "w2_std": 0.5
  },
  "depth": 4,
  "d_hidden": 256,
  "num_classes": 10,
  "bp_log": [
    {
      "hidden_norms": [
        8.718070030212402,
        42.802223205566406,
        44.22697067260742,
        46.05121994018555,
        46.896766662597656
      ],
      "bp_grad_norms_per_sample_med": [
        0.0010791289387270808,
        0.0002035950165009126,
        0.00014324457151815295,
        0.00011542177526280284,
        9.846547618508339e-05
      ],
      "bp_grad_norms_F": [
        0.0380445197224617,
        0.00666962843388319,
        0.0046500470489263535,
        0.003719294909387827,
        0.003155440790578723
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.080078125,
      "loss_eval": 2.446239709854126,
      "epoch": 0
    },
    {
      "hidden_norms": [
        86.00836944580078,
        130.30899047851562,
        107.6886215209961,
        127.31951141357422,
        155.31224060058594
      ],
      "bp_grad_norms_per_sample_med": [
        5.636421337840147e-05,
        4.504464232013561e-05,
        4.254864325048402e-05,
        4.0549883124185726e-05,
        3.8371628761524335e-05
      ],
      "bp_grad_norms_F": [
        0.0019479888724163175,
        0.0014867106219753623,
        0.0013919975608587265,
        0.001322419848293066,
        0.0012390650808811188
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.1435546875,
      "loss_eval": 2.293787717819214,
      "epoch": 1
    },
    {
      "hidden_norms": [
        103.2545166015625,
        142.36724853515625,
        117.42737579345703,
        145.57473754882812,
        174.0562744140625
      ],
      "bp_grad_norms_per_sample_med": [
        5.0501937948865816e-05,
        4.213622378301807e-05,
        3.962606206187047e-05,
        3.741410546354018e-05,
        3.486485002213158e-05
      ],
      "bp_grad_norms_F": [
        0.001744136679917574,
        0.0013844756176695228,
        0.0012931021628901362,
        0.0012163385981693864,
        0.0011240089079365134
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.1640625,
      "loss_eval": 2.2804112434387207,
      "epoch": 2
    },
    {
      "hidden_norms": [
        99.97102355957031,
        140.33131408691406,
        110.34066772460938,
        136.7115936279297,
        163.25784301757812
      ],
      "bp_grad_norms_per_sample_med": [
        5.4715037549613044e-05,
        4.477328184293583e-05,
        4.2219675378873944e-05,
        3.9974820538191125e-05,
        3.672601087600924e-05
      ],
      "bp_grad_norms_F": [
        0.0019211760954931378,
        0.0015042650047689676,
        0.0013935193419456482,
        0.0013014256255701184,
        0.0011887947330251336
      ],
      "gamma_dfa": NaN,
      "acc_eval": 0.1630859375,
      "loss_eval": 2.294424057006836,
      "epoch": 3
    }
  ],
  "dfa_log": [
    {
      "hidden_norms": [
        8.718070030212402,
        42.802223205566406,
        44.22697067260742,
        46.05121994018555,
        46.896766662597656
      ],
      "bp_grad_norms_per_sample_med": [
        0.0010791289387270808,
        0.0002035950165009126,
        0.00014324457151815295,
        0.00011542177526280284,
        9.846547618508339e-05
      ],
      "bp_grad_norms_F": [
        0.0380445197224617,
        0.00666962843388319,
        0.0046500470489263535,
        0.003719294909387827,
        0.003155440790578723
      ],
      "gamma_dfa": 0.004864378133788705,
      "acc_eval": 0.080078125,
      "loss_eval": 2.446239709854126,
      "epoch": 0
    },
    {
      "hidden_norms": [
        1180.2318115234375,
        5768.2900390625,
        5472.90234375,
        6369.3427734375,
        5295.2470703125
      ],
      "bp_grad_norms_per_sample_med": [
        1.2146981589467032e-06,
        8.634061714474228e-07,
        8.587696811446222e-07,
        8.589160529481887e-07,
        8.53334995554178e-07
      ],
      "bp_grad_norms_F": [
        6.592504360014573e-05,
        4.607137088896707e-05,
        4.4360855099512264e-05,
        4.341698149801232e-05,
        4.290258584660478e-05
      ],
      "gamma_dfa": 0.0467059058137238,
      "acc_eval": 0.15625,
      "loss_eval": 2.2713985443115234,
      "epoch": 1
    },
    {
      "hidden_norms": [
        2312.98193359375,
        25168.3515625,
        22182.9609375,
        23364.205078125,
        16927.552734375
      ],
      "bp_grad_norms_per_sample_med": [
        4.0056002603705565e-07,
        2.224278716767003e-07,
        2.2240433850129193e-07,
        2.2153939482905116e-07,
        2.2145297862152802e-07
      ],
      "bp_grad_norms_F": [
        3.370734702912159e-05,
        1.619783870410174e-05,
        1.508272544015199e-05,
        1.4707649825140834e-05,
        1.4549447769240942e-05
      ],
      "gamma_dfa": 0.04014483268838376,
      "acc_eval": 0.1513671875,
      "loss_eval": 2.315417528152466,
      "epoch": 2
    },
    {
      "hidden_norms": [
        2703.50634765625,
        35877.58203125,
        30404.849609375,
        31748.2421875,
        22049.421875
      ],
      "bp_grad_norms_per_sample_med": [
        3.239594548176683e-07,
        1.6274317715669895e-07,
        1.625548691208678e-07,
        1.6296479543598252e-07,
        1.628933432584745e-07
      ],
      "bp_grad_norms_F": [
        2.923223473771941e-05,
        1.1944111065531615e-05,
        1.1137096407765057e-05,
        1.09043749034754e-05,
        1.0791579370561522e-05
      ],
      "gamma_dfa": 0.039210652525071055,
      "acc_eval": 0.1484375,
      "loss_eval": 2.3342530727386475,
      "epoch": 3
    }
  ]
}