summaryrefslogtreecommitdiff
path: root/results/smoke_test/results_fashionmnist.json
blob: 8fd82c036bbaa33686cd95a581d33d3361df91cf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
{
  "42": {
    "bp": {
      "log": {
        "train_loss": [
          0.7028828698158264,
          0.5331447437604269,
          0.4640675885995229,
          0.416527880080541,
          0.3784152720451355
        ],
        "train_acc": [
          0.73755,
          0.8002166666666667,
          0.8256666666666667,
          0.8436666666666667,
          0.8591833333333333
        ],
        "test_acc": [
          0.7939,
          0.8157,
          0.8379,
          0.8606,
          0.8658
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          1.0,
          1.0,
          1.0,
          1.0,
          1.0,
          1.0,
          1.0,
          1.0
        ],
        "perturbation_rho": [
          0.9998708367347717,
          0.9998407959938049,
          0.9997469186782837,
          0.9998122453689575,
          0.9997262358665466,
          0.9996491074562073,
          0.9996585845947266,
          0.9995328783988953
        ],
        "nudging": {
          "0.001": [
            -0.0019641336984932423,
            -0.00174636859446764,
            -0.00154352025128901,
            -0.0013810225063934922,
            -0.0012467722408473492,
            -0.0011190228397026658,
            -0.0010304137831553817,
            -0.0009783159475773573
          ],
          "0.003": [
            -0.005858615506440401,
            -0.005213461350649595,
            -0.004612031392753124,
            -0.004128905013203621,
            -0.0037290011532604694,
            -0.003348270896822214,
            -0.003083921270444989,
            -0.002928499598056078
          ],
          "0.01": [
            -0.019138235598802567,
            -0.017080917954444885,
            -0.015158241614699364,
            -0.013598069548606873,
            -0.01229821052402258,
            -0.01105712354183197,
            -0.010194781236350536,
            -0.009686501696705818
          ]
        }
      },
      "drift": {
        "embed.weight": 1.1395236897587921,
        "embed.bias": 0.6760135861021652,
        "blocks.0.ln.weight": 0.0347786583006382,
        "blocks.0.w1.weight": 0.8267150385727446,
        "blocks.0.w1.bias": 0.7665003752239994,
        "blocks.0.w2.weight": 2.522163826858937,
        "blocks.1.ln.weight": 0.0373835414648056,
        "blocks.1.w1.weight": 0.8094006579319112,
        "blocks.1.w1.bias": 0.7074648417912711,
        "blocks.1.w2.weight": 2.427488314293417,
        "blocks.2.ln.weight": 0.0362338162958622,
        "blocks.2.w1.weight": 0.7981608599321399,
        "blocks.2.w1.bias": 0.6653993627306621,
        "blocks.2.w2.weight": 2.3264717248101827,
        "blocks.3.ln.weight": 0.03489774093031883,
        "blocks.3.w1.weight": 0.8024856088475522,
        "blocks.3.w1.bias": 0.6243261101573547,
        "blocks.3.w2.weight": 2.2732641732905714,
        "blocks.4.ln.weight": 0.036862026900053024,
        "blocks.4.w1.weight": 0.7702369058900084,
        "blocks.4.w1.bias": 0.671902653164234,
        "blocks.4.w2.weight": 2.11229934068397,
        "blocks.5.ln.weight": 0.04049132019281387,
        "blocks.5.w1.weight": 0.74033776504041,
        "blocks.5.w1.bias": 0.6447910547850285,
        "blocks.5.w2.weight": 1.9146335569252138,
        "blocks.6.ln.weight": 0.03797098994255066,
        "blocks.6.w1.weight": 0.7241522377185389,
        "blocks.6.w1.bias": 0.6486550903936706,
        "blocks.6.w2.weight": 1.8210870137239685,
        "blocks.7.ln.weight": 0.03962903097271919,
        "blocks.7.w1.weight": 0.6992516513120532,
        "blocks.7.w1.bias": 0.7021825186584477,
        "blocks.7.w2.weight": 1.7902862835380957,
        "out_ln.weight": 0.026629405096173286,
        "out_head.weight": 0.5610428179907003,
        "out_head.bias": 0.24151687322978704
      }
    },
    "dfa": {
      "log": {
        "train_loss": [
          1.4100907169977823,
          1.4334057479222615,
          1.4326289967854817,
          1.4254953683853149,
          1.4169784986495972
        ],
        "train_acc": [
          0.4805,
          0.49806666666666666,
          0.49725,
          0.5031166666666667,
          0.5098
        ],
        "test_acc": [
          0.5175,
          0.5282,
          0.5025,
          0.5027,
          0.5338
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          0.2141590267419815,
          0.0797841027379036,
          0.04707183688879013,
          0.0032249214127659798,
          0.024886084720492363,
          -0.0050605954602360725,
          0.009758025407791138,
          0.020020857453346252
        ],
        "perturbation_rho": [
          0.07338915765285492,
          -0.004745986312627792,
          0.018682830035686493,
          0.031185101717710495,
          -0.02063235454261303,
          0.0006608979310840368,
          0.0,
          0.04759033024311066
        ],
        "nudging": {
          "0.001": [
            -3.5976991057395935e-06,
            2.3283064365386963e-09,
            -9.313225746154785e-10,
            -9.313225746154785e-09,
            4.656612873077393e-10,
            -3.725290298461914e-09,
            1.3969838619232178e-09,
            9.313225746154785e-10
          ],
          "0.003": [
            -1.0745832696557045e-05,
            2.3283064365386963e-09,
            1.6298145055770874e-09,
            -2.3283064365386963e-09,
            6.752088665962219e-09,
            1.0244548320770264e-08,
            -4.6566128730773926e-09,
            0.0
          ],
          "0.01": [
            -3.5760458558797836e-05,
            -9.313225746154785e-10,
            1.3271346688270569e-08,
            -1.0244548320770264e-08,
            -8.381903171539307e-09,
            4.1443854570388794e-08,
            8.847564458847046e-09,
            1.30385160446167e-08
          ]
        }
      },
      "drift": {
        "embed.weight": 34.15137184586086,
        "embed.bias": 25.886722942466992,
        "blocks.0.ln.weight": 2.2413852214813232,
        "blocks.0.w1.weight": 42.91370684219911,
        "blocks.0.w1.bias": 42.38937429728957,
        "blocks.0.w2.weight": 115.11173260217275,
        "blocks.1.ln.weight": 2.0233230590820312,
        "blocks.1.w1.weight": 36.64772802731374,
        "blocks.1.w1.bias": 34.57367344043412,
        "blocks.1.w2.weight": 84.1198032305499,
        "blocks.2.ln.weight": 1.9000216722488403,
        "blocks.2.w1.weight": 33.172328512058,
        "blocks.2.w1.bias": 31.908254113444393,
        "blocks.2.w2.weight": 78.32752075434591,
        "blocks.3.ln.weight": 1.9099335670471191,
        "blocks.3.w1.weight": 36.73019631908303,
        "blocks.3.w1.bias": 32.60666919280332,
        "blocks.3.w2.weight": 83.75068434979308,
        "blocks.4.ln.weight": 1.891120195388794,
        "blocks.4.w1.weight": 35.27032832987592,
        "blocks.4.w1.bias": 38.017692746712825,
        "blocks.4.w2.weight": 80.26417466790754,
        "blocks.5.ln.weight": 2.0106024742126465,
        "blocks.5.w1.weight": 42.09808335703852,
        "blocks.5.w1.bias": 43.15100280108635,
        "blocks.5.w2.weight": 94.64753309078039,
        "blocks.6.ln.weight": 1.8941009044647217,
        "blocks.6.w1.weight": 38.94163125135345,
        "blocks.6.w1.bias": 38.10426587138794,
        "blocks.6.w2.weight": 84.40488806201412,
        "blocks.7.ln.weight": 1.9035111665725708,
        "blocks.7.w1.weight": 38.65051912560395,
        "blocks.7.w1.bias": 40.760402959190415,
        "blocks.7.w2.weight": 81.97372863530312,
        "out_ln.weight": 0.39740806818008423,
        "out_head.weight": 3.609484615833081,
        "out_head.bias": 0.8344298895862311
      }
    },
    "state_bridge": {
      "log": {
        "train_loss": [
          1.7336509002049765,
          1.5851847206751506,
          1.8742321704864502,
          1.8100628153483074,
          1.5580067304611207
        ],
        "train_acc": [
          0.32705,
          0.3616333333333333,
          0.2679166666666667,
          0.31853333333333333,
          0.4080166666666667
        ],
        "test_acc": [
          0.4036,
          0.4047,
          0.3046,
          0.4005,
          0.4651
        ],
        "state_pred_error": [
          5076234.573784879,
          343992182.36586666,
          517900685.38026667,
          557639895.7226666,
          383439664.5205333
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          0.35149621963500977,
          0.27368226647377014,
          0.045176729559898376,
          0.04587914049625397,
          0.06403794139623642,
          0.06599076837301254,
          0.10026843845844269,
          0.11267217993736267
        ],
        "perturbation_rho": [
          0.37996596097946167,
          0.0075237625278532505,
          -0.017497196793556213,
          0.001783197745680809,
          0.026772135868668556,
          0.011043311096727848,
          0.0037202914245426655,
          0.008577261120080948
        ],
        "nudging": {
          "0.001": [
            -7.0138368755579e-05,
            -1.0319054126739502e-06,
            -6.495974957942963e-08,
            -4.190951585769653e-09,
            -3.3993273973464966e-08,
            -2.2584572434425354e-08,
            -6.123445928096771e-08,
            -4.1443854570388794e-08
          ],
          "0.003": [
            -0.00021021789871156216,
            -3.0745286494493484e-06,
            -1.0547228157520294e-07,
            -4.866160452365875e-08,
            -8.591450750827789e-08,
            -6.938353180885315e-08,
            -1.1292286217212677e-07,
            -9.825453162193298e-08
          ],
          "0.01": [
            -0.0006983885541558266,
            -1.027202233672142e-05,
            -3.688037395477295e-07,
            -1.073349267244339e-07,
            -2.153683453798294e-07,
            -2.0815059542655945e-07,
            -2.6938505470752716e-07,
            -3.08966264128685e-07
          ]
        }
      },
      "drift": {
        "embed.weight": 4.244627827603776,
        "embed.bias": 2.284214237417933,
        "blocks.0.ln.weight": 0.7376585006713867,
        "blocks.0.w1.weight": 10.052587254542228,
        "blocks.0.w1.bias": 12.863219234970343,
        "blocks.0.w2.weight": 32.7856072339516,
        "blocks.1.ln.weight": 0.8459606170654297,
        "blocks.1.w1.weight": 17.10440998330836,
        "blocks.1.w1.bias": 22.587196662115986,
        "blocks.1.w2.weight": 48.94107595877311,
        "blocks.2.ln.weight": 0.5776991248130798,
        "blocks.2.w1.weight": 12.17296546064332,
        "blocks.2.w1.bias": 14.464613959802604,
        "blocks.2.w2.weight": 33.58238884289355,
        "blocks.3.ln.weight": 0.6916943788528442,
        "blocks.3.w1.weight": 11.021146543598332,
        "blocks.3.w1.bias": 11.779720628235973,
        "blocks.3.w2.weight": 25.18170826322489,
        "blocks.4.ln.weight": 0.5363020300865173,
        "blocks.4.w1.weight": 8.488676390390957,
        "blocks.4.w1.bias": 11.968348972417077,
        "blocks.4.w2.weight": 23.562556821259157,
        "blocks.5.ln.weight": 0.749293863773346,
        "blocks.5.w1.weight": 13.199470836216618,
        "blocks.5.w1.bias": 17.384581140704626,
        "blocks.5.w2.weight": 36.38642209120496,
        "blocks.6.ln.weight": 0.45835214853286743,
        "blocks.6.w1.weight": 10.662863447362852,
        "blocks.6.w1.bias": 15.855775302559838,
        "blocks.6.w2.weight": 28.70293410646866,
        "blocks.7.ln.weight": 0.4122738838195801,
        "blocks.7.w1.weight": 7.193545064718527,
        "blocks.7.w1.bias": 7.340520731384394,
        "blocks.7.w2.weight": 22.53669113456487,
        "out_ln.weight": 0.06885236501693726,
        "out_head.weight": 1.473306835980063,
        "out_head.bias": 1.5084479134035678
      }
    },
    "credit_bridge": {
      "log": {
        "train_loss": [
          2.0466531958262126,
          2.2737758037567137,
          2.280587441889445,
          2.25820095837911,
          2.270971960576375
        ],
        "train_acc": [
          0.22976666666666667,
          0.13306666666666667,
          0.13921666666666666,
          0.15853333333333333,
          0.15521666666666667
        ],
        "test_acc": [
          0.1866,
          0.101,
          0.1455,
          0.1616,
          0.0958
        ],
        "value_loss": [
          1.105676996310552,
          0.06329173700014751,
          0.02014747195293506,
          0.01469622576336066,
          0.0050645585257560015
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          -0.04117349535226822,
          0.006370606832206249,
          0.03125208616256714,
          -0.015287259593605995,
          -0.04197325184941292,
          -0.021368175745010376,
          0.009605868719518185,
          0.029422588646411896
        ],
        "perturbation_rho": [
          -0.09283949434757233,
          -0.030718784779310226,
          0.00206748116761446,
          0.0,
          -0.0060626850463449955,
          -0.015737878158688545,
          0.02677903138101101,
          -0.040315717458724976
        ],
        "nudging": {
          "0.001": [
            3.939494490623474e-06,
            -1.4901161193847656e-08,
            0.0,
            0.0,
            0.0,
            0.0,
            0.0,
            0.0
          ],
          "0.003": [
            1.1788681149482727e-05,
            -3.725290298461914e-09,
            1.862645149230957e-09,
            0.0,
            0.0,
            -1.862645149230957e-09,
            1.862645149230957e-09,
            0.0
          ],
          "0.01": [
            3.923662006855011e-05,
            2.60770320892334e-08,
            7.450580596923828e-09,
            -1.862645149230957e-09,
            1.862645149230957e-09,
            1.862645149230957e-09,
            1.862645149230957e-09,
            5.587935447692871e-09
          ]
        }
      },
      "drift": {
        "embed.weight": 5.5176286267072285,
        "embed.bias": 5.84115130180781,
        "blocks.0.ln.weight": 0.7516779899597168,
        "blocks.0.w1.weight": 13.130250396475844,
        "blocks.0.w1.bias": 16.418874968953887,
        "blocks.0.w2.weight": 35.524006089100524,
        "blocks.1.ln.weight": 1.0247337818145752,
        "blocks.1.w1.weight": 24.629494668532566,
        "blocks.1.w1.bias": 31.389502706524333,
        "blocks.1.w2.weight": 66.32116257377548,
        "blocks.2.ln.weight": 1.0405563116073608,
        "blocks.2.w1.weight": 19.820545045709153,
        "blocks.2.w1.bias": 21.04420170821489,
        "blocks.2.w2.weight": 47.599865577930004,
        "blocks.3.ln.weight": 0.698647677898407,
        "blocks.3.w1.weight": 11.782448138509505,
        "blocks.3.w1.bias": 11.300932589985935,
        "blocks.3.w2.weight": 29.52897326429494,
        "blocks.4.ln.weight": 0.7269545197486877,
        "blocks.4.w1.weight": 12.151248949786332,
        "blocks.4.w1.bias": 11.545512427875654,
        "blocks.4.w2.weight": 31.11028303079019,
        "blocks.5.ln.weight": 0.7007301449775696,
        "blocks.5.w1.weight": 10.093534441471926,
        "blocks.5.w1.bias": 8.779689334059729,
        "blocks.5.w2.weight": 24.2612493038314,
        "blocks.6.ln.weight": 0.7457646727561951,
        "blocks.6.w1.weight": 9.34015610077582,
        "blocks.6.w1.bias": 7.819986138941612,
        "blocks.6.w2.weight": 24.326245888357803,
        "blocks.7.ln.weight": 0.7317199110984802,
        "blocks.7.w1.weight": 10.73492434511088,
        "blocks.7.w1.bias": 9.150645079981764,
        "blocks.7.w2.weight": 27.11222424242763,
        "out_ln.weight": 0.07713422179222107,
        "out_head.weight": 1.4131541672079744,
        "out_head.bias": 0.7976411656775528
      }
    }
  },
  "config": {
    "dataset": "fashionmnist",
    "d_hidden": 256,
    "num_blocks": 8,
    "batch_size": 128,
    "epochs": 5,
    "lr": 0.001,
    "lr_fb": 0.001,
    "wd": 0.01,
    "lam": 0.1,
    "K": 4,
    "sigma_bridge": 0.05,
    "ema_momentum": 0.995,
    "term_grad_weight": 1.0,
    "seeds": [
      42
    ],
    "gpu": 0,
    "output_dir": "results/smoke_test",
    "num_classes": 10
  }
}