summaryrefslogtreecommitdiff
path: root/results/round38_cb_penalty_30ep_s123/results_cifar10.json
blob: ae68c960ffb6bb8fff028b5daacf5abf528a2cb3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
{
  "123": {
    "credit_bridge": {
      "log": {
        "train_loss": [
          1.9903950632476806,
          1.9436892071533203,
          1.9378673068237304,
          1.9346954096221924,
          1.9363043911361695,
          1.9327283626937866,
          1.9476709210586547,
          1.9389762512588502,
          1.9266566958236695,
          1.919404111404419,
          1.9120563073730468,
          1.9111018649291993,
          1.9005808422088624,
          1.8967266842269896,
          1.8907416219329833,
          1.882234052658081,
          1.8722203524017333,
          1.8694015215301514,
          1.8656991873168944,
          1.8682857693862915,
          1.8697387396621703,
          1.8678798027801513,
          1.8690597088241576,
          1.8677466773223876,
          1.871109571685791,
          1.8732738525009156,
          1.8745700274658204,
          1.8710524578094483,
          1.8755342425155639,
          1.8727011511993408
        ],
        "train_acc": [
          0.28218,
          0.30712,
          0.31004,
          0.3135,
          0.31522,
          0.31594,
          0.31198,
          0.31488,
          0.31484,
          0.32026,
          0.32228,
          0.32102,
          0.32762,
          0.32718,
          0.33116,
          0.33436,
          0.33864,
          0.33738,
          0.34008,
          0.34056,
          0.34068,
          0.34044,
          0.34202,
          0.34188,
          0.34192,
          0.34224,
          0.3414,
          0.343,
          0.34144,
          0.34402
        ],
        "test_acc": [
          0.3362,
          0.3403,
          0.3354,
          0.3262,
          0.3373,
          0.3421,
          0.3428,
          0.349,
          0.3517,
          0.3491,
          0.353,
          0.347,
          0.3444,
          0.3545,
          0.3505,
          0.3617,
          0.3671,
          0.363,
          0.3697,
          0.3615,
          0.3623,
          0.3666,
          0.3608,
          0.3692,
          0.3652,
          0.3677,
          0.3652,
          0.3645,
          0.364,
          0.3642
        ],
        "value_loss": [
          0.6501392752981185,
          0.19012001507282258,
          0.1075794908285141,
          0.07698172752141952,
          0.06917850073337554,
          0.05796519654870033,
          0.10017188906908035,
          0.06868275530338287,
          0.06073615624547005,
          0.05232048670530319,
          0.045059604372978214,
          0.04662440485239029,
          0.04121920494437218,
          0.044443060465455056,
          0.04122906471073628,
          0.03664021657347679,
          0.03124810820043087,
          0.0269432488912344,
          0.02596988540112972,
          0.024900869569778442,
          0.02048479182034731,
          0.018211499471366407,
          0.0170548377931118,
          0.01694579794406891,
          0.01826157638669014,
          0.014401317476630211,
          0.014872411508262157,
          0.010797930763959884,
          0.01634573257163167,
          0.01106238992586732
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          0.6450029015541077,
          0.6589623689651489,
          0.6671799421310425,
          0.6754908561706543
        ],
        "perturbation_rho": [
          0.3963339030742645,
          0.4112011194229126,
          0.4508204460144043,
          0.49511781334877014
        ],
        "nudging": {
          "0.001": [
            -4.538437133305706e-05,
            -4.164675556239672e-05,
            -3.897584610967897e-05,
            -3.720284075825475e-05
          ],
          "0.003": [
            -0.00013614483759738505,
            -0.00012491861707530916,
            -0.00011692544649122283,
            -0.00011161504517076537
          ],
          "0.01": [
            -0.00045391899766400456,
            -0.00041642854921519756,
            -0.00038977732765488327,
            -0.00037192515446804464
          ]
        },
        "hidden_norms_per_layer": [
          5795.3388671875,
          5812.16650390625,
          5825.60498046875,
          5806.94384765625,
          5834.41455078125
        ],
        "bp_grad_norms_per_layer": [
          2.1459092749864794e-05,
          2.0404753740876913e-05,
          1.9721255739568733e-05,
          1.843643985921517e-05,
          1.812805021472741e-05
        ]
      },
      "drift": {
        "embed.weight": 47.265920858379104,
        "embed.bias": 64.03327510119414,
        "blocks.0.ln.weight": 0.31550925970077515,
        "blocks.0.w1.weight": 3.9393207442198896,
        "blocks.0.w1.bias": 7.116536540852231,
        "blocks.0.w2.weight": 18.565318744639406,
        "blocks.1.ln.weight": 0.3102896213531494,
        "blocks.1.w1.weight": 3.814831040782521,
        "blocks.1.w1.bias": 7.074615401132259,
        "blocks.1.w2.weight": 18.672674667307152,
        "blocks.2.ln.weight": 0.32316333055496216,
        "blocks.2.w1.weight": 3.901017267398649,
        "blocks.2.w1.bias": 6.366350200102534,
        "blocks.2.w2.weight": 19.721825160296877,
        "blocks.3.ln.weight": 0.2990249991416931,
        "blocks.3.w1.weight": 4.002164431729751,
        "blocks.3.w1.bias": 5.90919777616421,
        "blocks.3.w2.weight": 21.568416770540885,
        "out_ln.weight": 0.09184015542268753,
        "out_head.weight": 2.070435355745074,
        "out_head.bias": 1.855754764316957
      }
    }
  },
  "config": {
    "dataset": "cifar10",
    "d_hidden": 256,
    "num_blocks": 4,
    "batch_size": 128,
    "epochs": 30,
    "lr": 0.001,
    "lr_fb": 0.001,
    "wd": 0.01,
    "lam": 0.1,
    "K": 4,
    "sigma_bridge": 0.05,
    "ema_momentum": 0.995,
    "term_grad_weight": 1.0,
    "seeds": [
      123
    ],
    "gpu": 0,
    "output_dir": "results/round38_cb_penalty_30ep_s123",
    "methods": [
      "credit_bridge"
    ],
    "random_targets": false,
    "penalty_lam": 0.01,
    "num_classes": 10
  }
}