summaryrefslogtreecommitdiff
path: root/results/round38_cb_penalty_30ep_s456/results_cifar10.json
blob: 50e9f4bee05246f7dde9ef150a9405c4194348ff (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
{
  "456": {
    "credit_bridge": {
      "log": {
        "train_loss": [
          1.9934451489257812,
          1.9314295723724366,
          1.9235225268173217,
          1.9217069106292726,
          1.9212194289398192,
          1.916630177383423,
          1.9345502002716064,
          1.9283877908325195,
          1.9177326504898071,
          1.9165373708343505,
          1.9105737041854858,
          1.8997189542388917,
          1.891296152076721,
          1.8811385650253296,
          1.8842703173446655,
          1.8762526668930053,
          1.8802709610366821,
          1.8837381246566773,
          1.8947839934921265,
          1.8876838129425049,
          1.878063057937622,
          1.8691059185791015,
          1.8723352920913696,
          1.8673814739990235,
          1.86444116481781,
          1.8651199575424193,
          1.8679865084838867,
          1.8683458470916747,
          1.8682409041595458,
          1.8695441330337523
        ],
        "train_acc": [
          0.27654,
          0.30874,
          0.31612,
          0.3179,
          0.31686,
          0.31922,
          0.314,
          0.31612,
          0.31764,
          0.3182,
          0.31802,
          0.3238,
          0.33024,
          0.33216,
          0.33292,
          0.33354,
          0.33402,
          0.33356,
          0.33096,
          0.33232,
          0.33684,
          0.33706,
          0.33616,
          0.34138,
          0.3399,
          0.34038,
          0.34008,
          0.34048,
          0.33706,
          0.341
        ],
        "test_acc": [
          0.3431,
          0.3495,
          0.3477,
          0.356,
          0.3511,
          0.3474,
          0.3323,
          0.3466,
          0.3508,
          0.3451,
          0.341,
          0.3566,
          0.3514,
          0.3453,
          0.3491,
          0.3525,
          0.3464,
          0.3496,
          0.3429,
          0.3456,
          0.343,
          0.3448,
          0.3481,
          0.3549,
          0.3545,
          0.354,
          0.3557,
          0.355,
          0.3562,
          0.3562
        ],
        "value_loss": [
          0.6358358229446411,
          0.20003649864196776,
          0.1189081085062027,
          0.0873355598807335,
          0.07387620919823647,
          0.06212632877349854,
          0.09646473777532577,
          0.08277876357793808,
          0.06577274338841438,
          0.05903506823539734,
          0.060327464895248414,
          0.0471712444293499,
          0.05392980309844017,
          0.04334379373788834,
          0.04389793854594231,
          0.04077757358431816,
          0.03543120482087135,
          0.03244814622402191,
          0.03196794641435146,
          0.02516974647641182,
          0.018719528279304506,
          0.019053550893962382,
          0.019475930092334746,
          0.01711861621081829,
          0.015539742150306702,
          0.018024257761240007,
          0.01626725864171982,
          0.016166514835059643,
          0.015814910601973535,
          0.015810824376344682
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          0.6528493165969849,
          0.6737558841705322,
          0.6874117851257324,
          0.6945056915283203
        ],
        "perturbation_rho": [
          0.45550960302352905,
          0.4658626317977905,
          0.4093303084373474,
          0.44921162724494934
        ],
        "nudging": {
          "0.001": [
            -4.855693259742111e-05,
            -4.6262473915703595e-05,
            -4.405167419463396e-05,
            -4.2281331843696535e-05
          ],
          "0.003": [
            -0.00014562674914486706,
            -0.0001387652737321332,
            -0.00013202497211750597,
            -0.00012669814168475568
          ],
          "0.01": [
            -0.00048537791008129716,
            -0.00046242878306657076,
            -0.00043993344297632575,
            -0.00042223266791552305
          ]
        },
        "hidden_norms_per_layer": [
          5652.72998046875,
          5664.4931640625,
          5686.38916015625,
          5758.30419921875,
          5775.17431640625
        ],
        "bp_grad_norms_per_layer": [
          2.290221891598776e-05,
          2.191648854932282e-05,
          2.0994630176573992e-05,
          2.07327520911349e-05,
          2.0050258171977475e-05
        ]
      },
      "drift": {
        "embed.weight": 47.17655243675414,
        "embed.bias": 69.22157757464541,
        "blocks.0.ln.weight": 0.30546510219573975,
        "blocks.0.w1.weight": 3.9210619545041143,
        "blocks.0.w1.bias": 5.970693807323712,
        "blocks.0.w2.weight": 18.22592321226308,
        "blocks.1.ln.weight": 0.29675590991973877,
        "blocks.1.w1.weight": 3.7748035547298446,
        "blocks.1.w1.bias": 5.95370365502356,
        "blocks.1.w2.weight": 18.273244666485375,
        "blocks.2.ln.weight": 0.29545143246650696,
        "blocks.2.w1.weight": 3.797978708503024,
        "blocks.2.w1.bias": 6.318915016989016,
        "blocks.2.w2.weight": 18.715277379402863,
        "blocks.3.ln.weight": 0.29928261041641235,
        "blocks.3.w1.weight": 3.9126807823570937,
        "blocks.3.w1.bias": 6.287240256219296,
        "blocks.3.w2.weight": 18.91014036108483,
        "out_ln.weight": 0.10117902606725693,
        "out_head.weight": 2.2020174609192082,
        "out_head.bias": 2.0786513163395623
      }
    }
  },
  "config": {
    "dataset": "cifar10",
    "d_hidden": 256,
    "num_blocks": 4,
    "batch_size": 128,
    "epochs": 30,
    "lr": 0.001,
    "lr_fb": 0.001,
    "wd": 0.01,
    "lam": 0.1,
    "K": 4,
    "sigma_bridge": 0.05,
    "ema_momentum": 0.995,
    "term_grad_weight": 1.0,
    "seeds": [
      456
    ],
    "gpu": 0,
    "output_dir": "results/round38_cb_penalty_30ep_s456",
    "methods": [
      "credit_bridge"
    ],
    "random_targets": false,
    "penalty_lam": 0.01,
    "num_classes": 10
  }
}