summaryrefslogtreecommitdiff
path: root/results/round38_sb_penalty_30ep_s123/results_cifar10.json
blob: 09d7c81935a52d06716de3c683ea9873bd8c4790 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
{
  "123": {
    "state_bridge": {
      "log": {
        "train_loss": [
          2.0394552979278564,
          1.907211668624878,
          1.8378597689056397,
          1.8050992700958253,
          1.782720252342224,
          1.7607325444793702,
          1.7526287609481812,
          1.7301886476898194,
          1.7114346005249024,
          1.7017147624969482,
          1.6891529846572877,
          1.6735555848693848,
          1.6678473961639404,
          1.6606992713165283,
          1.6562059018707276,
          1.6442966329956055,
          1.6339350330352784,
          1.637065968284607,
          1.6251955394744872,
          1.6232860974502563,
          1.62067741481781,
          1.6153102271270752,
          1.6100856274032593,
          1.6128213213348388,
          1.6058022644805907,
          1.6015477989959717,
          1.6040523609161377,
          1.6024808090591431,
          1.5986408697128296,
          1.5955050112533569
        ],
        "train_acc": [
          0.2546,
          0.31232,
          0.3415,
          0.35616,
          0.36698,
          0.37548,
          0.3775,
          0.38916,
          0.39518,
          0.40052,
          0.40288,
          0.40992,
          0.4117,
          0.4142,
          0.41554,
          0.42002,
          0.42486,
          0.42292,
          0.42918,
          0.4291,
          0.4284,
          0.4346,
          0.4362,
          0.43588,
          0.44048,
          0.44034,
          0.43952,
          0.43918,
          0.44066,
          0.4431
        ],
        "test_acc": [
          0.3128,
          0.3548,
          0.3591,
          0.378,
          0.3826,
          0.3814,
          0.4011,
          0.4028,
          0.404,
          0.4254,
          0.4276,
          0.4332,
          0.4345,
          0.4356,
          0.4316,
          0.4384,
          0.4423,
          0.4425,
          0.4369,
          0.4439,
          0.4447,
          0.4442,
          0.4483,
          0.452,
          0.453,
          0.453,
          0.4498,
          0.4524,
          0.4513,
          0.4514
        ],
        "state_pred_error": [
          0.2664960029602051,
          0.17006848256111146,
          0.1373988006401062,
          0.13497620005130767,
          0.1264824439716339,
          0.11186170087099076,
          0.10831025877714157,
          0.10117165217876434,
          0.0942336485338211,
          0.09043296098470688,
          0.08660082973480225,
          0.08747579972743988,
          0.07973947757720948,
          0.07509488174915313,
          0.07382626082420349,
          0.07346862325191497,
          0.07132561764001846,
          0.07077178321242332,
          0.06908800168275833,
          0.06767414944648743,
          0.06569002504706382,
          0.062389732856750486,
          0.05864977328658104,
          0.05680723578810692,
          0.053985064004659654,
          0.05206361443519592,
          0.0498943436563015,
          0.047763368364572525,
          0.04550520754933357,
          0.043678019300699235
        ]
      },
      "diagnostics": {
        "bp_cosine": [
          0.42979174852371216,
          0.37390586733818054,
          0.32618582248687744,
          0.28139200806617737
        ],
        "perturbation_rho": [
          0.5135085582733154,
          0.5129182934761047,
          0.38893166184425354,
          0.37062373757362366
        ],
        "nudging": {
          "0.001": [
            -0.0003920057788491249,
            -0.00025207665748894215,
            -0.00018884101882576942,
            -0.00014588376507163048
          ],
          "0.003": [
            -0.001175526063889265,
            -0.0007562476675957441,
            -0.000566466711461544,
            -0.00043755793012678623
          ],
          "0.01": [
            -0.003914414905011654,
            -0.002520129084587097,
            -0.0018878313712775707,
            -0.0014582867734134197
          ]
        },
        "hidden_norms_per_layer": [
          231.49375915527344,
          238.22596740722656,
          252.5166473388672,
          278.00189208984375,
          310.919189453125
        ],
        "bp_grad_norms_per_layer": [
          0.000271676923148334,
          0.00023371262068394572,
          0.00020241527818143368,
          0.000180525952600874,
          0.00017415167530998588
        ]
      },
      "drift": {
        "embed.weight": 6.87082720778762,
        "embed.bias": 27.93003811703859,
        "blocks.0.ln.weight": 0.1618085354566574,
        "blocks.0.w1.weight": 3.191546927288011,
        "blocks.0.w1.bias": 6.668010298438182,
        "blocks.0.w2.weight": 15.615942220294206,
        "blocks.1.ln.weight": 0.12653203308582306,
        "blocks.1.w1.weight": 3.159400666127824,
        "blocks.1.w1.bias": 7.198150324919049,
        "blocks.1.w2.weight": 14.61006448474005,
        "blocks.2.ln.weight": 0.1170191541314125,
        "blocks.2.w1.weight": 3.2969716684544164,
        "blocks.2.w1.bias": 7.019388383996979,
        "blocks.2.w2.weight": 15.258183997524307,
        "blocks.3.ln.weight": 0.11643991619348526,
        "blocks.3.w1.weight": 3.5673772866278055,
        "blocks.3.w1.bias": 6.951775133615225,
        "blocks.3.w2.weight": 15.726364417935486,
        "out_ln.weight": 0.21612103283405304,
        "out_head.weight": 1.2186449227295404,
        "out_head.bias": 1.8007506807173053
      }
    }
  },
  "config": {
    "dataset": "cifar10",
    "d_hidden": 256,
    "num_blocks": 4,
    "batch_size": 128,
    "epochs": 30,
    "lr": 0.001,
    "lr_fb": 0.001,
    "wd": 0.01,
    "lam": 0.1,
    "K": 4,
    "sigma_bridge": 0.05,
    "ema_momentum": 0.995,
    "term_grad_weight": 1.0,
    "seeds": [
      123
    ],
    "gpu": 0,
    "output_dir": "results/round38_sb_penalty_30ep_s123",
    "methods": [
      "state_bridge"
    ],
    "random_targets": false,
    "penalty_lam": 0.01,
    "num_classes": 10
  }
}