diff options
Diffstat (limited to 'results/round38_sbcb_baseline_30ep/results_cifar10.json')
| -rw-r--r-- | results/round38_sbcb_baseline_30ep/results_cifar10.json | 437 |
1 files changed, 437 insertions, 0 deletions
diff --git a/results/round38_sbcb_baseline_30ep/results_cifar10.json b/results/round38_sbcb_baseline_30ep/results_cifar10.json new file mode 100644 index 0000000..4375072 --- /dev/null +++ b/results/round38_sbcb_baseline_30ep/results_cifar10.json @@ -0,0 +1,437 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.1615624513244627, + 2.201089162750244, + 2.182833108444214, + 2.1709032915496826, + 2.1161820389556887, + 2.2302013398742675, + 2.1329537266540526, + 2.10827269241333, + 2.0998276640319826, + 2.083012378692627, + 2.102786566772461, + 2.106615118637085, + 2.0964282553863525, + 2.0857217935943604, + 2.0992775797271728, + 2.0625892084503175, + 2.0862051232147216, + 2.1001052409362795, + 2.094951697998047, + 2.0933474546813966, + 2.0933452713775633, + 2.08693749671936, + 2.0883480770874026, + 2.086935211029053, + 2.0861202153015137, + 2.0841029391479493, + 2.082290132446289, + 2.0792110958099363, + 2.0804510121154784, + 2.081232653427124 + ], + "train_acc": [ + 0.19528, + 0.1606, + 0.17582, + 0.16834, + 0.18852, + 0.1556, + 0.17988, + 0.18368, + 0.19014, + 0.19926, + 0.19686, + 0.1923, + 0.1981, + 0.20012, + 0.19082, + 0.2146, + 0.20116, + 0.18934, + 0.19132, + 0.19428, + 0.18736, + 0.1931, + 0.19568, + 0.19958, + 0.20248, + 0.20444, + 0.2046, + 0.2062, + 0.20122, + 0.20856 + ], + "test_acc": [ + 0.2011, + 0.1577, + 0.176, + 0.1994, + 0.1896, + 0.1661, + 0.1688, + 0.181, + 0.1939, + 0.1873, + 0.1878, + 0.2058, + 0.2082, + 0.1967, + 0.2019, + 0.2005, + 0.1949, + 0.1854, + 0.1759, + 0.1734, + 0.1868, + 0.1995, + 0.1949, + 0.2007, + 0.2077, + 0.2085, + 0.2109, + 0.2079, + 0.2132, + 0.2126 + ], + "state_pred_error": [ + 0.3881664722061157, + 0.5467375702285766, + 0.4459853865337372, + 0.21270744318962098, + 0.2084006814146042, + 0.1407120229911804, + 0.19075847319602968, + 0.1764928385257721, + 0.10211428045988083, + 0.07563618842363358, + 0.05846105343937874, + 0.03846761897563934, + 0.03369148607134819, + 0.022906817595362665, + 0.015594833841919899, + 0.007780850533694029, + 0.005383170440495014, + 0.00387467138633132, + 0.0025940868555754423, + 0.0021150133569538595, + 0.001786851437687874, + 0.0014581093015894294, + 0.0012195721989311278, + 0.001029884922001511, + 0.0009008185034245252, + 0.0008114725712127983, + 0.0007245114441029728, + 0.0006559462931565941, + 0.0006020296776108444, + 0.0005471098060533404 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.2372891902923584, + 0.12591305375099182, + 0.1843540072441101, + 0.28460749983787537 + ], + "perturbation_rho": [ + 0.5516304969787598, + 0.003948327153921127, + -0.007016957737505436, + 0.0 + ], + "nudging": { + "0.001": [ + -1.981109380722046e-05, + -8.381903171539307e-09, + 0.0, + 0.0 + ], + "0.003": [ + -5.944725126028061e-05, + -1.862645149230957e-09, + 0.0, + 0.0 + ], + "0.01": [ + -0.00019809138029813766, + -1.862645149230957e-08, + 3.725290298461914e-09, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 695.4109497070312, + 561166.6875, + 5258578.5, + 12430880.0, + 9851606.0 + ], + "bp_grad_norms_per_layer": [ + 1.0803730219777208e-05, + 1.284981632210247e-08, + 9.346035056978508e-09, + 9.320208604890468e-09, + 9.30139343324754e-09 + ] + }, + "drift": { + "embed.weight": 10.683279498765518, + "embed.bias": 16.186979717078597, + "blocks.0.ln.weight": 1.8698891401290894, + "blocks.0.w1.weight": 34.012515230994815, + "blocks.0.w1.bias": 46.85058602976643, + "blocks.0.w2.weight": 124.44356621058887, + "blocks.1.ln.weight": 1.7833274602890015, + "blocks.1.w1.weight": 48.03603598766101, + "blocks.1.w1.bias": 58.602063412195584, + "blocks.1.w2.weight": 123.88140584500592, + "blocks.2.ln.weight": 2.2544941902160645, + "blocks.2.w1.weight": 66.40401175683013, + "blocks.2.w1.bias": 63.25326651988191, + "blocks.2.w2.weight": 127.01673478324264, + "blocks.3.ln.weight": 1.7423062324523926, + "blocks.3.w1.weight": 37.248001175030076, + "blocks.3.w1.bias": 38.949358252268084, + "blocks.3.w2.weight": 101.10015971156598, + "out_ln.weight": 0.1668696403503418, + "out_head.weight": 1.4905390969722283, + "out_head.bias": 1.6423172242266484 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.039658761978149, + 2.0134409933471678, + 2.00583283241272, + 2.009486458129883, + 2.008044157333374, + 2.0073662790679934, + 2.0122061133575437, + 2.040649677429199, + 2.0651579305267336, + 2.0854766065979002, + 2.099567792701721, + 2.1041016172790528, + 2.111146937561035, + 2.0936275885772706, + 2.100649955825806, + 2.1145339432525634, + 2.1261457512664794, + 2.134411395187378, + 2.138650359802246, + 2.1414046758270264, + 2.1410846240997317, + 2.140825333404541, + 2.1406545039367675, + 2.1377127909851072, + 2.138584699020386, + 2.1371214043426514, + 2.137926218109131, + 2.134101504898071, + 2.1338819580078123, + 2.134741836090088 + ], + "train_acc": [ + 0.25218, + 0.26698, + 0.27004, + 0.26836, + 0.26838, + 0.26756, + 0.26486, + 0.2526, + 0.24742, + 0.23242, + 0.22372, + 0.2182, + 0.2176, + 0.21986, + 0.21266, + 0.2051, + 0.19802, + 0.1941, + 0.1906, + 0.18834, + 0.19216, + 0.19062, + 0.1907, + 0.19222, + 0.19358, + 0.19584, + 0.1945, + 0.19384, + 0.19432, + 0.19732 + ], + "test_acc": [ + 0.2777, + 0.2762, + 0.2822, + 0.3004, + 0.3017, + 0.2837, + 0.2964, + 0.2601, + 0.2555, + 0.2308, + 0.2401, + 0.2235, + 0.1973, + 0.2062, + 0.1917, + 0.232, + 0.2137, + 0.19, + 0.182, + 0.1824, + 0.1929, + 0.191, + 0.1938, + 0.2015, + 0.2114, + 0.2172, + 0.2056, + 0.2037, + 0.2205, + 0.2105 + ], + "value_loss": [ + 0.4988088236522675, + 0.10717420438051224, + 0.08406411410808563, + 0.06901271151542664, + 0.05796313747167587, + 0.04655733848810196, + 0.043197430835962294, + 0.04390601473927498, + 0.036221856105923655, + 0.03994749122738838, + 0.038669472066164015, + 0.03699167508423328, + 0.0456404883146286, + 0.026927970384061337, + 0.02069880782365799, + 0.01933776231765747, + 0.02080854148507118, + 0.016443329193592073, + 0.013170968658924103, + 0.012027110563218594, + 0.00889115786999464, + 0.0077953302666544915, + 0.005822759210169315, + 0.004206860280707479, + 0.003205367206633091, + 0.0018577339798584581, + 0.0014363039807975292, + 0.001063295077085495, + 0.0008753935668803751, + 0.000745832763761282 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.17070117592811584, + 0.12735798954963684, + 0.21822263300418854, + 0.2762623727321625 + ], + "perturbation_rho": [ + 0.021132776513695717, + -0.006791723892092705, + 0.0, + 0.023015428334474564 + ], + "nudging": { + "0.001": [ + -7.441267371177673e-07, + -1.5925616025924683e-07, + 0.0, + 0.0 + ], + "0.003": [ + -2.280808985233307e-06, + -5.373731255531311e-07, + 0.0, + 0.0 + ], + "0.01": [ + -7.669441401958466e-06, + -1.7955899238586426e-06, + 0.0, + 1.862645149230957e-09 + ] + }, + "hidden_norms_per_layer": [ + 7008.69921875, + 7480314.5, + 66006552.0, + 65819076.0, + 67016280.0 + ], + "bp_grad_norms_per_layer": [ + 9.282441055802337e-07, + 5.1517807797551995e-09, + 4.764760141995339e-09, + 4.764532768319896e-09, + 4.767270578298621e-09 + ] + }, + "drift": { + "embed.weight": 55.317448573929425, + "embed.bias": 47.56034585553186, + "blocks.0.ln.weight": 4.106407642364502, + "blocks.0.w1.weight": 67.89937919497739, + "blocks.0.w1.bias": 55.34124320193868, + "blocks.0.w2.weight": 132.61316975770185, + "blocks.1.ln.weight": 3.4333691596984863, + "blocks.1.w1.weight": 109.26717483313107, + "blocks.1.w1.bias": 120.3421088832556, + "blocks.1.w2.weight": 196.69358325668478, + "blocks.2.ln.weight": 2.4557623863220215, + "blocks.2.w1.weight": 55.033274573984386, + "blocks.2.w1.bias": 54.84317146947108, + "blocks.2.w2.weight": 98.576185000917, + "blocks.3.ln.weight": 2.2460579872131348, + "blocks.3.w1.weight": 51.81531440048247, + "blocks.3.w1.bias": 53.49338639187709, + "blocks.3.w2.weight": 92.14827023111492, + "out_ln.weight": 0.22502917051315308, + "out_head.weight": 2.8997412886471703, + "out_head.bias": 0.4396077262245561 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/round38_sbcb_baseline_30ep", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
