{ "456": { "bp": { "log": { "train_loss": [ 3.9721967333221437, 3.6422341596221925, 3.48317311088562, 3.384400603027344, 3.3024317309570312, 3.244081290435791, 3.1941285145568847, 3.1515661222839357, 3.110703917541504, 3.0678702397155764, 3.0385052178955076, 3.0125491227722168, 2.9755833444976805, 2.9489572755432127, 2.922896576004028, 2.8952785552215574, 2.8644921349334718, 2.837543485031128, 2.815750347290039, 2.7902291624450686, 2.7643565017700196, 2.749027015914917, 2.7195132698059084, 2.7054608350372313, 2.678812169647217, 2.655367773590088, 2.6455082903289795, 2.621019700469971, 2.6011389213562013, 2.592018772201538, 2.563096626586914, 2.5475857734680174, 2.5312666052246096, 2.507406205291748, 2.4910193432617187, 2.4760341359710694, 2.463254167022705, 2.443411533126831, 2.4220050102996824, 2.4045714128875733, 2.3885920139312744, 2.3683135289001465, 2.35701943649292, 2.339880431365967, 2.3229517127990724, 2.307848415145874, 2.2967623091125486, 2.277586201171875, 2.2599157135009764, 2.2420585137939453, 2.2226363661193846, 2.211539700012207, 2.1965325047302247, 2.181053132362366, 2.1636188303375246, 2.148667406234741, 2.1403865797424317, 2.118398011932373, 2.1047801040649414, 2.090780695877075, 2.0796419092178344, 2.0641602599716187, 2.046349721298218, 2.034338469238281, 2.0246941263580323, 2.010717328338623, 1.9879577135848998, 1.9908112752532958, 1.9648436877822877, 1.9547819673156739, 1.942468291015625, 1.9376066028594972, 1.9182865232086181, 1.9184452313232423, 1.9024611935424804, 1.8942070873641967, 1.8815567203521728, 1.8690018142318725, 1.8623281653213501, 1.8579870316314697, 1.8522963430404662, 1.836771893234253, 1.8371977347564696, 1.8297668377685548, 1.822632707901001, 1.8128088718032838, 1.8157146021270751, 1.8022041482162476, 1.8005397263336183, 1.80292332862854, 1.7940929901504516, 1.7858528171539307, 1.7898485187149047, 1.7881443228149414, 1.7818482210540771, 1.776848041419983, 1.7760994798278809, 1.7772335396957397, 1.7761591400146484, 1.7769086535644532 ], "train_acc": [ 0.09778, 0.1434, 0.17072, 0.18902, 0.20188, 0.21248, 0.22264, 0.22896, 0.23846, 0.24332, 0.2513, 0.25484, 0.26372, 0.26734, 0.27242, 0.27908, 0.2835, 0.28882, 0.29154, 0.29834, 0.30224, 0.30392, 0.31194, 0.3125, 0.31934, 0.32328, 0.32578, 0.3307, 0.33552, 0.33738, 0.34074, 0.34822, 0.3489, 0.35476, 0.35714, 0.3598, 0.36264, 0.3679, 0.373, 0.37474, 0.37926, 0.38364, 0.38482, 0.38824, 0.3921, 0.39568, 0.39682, 0.4015, 0.4051, 0.40902, 0.41356, 0.41618, 0.42064, 0.4233, 0.42546, 0.42778, 0.43316, 0.4337, 0.4397, 0.442, 0.44436, 0.45016, 0.4521, 0.45792, 0.45892, 0.4619, 0.46716, 0.46476, 0.47062, 0.475, 0.4752, 0.47938, 0.48198, 0.48142, 0.48788, 0.49032, 0.49212, 0.49664, 0.49638, 0.4973, 0.4982, 0.5018, 0.5012, 0.50402, 0.50828, 0.512, 0.50698, 0.51086, 0.51272, 0.5128, 0.51364, 0.5147, 0.51322, 0.51572, 0.51924, 0.51582, 0.52014, 0.51688, 0.519, 0.51792 ], "test_acc": [ 0.1436, 0.1724, 0.1976, 0.2161, 0.2193, 0.2286, 0.2386, 0.2425, 0.2508, 0.2496, 0.2572, 0.2667, 0.2678, 0.266, 0.2744, 0.2762, 0.278, 0.277, 0.2819, 0.2857, 0.2884, 0.2924, 0.2971, 0.2938, 0.2967, 0.2984, 0.2994, 0.2987, 0.3023, 0.3018, 0.3005, 0.3058, 0.3086, 0.3118, 0.3122, 0.317, 0.3139, 0.3083, 0.3131, 0.3166, 0.3193, 0.3185, 0.318, 0.3176, 0.319, 0.3176, 0.3157, 0.3158, 0.3241, 0.3165, 0.3253, 0.3217, 0.3224, 0.3244, 0.3217, 0.3181, 0.3206, 0.3261, 0.3208, 0.3204, 0.3198, 0.324, 0.322, 0.3227, 0.3184, 0.3193, 0.323, 0.3233, 0.3254, 0.3202, 0.3196, 0.3251, 0.3243, 0.3247, 0.3209, 0.3245, 0.3267, 0.322, 0.3224, 0.3177, 0.3213, 0.3196, 0.3218, 0.3207, 0.3219, 0.3223, 0.3244, 0.3202, 0.3248, 0.3217, 0.3236, 0.3228, 0.3211, 0.3231, 0.3222, 0.3215, 0.3217, 0.3216, 0.3217, 0.3219 ] }, "diagnostics": { "bp_cosine": [ 1.0, 1.0, 1.0, 1.0 ], "perturbation_rho": [ 0.9977043271064758, 0.9984360337257385, 0.9986849427223206, 0.998687744140625 ], "nudging": { "0.001": [ -0.0023326585069298744, -0.0024166624061763287, -0.002438523806631565, -0.002317411359399557 ], "0.003": [ -0.006994417868554592, -0.007245808374136686, -0.007311580237001181, -0.0069488403387367725 ], "0.01": [ -0.023275790736079216, -0.024107107892632484, -0.02432604506611824, -0.023123476654291153 ] }, "hidden_norms_per_layer": [ 233.81195068359375, 216.790283203125, 197.1819305419922, 192.0648956298828, 192.4108123779297 ], "bp_grad_norms_per_layer": [ 0.0011535885278135538, 0.0012452645460143685, 0.0012428142363205552, 0.0011899643577635288, 0.0009729627054184675 ] }, "drift": { "embed.weight": 7.39398977590873, "embed.bias": 12.21138556118351, "blocks.0.ln.weight": 0.14770954847335815, "blocks.0.w1.weight": 3.60408439890455, "blocks.0.w1.bias": 5.22994684696013, "blocks.0.w2.weight": 13.053238719433654, "blocks.1.ln.weight": 0.2946910560131073, "blocks.1.w1.weight": 4.020628252632815, "blocks.1.w1.bias": 4.08986730586542, "blocks.1.w2.weight": 14.948894323523715, "blocks.2.ln.weight": 0.3565492630004883, "blocks.2.w1.weight": 4.131160512042399, "blocks.2.w1.bias": 4.003626979292673, "blocks.2.w2.weight": 15.902707284756408, "blocks.3.ln.weight": 0.5485884547233582, "blocks.3.w1.weight": 4.454943236812576, "blocks.3.w1.bias": 3.7282169522367608, "blocks.3.w2.weight": 17.516109303089266, "out_ln.weight": 0.14718063175678253, "out_head.weight": 2.8761547030079035, "out_head.bias": 2.9449926838807814 } }, "dfa": { "log": { "train_loss": [ 4.161876879730225, 4.0187293235778805, 4.006406578216553, 4.022609137268066, 4.043629914093017, 4.065061766357422, 4.069896491699219, 4.078123603668213, 4.078062142028808, 4.077979364929199, 4.076888464050293, 4.075497508239746, 4.072547879943848, 4.0701713494110106, 4.069026535797119, 4.064811604537964, 4.061763154296875, 4.060759606628418, 4.057107001800537, 4.0601828897094725, 4.055534585723877, 4.054944921569824, 4.051256662597656, 4.050451954650879, 4.050393276824951, 4.046223313903808, 4.047258992919922, 4.047048767089843, 4.044600559692383, 4.0430317344665525, 4.043368485031128, 4.043571725158691, 4.04141174987793, 4.0433316299438475, 4.041590490188598, 4.042222282104492, 4.039775361480713, 4.0390912678527835, 4.040217839660644, 4.039096583099365, 4.040037224197388, 4.037792987365723, 4.037555375213623, 4.0370241506958005, 4.036846955261231, 4.037261250762939, 4.036293372497559, 4.036143635406495, 4.036682392578125, 4.037161629333496, 4.033746524200439, 4.0374753099060054, 4.035349784240722, 4.037173667144775, 4.0371518122863765, 4.035486927947998, 4.036137412185669, 4.036821200714112, 4.035519530792237, 4.035781366424561, 4.034954352722168, 4.03612970993042, 4.036103559722901, 4.03622392074585, 4.035975666046142, 4.036468890686035, 4.0351540557861325, 4.035398180618286, 4.034821971435547, 4.0340077725219725, 4.0375495939636235, 4.034684106140137, 4.034154214782715, 4.032997749557495, 4.033953489532471, 4.034259751586914, 4.034655684280396, 4.0341955810546875, 4.032625467605591, 4.033415794677734, 4.0320995791625975, 4.034218223724365, 4.033138923187256, 4.03524599899292, 4.03208328704834, 4.032160759277343, 4.034070838088989, 4.030838821868897, 4.031133236694336, 4.032454485397339, 4.0351671361541745, 4.032833539428711, 4.03182988456726, 4.035511425170898, 4.034130640563965, 4.030528937072754, 4.031213985443115, 4.02996834274292, 4.034611818542481, 4.032926365203857 ], "train_acc": [ 0.06838, 0.08666, 0.08636, 0.08428, 0.08436, 0.08, 0.07998, 0.0795, 0.08026, 0.07902, 0.08168, 0.08248, 0.08128, 0.08158, 0.0824, 0.08262, 0.08376, 0.08384, 0.08508, 0.08482, 0.0866, 0.08544, 0.08676, 0.08688, 0.08632, 0.08594, 0.0864, 0.08776, 0.08736, 0.0885, 0.08856, 0.08896, 0.08866, 0.08886, 0.08898, 0.09026, 0.08896, 0.09028, 0.09104, 0.08926, 0.08906, 0.08948, 0.09216, 0.09092, 0.0916, 0.09188, 0.09304, 0.09212, 0.09048, 0.0914, 0.09228, 0.09146, 0.09234, 0.09168, 0.09086, 0.09146, 0.09152, 0.0926, 0.0927, 0.09192, 0.09064, 0.09282, 0.09188, 0.09342, 0.09134, 0.09174, 0.09164, 0.09388, 0.09276, 0.0928, 0.09378, 0.0937, 0.09332, 0.09394, 0.09278, 0.09276, 0.09362, 0.09378, 0.0931, 0.09256, 0.09352, 0.0925, 0.09258, 0.0933, 0.09242, 0.09364, 0.09322, 0.09358, 0.09406, 0.09348, 0.09254, 0.09332, 0.09516, 0.09486, 0.09452, 0.09486, 0.09398, 0.09486, 0.0926, 0.09292 ], "test_acc": [ 0.0832, 0.0875, 0.0896, 0.0827, 0.0848, 0.0809, 0.0756, 0.0769, 0.0809, 0.0777, 0.0775, 0.0751, 0.0835, 0.0804, 0.0776, 0.0805, 0.0857, 0.0753, 0.0811, 0.0813, 0.0813, 0.0786, 0.0812, 0.0834, 0.0862, 0.0883, 0.0863, 0.0861, 0.0853, 0.0878, 0.0835, 0.087, 0.0873, 0.0833, 0.087, 0.0834, 0.08, 0.0867, 0.0897, 0.0872, 0.0834, 0.0871, 0.0804, 0.084, 0.0892, 0.0908, 0.0851, 0.0891, 0.0889, 0.0834, 0.0892, 0.0905, 0.0915, 0.0885, 0.09, 0.0895, 0.0863, 0.0889, 0.0923, 0.0884, 0.0901, 0.087, 0.0912, 0.0893, 0.0901, 0.0868, 0.09, 0.0877, 0.09, 0.0906, 0.0895, 0.0902, 0.0864, 0.0878, 0.0914, 0.0888, 0.0878, 0.0886, 0.089, 0.0879, 0.0894, 0.0902, 0.0885, 0.0887, 0.0886, 0.089, 0.0897, 0.0892, 0.09, 0.0898, 0.0898, 0.089, 0.0898, 0.0896, 0.0895, 0.0893, 0.0895, 0.0894, 0.0895, 0.0894 ] }, "diagnostics": { "bp_cosine": [ 0.1401812732219696, -0.0036733129527419806, -0.012468342669308186, -0.005749615840613842 ], "perturbation_rho": [ -0.006108707282692194, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -6.239861249923706e-07, 0.0, -7.450580596923828e-09, 0.0 ], "0.003": [ -1.9390136003494263e-06, -1.862645149230957e-09, -5.587935447692871e-09, -9.313225746154785e-10 ], "0.01": [ -6.262678653001785e-06, 7.450580596923828e-09, -9.313225746154785e-09, -9.313225746154785e-10 ] }, "hidden_norms_per_layer": [ 18858.84765625, 30104360.0, 115109720.0, 142242432.0, 189834320.0 ], "bp_grad_norms_per_layer": [ 1.6800353250800981e-06, 1.0384521687001325e-08, 1.0259526561640087e-08, 1.025457141423658e-08, 1.027041474088719e-08 ] }, "drift": { "embed.weight": 159.1972472218232, "embed.bias": 106.18499737865416, "blocks.0.ln.weight": 8.374361991882324, "blocks.0.w1.weight": 130.25292802776573, "blocks.0.w1.bias": 147.17751025342662, "blocks.0.w2.weight": 140.99980409584657, "blocks.1.ln.weight": 7.522654056549072, "blocks.1.w1.weight": 183.9407903471226, "blocks.1.w1.bias": 180.51106512410223, "blocks.1.w2.weight": 111.67829579527385, "blocks.2.ln.weight": 7.498361110687256, "blocks.2.w1.weight": 174.07305808153814, "blocks.2.w1.bias": 174.07821632973472, "blocks.2.w2.weight": 98.850301691257, "blocks.3.ln.weight": 7.616756439208984, "blocks.3.w1.weight": 196.59852287605085, "blocks.3.w1.bias": 194.4284525943356, "blocks.3.w2.weight": 107.54506697831434, "out_ln.weight": 1.6382553577423096, "out_head.weight": 8.655421610551045, "out_head.bias": 0.8148936743952768 } }, "fa": { "log": { "train_loss": [ 4.217838704376221, 4.173818229370117, 4.116404933776855, 4.05976043182373, 4.010950881347656, 3.9877797143554687, 3.9654394758605958, 3.9516948413085937, 3.9414562885284425, 3.933943572845459, 3.9315726831054687, 3.9283136461639403, 3.918033894042969, 3.912524202957153, 3.9111721415710448, 3.9033537468719484, 3.898933872528076, 3.8940574435424806, 3.888040324020386, 3.8902594078826906, 3.881309941253662, 3.879018879852295, 3.874496072845459, 3.871587658691406, 3.867957287750244, 3.8586695248413085, 3.858678229446411, 3.8550938296508788, 3.848460863571167, 3.843934544219971, 3.841355255813599, 3.838310421142578, 3.832888546218872, 3.8317080396270753, 3.8244371617126465, 3.826680388870239, 3.820091895675659, 3.8168691710662843, 3.8143892570495606, 3.8094303827667235, 3.811340135421753, 3.808084242401123, 3.8061284660339356, 3.8042135272979736, 3.803864609298706, 3.8014156354522703, 3.796123163604736, 3.7960259418487547, 3.794198034515381, 3.793316494140625, 3.7887488148498534, 3.7955673222351076, 3.787652738494873, 3.789291185760498, 3.7856833452606202, 3.7837219773864748, 3.7850829206848147, 3.7822190380859375, 3.780595345993042, 3.780773038482666, 3.7798492553710936, 3.777712000579834, 3.77948525390625, 3.7754471015930178, 3.7783823108673094, 3.7751461651611327, 3.7731632305908205, 3.7698883753204346, 3.7678470989227293, 3.7675471087646484, 3.768726477050781, 3.7664906182861326, 3.7642928605651855, 3.7634823627471925, 3.7624606089782713, 3.7626713751983645, 3.76369431892395, 3.7644162739562987, 3.759299655914307, 3.759175650482178, 3.758095093460083, 3.758687426223755, 3.7558257189941404, 3.758380405960083, 3.7552133833312986, 3.7560367737579345, 3.757290748748779, 3.7513376335144044, 3.7552056824493407, 3.7553686474609376, 3.754800821685791, 3.752587652511597, 3.7521287742614744, 3.754502056884766, 3.7546933338928223, 3.750953895263672, 3.749489372558594, 3.7477175559997558, 3.753209332885742, 3.75081868347168 ], "train_acc": [ 0.06112, 0.06028, 0.0684, 0.07838, 0.08954, 0.09232, 0.0962, 0.09766, 0.099, 0.10078, 0.1022, 0.10314, 0.10234, 0.1031, 0.10412, 0.10498, 0.10776, 0.10782, 0.109, 0.10792, 0.10914, 0.11072, 0.10982, 0.11022, 0.11282, 0.11262, 0.11402, 0.11302, 0.11302, 0.11694, 0.11542, 0.11602, 0.11642, 0.1175, 0.11876, 0.12074, 0.11926, 0.11816, 0.12184, 0.12202, 0.12178, 0.12238, 0.1222, 0.12238, 0.12092, 0.12362, 0.12338, 0.12428, 0.1248, 0.12516, 0.12588, 0.12532, 0.12592, 0.12498, 0.12348, 0.1247, 0.12646, 0.12716, 0.12708, 0.1273, 0.12668, 0.12754, 0.1268, 0.1288, 0.12586, 0.12914, 0.12678, 0.12832, 0.1304, 0.12808, 0.12922, 0.13104, 0.12964, 0.13008, 0.13144, 0.1314, 0.12958, 0.1298, 0.1312, 0.13116, 0.13188, 0.1315, 0.1315, 0.13028, 0.13222, 0.1339, 0.13118, 0.13218, 0.13354, 0.1333, 0.13136, 0.13216, 0.13268, 0.13262, 0.13292, 0.13426, 0.13368, 0.13344, 0.13306, 0.13192 ], "test_acc": [ 0.0534, 0.0616, 0.0812, 0.0837, 0.0888, 0.0944, 0.0942, 0.0981, 0.1007, 0.0999, 0.1021, 0.0988, 0.1083, 0.1019, 0.1073, 0.1051, 0.1085, 0.107, 0.1044, 0.1125, 0.1066, 0.1037, 0.1053, 0.1129, 0.1129, 0.1183, 0.1149, 0.1188, 0.1188, 0.1138, 0.114, 0.1201, 0.1229, 0.1223, 0.1169, 0.1239, 0.1156, 0.1221, 0.1195, 0.1228, 0.1275, 0.1226, 0.1232, 0.1264, 0.1312, 0.1262, 0.126, 0.1266, 0.126, 0.124, 0.1272, 0.1229, 0.1293, 0.1247, 0.125, 0.1265, 0.1232, 0.1295, 0.1274, 0.1275, 0.1273, 0.1276, 0.1285, 0.1266, 0.1285, 0.128, 0.1299, 0.1295, 0.1308, 0.1252, 0.1315, 0.1292, 0.1291, 0.1296, 0.1298, 0.1308, 0.1314, 0.1297, 0.1304, 0.1307, 0.13, 0.1335, 0.1296, 0.1302, 0.1329, 0.1303, 0.1313, 0.1315, 0.132, 0.1311, 0.1311, 0.1322, 0.1311, 0.1317, 0.1308, 0.1309, 0.1306, 0.1308, 0.1311, 0.131 ] }, "diagnostics": { "bp_cosine": [ 0.08354228734970093, 0.008694879710674286, -0.10087701678276062, 0.9982630610466003 ], "perturbation_rho": [ -0.00011634547263383865, 0.02022995427250862, -0.014473065733909607, -0.005974383093416691 ], "nudging": { "0.001": [ -1.8016435205936432e-06, -6.216578185558319e-08, 9.220093488693237e-08, -1.9045546650886536e-06 ], "0.003": [ -5.271751433610916e-06, -1.3830140233039856e-07, 7.264316082000732e-07, -7.401220500469208e-06 ], "0.01": [ -1.7585232853889465e-05, -5.245674401521683e-07, 3.0526425689458847e-06, -2.642977051436901e-05 ] }, "hidden_norms_per_layer": [ 11478.736328125, 155429.828125, 870084.3125, 1247755.625, 225384.953125 ], "bp_grad_norms_per_layer": [ 9.544731256028172e-06, 1.3853283462594845e-06, 1.3375421303862822e-06, 1.3386792261371738e-06, 1.3382986026044819e-06 ] }, "drift": { "embed.weight": 105.03852710133908, "embed.bias": 26.837405563994206, "blocks.0.ln.weight": 2.3730220794677734, "blocks.0.w1.weight": 28.170015713455946, "blocks.0.w1.bias": 23.197896445244968, "blocks.0.w2.weight": 73.04463083219117, "blocks.1.ln.weight": 1.476442575454712, "blocks.1.w1.weight": 29.314224337417265, "blocks.1.w1.bias": 28.13876609135274, "blocks.1.w2.weight": 39.8446977611363, "blocks.2.ln.weight": 1.1785210371017456, "blocks.2.w1.weight": 29.01006529023273, "blocks.2.w1.bias": 32.13611131919081, "blocks.2.w2.weight": 31.240416399097963, "blocks.3.ln.weight": 1.4267656803131104, "blocks.3.w1.weight": 32.92178917188402, "blocks.3.w1.bias": 34.64484336575641, "blocks.3.w2.weight": 31.82487883605455, "out_ln.weight": 0.5113871097564697, "out_head.weight": 3.9161050246024547, "out_head.bias": 2.224345965208238 } } }, "config": { "dataset": "cifar100", "d_hidden": 256, "num_blocks": 4, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 456 ], "gpu": 0, "output_dir": "results/cifar100_d256_L4", "methods": [ "bp", "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 100 } }