{ "0": { "dfa": { "log": { "train_loss": [ 2.0727519187164307, 2.0449732803344727, 2.0343947634887694, 2.0317279723739623, 2.029190194129944, 2.0266742729187013, 2.022695488433838, 2.0220756021881106, 2.017278121871948, 2.013867749862671, 2.0141937175750733, 2.0114837906265257, 2.0090159717559812, 2.006871261138916, 2.0085684817504883, 2.004453958129883, 2.0050127017211916, 2.004625142745972, 2.001847840270996, 2.0038710110855105, 2.0015532569885255, 2.001803522415161, 2.0029406197357176, 1.9984209733581544, 1.9999778453063966, 1.997875029144287, 2.002456622467041, 2.000510860939026, 1.9972556433105468, 1.9980127339935303, 1.9964525595092772, 1.9945909706878662, 1.994441053237915, 1.9951845182037353, 1.995466745147705, 1.992624706878662, 1.9937170362091063, 1.9947755416870117, 1.9944197441101075, 1.9952830042266845, 1.9904139096832276, 1.991399830932617, 1.9951595304870606, 1.9930326363754272, 1.9904268531799316, 1.9908876788330079, 1.9936137868499755, 1.9875998815917968, 1.992842328338623, 1.990330719833374, 1.9921186029815674, 1.9902390911102295, 1.9888944667053223, 1.9905146474456787, 1.9888609869384766, 1.9911943308258058, 1.9893802894592285, 1.9878305652618409, 1.9877847812652587, 1.9883021939849854, 1.988304048690796, 1.9873467050170899, 1.9866977008438111, 1.9872942990875244, 1.9863059562683105, 1.9860430270004272, 1.9863528005981446, 1.9857840370941162, 1.9861036871337892, 1.985937850112915, 1.9876243210601807, 1.9859837552642823, 1.9863339701080323, 1.9869920307922364, 1.9855867569732666, 1.984609903526306, 1.9867486194229127, 1.9843175145721434, 1.9860691648101807, 1.9842630282592773, 1.986168493347168, 1.9858933181762695, 1.98474868850708, 1.9866244787979126, 1.9833790422058106, 1.9852294052505493, 1.9821201675033568, 1.9854196563339233, 1.9846102389526368, 1.9820537503433227, 1.981782052307129, 1.984344421157837, 1.983909532699585, 1.9853303438949585, 1.984236333694458, 1.9829996084594728, 1.984313102684021, 1.9833407458496093, 1.983147784729004, 1.9833076025390626 ], "train_acc": [ 0.2332, 0.24532, 0.2542, 0.2564, 0.25326, 0.25504, 0.25822, 0.26022, 0.26324, 0.26234, 0.26278, 0.26454, 0.26348, 0.26876, 0.26432, 0.26712, 0.268, 0.26852, 0.27126, 0.26796, 0.2701, 0.27052, 0.26954, 0.27056, 0.27256, 0.27258, 0.26872, 0.27102, 0.2732, 0.27298, 0.27452, 0.27374, 0.27488, 0.273, 0.27604, 0.2756, 0.27576, 0.27472, 0.27344, 0.27474, 0.27776, 0.27826, 0.27318, 0.2762, 0.27666, 0.27602, 0.2763, 0.2777, 0.27724, 0.27716, 0.27566, 0.27832, 0.28138, 0.27918, 0.27922, 0.27668, 0.27846, 0.27786, 0.27796, 0.2762, 0.27946, 0.27984, 0.2795, 0.27926, 0.28092, 0.27924, 0.27978, 0.28098, 0.28132, 0.2802, 0.27814, 0.28184, 0.28178, 0.28284, 0.28128, 0.2829, 0.28048, 0.28194, 0.28236, 0.2801, 0.28106, 0.28278, 0.28308, 0.27886, 0.2815, 0.28188, 0.28254, 0.28202, 0.28158, 0.28336, 0.2825, 0.28316, 0.28312, 0.28218, 0.28288, 0.2816, 0.28218, 0.2807, 0.2835, 0.28354 ], "test_acc": [ 0.2507, 0.2596, 0.274, 0.2704, 0.2841, 0.2803, 0.2788, 0.2781, 0.303, 0.2941, 0.2905, 0.3016, 0.2779, 0.3052, 0.2819, 0.2911, 0.2931, 0.2886, 0.2812, 0.2924, 0.2947, 0.2701, 0.28, 0.2912, 0.3037, 0.2894, 0.3012, 0.3011, 0.3056, 0.2981, 0.2923, 0.2961, 0.3082, 0.3035, 0.2868, 0.2981, 0.3042, 0.2956, 0.3012, 0.296, 0.3077, 0.3082, 0.3, 0.3141, 0.2967, 0.3024, 0.3004, 0.3016, 0.308, 0.3028, 0.3072, 0.2933, 0.2907, 0.3126, 0.3036, 0.2973, 0.3001, 0.3054, 0.3115, 0.3004, 0.3026, 0.3022, 0.3051, 0.3109, 0.2968, 0.3092, 0.2998, 0.3062, 0.3081, 0.3035, 0.3032, 0.3114, 0.3147, 0.308, 0.3035, 0.3098, 0.3091, 0.3065, 0.3094, 0.3071, 0.3072, 0.309, 0.3012, 0.3067, 0.3016, 0.3028, 0.3048, 0.3083, 0.3082, 0.308, 0.3097, 0.3087, 0.3117, 0.3104, 0.3086, 0.3085, 0.3088, 0.3084, 0.3085, 0.3086 ] }, "diagnostics": { "bp_cosine": [ 0.395052969455719, 0.0004171400796622038, 8.336821338161826e-06, 0.0005622187163680792, 0.00013701531861443073, -0.00035643568844534457, 0.00012600264744833112, -0.00027335749473422766, 0.00016040689661167562, -6.0928698076168075e-05, 3.278384974692017e-05, 0.0003701794194057584 ], "perturbation_rho": [ 0.018501652404665947, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -4.1211023926734924e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.2032687664031982e-06, 0.0, 0.0, 0.0, 0.0, 3.725290298461914e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -4.2067840695381165e-06, -9.313225746154785e-10, -2.7939677238464355e-09, 9.313225746154785e-10, 0.0, 4.6566128730773926e-09, 1.862645149230957e-09, 0.0, 0.0, 0.0, 0.0, 0.0 ] }, "hidden_norms_per_layer": [ 52639.97265625, 1088866944.0, 4048803840.0, 5257923584.0, 5847087616.0, 5938909184.0, 7423066624.0, 9731870720.0, 11342387200.0, 11317005312.0, 11353008128.0, 12463034368.0, 13189959680.0 ], "bp_grad_norms_per_layer": [ 2.804916334753216e-07, 1.9205773083008637e-10, 1.9170887100017353e-10, 1.9189858035950635e-10, 1.919657766080718e-10, 1.919622516499686e-10, 1.919622516499686e-10, 1.9191119526862366e-10, 1.9192891720365424e-10, 1.919416292572862e-10, 1.9193641120907046e-10, 1.9192181177629664e-10, 1.9190903033372564e-10 ] }, "drift": { "embed.weight": 330.26007887921685, "embed.bias": 274.2168771279626, "blocks.0.ln.weight": 10.94628999409354, "blocks.0.w1.weight": 277.3643033410537, "blocks.0.w1.bias": 261.86497048407, "blocks.0.w2.weight": 484.6109947045105, "blocks.1.ln.weight": 9.35886499546542, "blocks.1.w1.weight": 360.26286845371646, "blocks.1.w1.bias": 355.66126981713177, "blocks.1.w2.weight": 392.1776082515924, "blocks.2.ln.weight": 9.350239389888953, "blocks.2.w1.weight": 370.0336198354507, "blocks.2.w1.bias": 337.8932267522991, "blocks.2.w2.weight": 352.1258021274022, "blocks.3.ln.weight": 9.767929501471052, "blocks.3.w1.weight": 331.5909899943081, "blocks.3.w1.bias": 303.3604214345198, "blocks.3.w2.weight": 312.3336342294667, "blocks.4.ln.weight": 6.8894143383412505, "blocks.4.w1.weight": 245.69582220582208, "blocks.4.w1.bias": 226.6077326792198, "blocks.4.w2.weight": 237.1578303477898, "blocks.5.ln.weight": 10.087708773364, "blocks.5.w1.weight": 391.6451916277919, "blocks.5.w1.bias": 364.5077034653599, "blocks.5.w2.weight": 375.80268056062386, "blocks.6.ln.weight": 10.894168165759849, "blocks.6.w1.weight": 446.1083385424109, "blocks.6.w1.bias": 408.24079100200436, "blocks.6.w2.weight": 421.6066446657385, "blocks.7.ln.weight": 10.280446652077675, "blocks.7.w1.weight": 417.5786268538863, "blocks.7.w1.bias": 412.3650615213133, "blocks.7.w2.weight": 413.1057523107626, "blocks.8.ln.weight": 7.628061136196448, "blocks.8.w1.weight": 280.87597195145304, "blocks.8.w1.bias": 261.4439841235217, "blocks.8.w2.weight": 269.85556299140023, "blocks.9.ln.weight": 7.035433277618009, "blocks.9.w1.weight": 236.54101277402214, "blocks.9.w1.bias": 227.70919757896647, "blocks.9.w2.weight": 225.58244999977697, "blocks.10.ln.weight": 10.07787136157841, "blocks.10.w1.weight": 405.6014059372381, "blocks.10.w1.bias": 387.7928293241623, "blocks.10.w2.weight": 391.3899843395933, "blocks.11.ln.weight": 9.615189319853535, "blocks.11.w1.weight": 379.5363902874608, "blocks.11.w1.bias": 358.37006314701347, "blocks.11.w2.weight": 355.59941733335387, "out_ln.weight": 0.6824993975107903, "out_head.weight": 9.861581662622491, "out_head.bias": 0.35061659338833756 } }, "fa": { "log": { "train_loss": [ 2.0293911264038087, 1.950565330429077, 1.917781063232422, 1.9023740824127198, 1.8861673935699463, 1.8825682291412353, 1.873201879234314, 1.8714005821990967, 1.8628303081512452, 1.8579199737548828, 1.8572168459320069, 1.8525300827789306, 1.845312434463501, 1.8409330677032472, 1.8335270806121826, 1.822513469543457, 1.8199686001205444, 1.8136085485458373, 1.8064511907196046, 1.803108533859253, 1.7962512873077392, 1.7911701647949219, 1.7911696646118165, 1.7887402313995362, 1.783379939842224, 1.7759505123901367, 1.780573166732788, 1.7734921991729737, 1.7670989339828491, 1.7612831104278563, 1.7572847888183594, 1.753526630859375, 1.750715301132202, 1.7472047467041016, 1.7457971502304077, 1.7424137032699585, 1.7345080102920531, 1.734222209701538, 1.7304457287216186, 1.7239187670898437, 1.7218291164398194, 1.7199537884902953, 1.7217532263565063, 1.7196246533584594, 1.7135296297836304, 1.706606083908081, 1.7079890319824218, 1.7041183599472045, 1.705560855026245, 1.7011269199371337, 1.7035633499908447, 1.6992430791854858, 1.6950508019638062, 1.7004030841064453, 1.691479129295349, 1.691718464050293, 1.6919280102157592, 1.6887580330657959, 1.6883217154693604, 1.688851436805725, 1.6853341622543334, 1.680581435546875, 1.678009653892517, 1.6784401907730102, 1.6803946784210204, 1.6761323783493043, 1.676516137046814, 1.6778211946868897, 1.6767865496444703, 1.6731242126083374, 1.675690205078125, 1.669817829246521, 1.6760586986923218, 1.670416958580017, 1.6687565314483643, 1.668258262901306, 1.6666069919204711, 1.666242490005493, 1.6675299571990967, 1.663490775527954, 1.6672910994720458, 1.6639445114517213, 1.6617960903167726, 1.6636806215667725, 1.6643552365112304, 1.6602695792007447, 1.6589048775100708, 1.6614284314727783, 1.6610555962753295, 1.6578762405014038, 1.6580958423614502, 1.6621724097061157, 1.6586555422210694, 1.657684158668518, 1.6587366760253905, 1.657404851913452, 1.6599628324127198, 1.6565218897247314, 1.6586303088760377, 1.6615223189544677 ], "train_acc": [ 0.2526, 0.29054, 0.30538, 0.31188, 0.31418, 0.31852, 0.32254, 0.3243, 0.32728, 0.33104, 0.33096, 0.33338, 0.33726, 0.33962, 0.3428, 0.34614, 0.34728, 0.34656, 0.35102, 0.35328, 0.35598, 0.35864, 0.35488, 0.35678, 0.35954, 0.36188, 0.36066, 0.36522, 0.36488, 0.36676, 0.36986, 0.3702, 0.3739, 0.37346, 0.37434, 0.37574, 0.3752, 0.3788, 0.37904, 0.38092, 0.38054, 0.38164, 0.37934, 0.38172, 0.38678, 0.3875, 0.38734, 0.38996, 0.38752, 0.39106, 0.38978, 0.39084, 0.39086, 0.39326, 0.39296, 0.39256, 0.39342, 0.39414, 0.39416, 0.39432, 0.39614, 0.39536, 0.3965, 0.39922, 0.39722, 0.39968, 0.3982, 0.39886, 0.40146, 0.4016, 0.40122, 0.4017, 0.39858, 0.40386, 0.40168, 0.4028, 0.4026, 0.4035, 0.40378, 0.40566, 0.4031, 0.4049, 0.40506, 0.4035, 0.40618, 0.40566, 0.406, 0.40476, 0.40564, 0.40724, 0.40646, 0.4061, 0.4079, 0.40568, 0.40498, 0.40842, 0.40674, 0.40746, 0.40728, 0.40684 ], "test_acc": [ 0.2924, 0.3363, 0.3349, 0.3386, 0.347, 0.3457, 0.3423, 0.3555, 0.3653, 0.3606, 0.3632, 0.3617, 0.3575, 0.3723, 0.3703, 0.3715, 0.3741, 0.3774, 0.374, 0.3745, 0.3836, 0.3907, 0.3702, 0.3831, 0.385, 0.3843, 0.3922, 0.4003, 0.3967, 0.3978, 0.3897, 0.3828, 0.401, 0.4012, 0.3991, 0.3999, 0.4055, 0.4085, 0.3968, 0.4064, 0.4066, 0.4082, 0.404, 0.4042, 0.4085, 0.4091, 0.4104, 0.4155, 0.4157, 0.4125, 0.4139, 0.4166, 0.4116, 0.4187, 0.4186, 0.4123, 0.4161, 0.4171, 0.4184, 0.414, 0.4179, 0.4184, 0.4197, 0.4193, 0.421, 0.4205, 0.423, 0.4233, 0.4201, 0.422, 0.4204, 0.4151, 0.4182, 0.4218, 0.4239, 0.4198, 0.425, 0.4239, 0.4204, 0.4215, 0.4253, 0.4199, 0.4235, 0.4206, 0.4235, 0.4255, 0.4222, 0.423, 0.4216, 0.426, 0.4245, 0.4245, 0.4239, 0.4248, 0.4224, 0.4245, 0.4246, 0.4241, 0.4242, 0.4239 ] }, "diagnostics": { "bp_cosine": [ 0.005966864060610533, 0.04795818775892258, 0.043208200484514236, -0.05298762395977974, -0.11785908043384552, -0.05540306121110916, -0.10012105107307434, -0.09065192937850952, -0.04056818038225174, -0.03824863210320473, -0.07007172703742981, 0.9948829412460327 ], "perturbation_rho": [ 0.028052061796188354, 0.03165658190846443, -0.006041648797690868, -0.027337782084941864, 0.01562969572842121, 0.01757640205323696, -0.025423342362046242, -0.024989785626530647, -0.03021504357457161, 0.021996641531586647, 0.03194758668541908, 0.01976931467652321 ], "nudging": { "0.001": [ 3.7101563066244125e-07, -6.126938387751579e-07, -3.066379576921463e-07, 1.6076955944299698e-07, 3.3061951398849487e-07, 1.5937257558107376e-07, 2.9441434890031815e-07, 2.859160304069519e-07, 1.284060999751091e-07, 1.5040859580039978e-07, 2.1443702280521393e-07, -3.2152747735381126e-06 ], "0.003": [ 1.007108949124813e-06, -1.6828998923301697e-06, -6.601912900805473e-07, 4.4493936002254486e-07, 1.1789379641413689e-06, 5.08967787027359e-07, 1.0151416063308716e-06, 8.791685104370117e-07, 3.866152837872505e-07, 3.688037395477295e-07, 6.126938387751579e-07, -1.0434770956635475e-05 ], "0.01": [ 3.6874553188681602e-06, -5.368026904761791e-06, -2.2364547476172447e-06, 1.735752448439598e-06, 3.992114216089249e-06, 1.860782504081726e-06, 3.5137636587023735e-06, 3.010733053088188e-06, 1.437612809240818e-06, 1.2825476005673409e-06, 2.246466465294361e-06, -3.491528332233429e-05 ] }, "hidden_norms_per_layer": [ 4702.6123046875, 44530.10546875, 108911.2109375, 164933.125, 283322.40625, 377155.46875, 407664.6875, 517485.0625, 562702.0625, 564809.5, 577993.1875, 617885.5625, 296847.03125 ], "bp_grad_norms_per_layer": [ 4.941995575791225e-05, 3.9530186768388376e-06, 1.528447455712012e-06, 1.3358264823182253e-06, 1.3305660786500084e-06, 1.3287758520164061e-06, 1.3350502285902621e-06, 1.339361574537179e-06, 1.3375677099247696e-06, 1.3184284171074978e-06, 1.3012635236009373e-06, 1.3201109823057777e-06, 1.27659131976543e-06 ] }, "drift": { "embed.weight": 36.945692873367385, "embed.bias": 13.300137685811876, "blocks.0.ln.weight": 0.901147599699004, "blocks.0.w1.weight": 13.367758537525685, "blocks.0.w1.bias": 10.72336098907488, "blocks.0.w2.weight": 46.304733049049524, "blocks.1.ln.weight": 0.7424575473753766, "blocks.1.w1.weight": 15.226852479991834, "blocks.1.w1.bias": 7.345119575250527, "blocks.1.w2.weight": 40.81729281725618, "blocks.2.ln.weight": 0.6752024292095198, "blocks.2.w1.weight": 13.877425620596014, "blocks.2.w1.bias": 7.829951186600198, "blocks.2.w2.weight": 39.52886223656965, "blocks.3.ln.weight": 0.6072219216215275, "blocks.3.w1.weight": 13.849387698880346, "blocks.3.w1.bias": 11.302805784789012, "blocks.3.w2.weight": 31.48991587682597, "blocks.4.ln.weight": 0.3513996294280428, "blocks.4.w1.weight": 12.017687634070212, "blocks.4.w1.bias": 12.545759692163585, "blocks.4.w2.weight": 19.78672753090035, "blocks.5.ln.weight": 0.27340079470413037, "blocks.5.w1.weight": 10.049144366681992, "blocks.5.w1.bias": 9.943637751012846, "blocks.5.w2.weight": 19.227980350358227, "blocks.6.ln.weight": 0.3688735234588941, "blocks.6.w1.weight": 12.460300257534458, "blocks.6.w1.bias": 13.383277160534908, "blocks.6.w2.weight": 19.760938996380943, "blocks.7.ln.weight": 0.34359755221214905, "blocks.7.w1.weight": 11.768674295896531, "blocks.7.w1.bias": 13.150434923761187, "blocks.7.w2.weight": 21.174060669259852, "blocks.8.ln.weight": 0.3997077790355334, "blocks.8.w1.weight": 11.48289450791943, "blocks.8.w1.bias": 8.028224303872328, "blocks.8.w2.weight": 35.011661428887535, "blocks.9.ln.weight": 0.43894400900661307, "blocks.9.w1.weight": 11.84935422288265, "blocks.9.w1.bias": 8.899824293598352, "blocks.9.w2.weight": 34.666647832790865, "blocks.10.ln.weight": 0.4701858246153278, "blocks.10.w1.weight": 12.779979416376127, "blocks.10.w1.bias": 12.40660396279328, "blocks.10.w2.weight": 30.770398182409856, "blocks.11.ln.weight": 0.502840402610306, "blocks.11.w1.weight": 15.51482213849637, "blocks.11.w1.bias": 16.777463254010712, "blocks.11.w2.weight": 27.32990799926724, "out_ln.weight": 0.2952693196309993, "out_head.weight": 4.4773532602382, "out_head.bias": 1.8150038464128413 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 0 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L12_seed0", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }