{ "42": { "fa": { "log": { "train_loss": [ 2.049124941177368, 1.971964567337036, 1.9483523839569092, 1.9344041421508789, 1.9224640267944335, 1.9110223713684082, 1.9013612536621094, 1.8914563995742797, 1.8888161966705321, 1.8849480002212524, 1.8800471724700927, 1.8740126901245118, 1.8716543948745727, 1.8681818910217285, 1.867931474647522, 1.866554428138733, 1.8656607852935791, 1.85699001285553, 1.855739754257202, 1.8523859079360963, 1.8532698722076415, 1.8493807650375367, 1.84840350189209, 1.8443957958602906, 1.842935036239624, 1.8395105728912353, 1.8337825148773192, 1.8333892483520509, 1.8321472442245483, 1.8294915601348878, 1.8279203462982179, 1.826354044494629, 1.8228275035858155, 1.8226369649887084, 1.8176784851837158, 1.8198615470123292, 1.8155909259796144, 1.8137150632476806, 1.8144374758911133, 1.816846872291565, 1.8122928824234008, 1.8105264510345458, 1.8050418474578858, 1.810307405052185, 1.8034298502349853, 1.8004834436798096, 1.8044248488616943, 1.8068354278182983, 1.8045337250518798, 1.8001124160766602, 1.7975274431991577, 1.7963342412567138, 1.7940989971923829, 1.7987028061294557, 1.7954791347503662, 1.7969434225845338, 1.794546351585388, 1.790341936378479, 1.7904112981414795, 1.796010117111206, 1.7922658501434325, 1.7879667960357666, 1.787852370376587, 1.7872013766479493, 1.7859069106292724, 1.7856995489120484, 1.7886004698944091, 1.7876731681060791, 1.7865260543823243, 1.785853352394104, 1.7849980658340454, 1.7868319046020509, 1.7825030782318114, 1.7818804879379273, 1.7835813956069946, 1.7858538039779663, 1.7806534545516968, 1.7811814181900025, 1.7809104974365235, 1.7819213286972047, 1.7821454078674317, 1.782828011817932, 1.779138667678833, 1.778261279373169, 1.7800345748901367, 1.776551816444397, 1.7768282559967041, 1.7764475776672364, 1.7771262689590455, 1.7769524020767211, 1.7762922687149048, 1.7768514712524415, 1.779178479270935, 1.7777679949951173, 1.7764834703826904, 1.77460149269104, 1.7745818335342407, 1.7761323275375367, 1.7797669164276122, 1.7776144277954102 ], "train_acc": [ 0.2436, 0.27338, 0.2898, 0.29694, 0.30116, 0.3039, 0.30988, 0.31412, 0.31788, 0.31722, 0.31988, 0.32372, 0.323, 0.32762, 0.32672, 0.3276, 0.32934, 0.33266, 0.3352, 0.33332, 0.33394, 0.33564, 0.33554, 0.33832, 0.33744, 0.33804, 0.34066, 0.34208, 0.34102, 0.34436, 0.34358, 0.34454, 0.34578, 0.34732, 0.34992, 0.34824, 0.3498, 0.35008, 0.35088, 0.35076, 0.35254, 0.35354, 0.35364, 0.35176, 0.35556, 0.35626, 0.35458, 0.35408, 0.35588, 0.35876, 0.35938, 0.36056, 0.36056, 0.35998, 0.36086, 0.35718, 0.35898, 0.36128, 0.36022, 0.3575, 0.36098, 0.36178, 0.36196, 0.36508, 0.36294, 0.3645, 0.36438, 0.36428, 0.36462, 0.36086, 0.3643, 0.3637, 0.36544, 0.36562, 0.36574, 0.36544, 0.3643, 0.36654, 0.36688, 0.36584, 0.36738, 0.36538, 0.3685, 0.36706, 0.3681, 0.36614, 0.36798, 0.36682, 0.36688, 0.36772, 0.3687, 0.36828, 0.36478, 0.3676, 0.36774, 0.36956, 0.36956, 0.36768, 0.3664, 0.36848 ], "test_acc": [ 0.2789, 0.3105, 0.3048, 0.3148, 0.323, 0.3367, 0.3399, 0.3468, 0.3417, 0.3416, 0.3511, 0.3527, 0.342, 0.353, 0.3624, 0.349, 0.354, 0.3675, 0.3543, 0.3609, 0.3613, 0.3656, 0.3683, 0.3572, 0.365, 0.3682, 0.3725, 0.3578, 0.3725, 0.3714, 0.3683, 0.3666, 0.3621, 0.3689, 0.3747, 0.3784, 0.368, 0.383, 0.3698, 0.3823, 0.379, 0.3766, 0.3793, 0.3789, 0.3879, 0.3813, 0.373, 0.3839, 0.3814, 0.3842, 0.3882, 0.381, 0.3834, 0.3841, 0.3851, 0.387, 0.3809, 0.3833, 0.3834, 0.3806, 0.3854, 0.3907, 0.3796, 0.3892, 0.3915, 0.3907, 0.391, 0.3903, 0.3921, 0.3892, 0.3916, 0.3909, 0.3912, 0.3923, 0.3912, 0.3912, 0.3937, 0.3894, 0.3946, 0.3919, 0.3897, 0.3923, 0.3973, 0.392, 0.3971, 0.3938, 0.3908, 0.3947, 0.3922, 0.3913, 0.3909, 0.3931, 0.3937, 0.3931, 0.3933, 0.392, 0.392, 0.3926, 0.3928, 0.3929 ] }, "diagnostics": { "bp_cosine": [ 0.028316663578152657, 0.0230555459856987, -0.10937326401472092, 0.9985983967781067 ], "perturbation_rho": [ -0.018305372446775436, -0.05561023950576782, 0.04369408264756203, 0.0030625772196799517 ], "nudging": { "0.001": [ -1.237727701663971e-06, -8.684583008289337e-08, 2.3283064365386963e-09, -1.1352822184562683e-06 ], "0.003": [ -3.5907141864299774e-06, -3.394670784473419e-07, 4.407484084367752e-07, -4.475703462958336e-06 ], "0.01": [ -1.1818483471870422e-05, -7.816124707460403e-07, 1.9797589629888535e-06, -1.6960781067609787e-05 ] }, "hidden_norms_per_layer": [ 5829.11083984375, 96512.5703125, 1033049.3125, 1362033.875, 493509.875 ], "bp_grad_norms_per_layer": [ 1.7891748939291574e-05, 1.2141871366111445e-06, 8.851626489558839e-07, 8.892926075532159e-07, 8.88764532191999e-07 ] }, "drift": { "embed.weight": 61.065183980831414, "embed.bias": 37.30479105851126, "blocks.0.ln.weight": 1.813413381576538, "blocks.0.w1.weight": 19.65702484459222, "blocks.0.w1.bias": 18.43264760143014, "blocks.0.w2.weight": 80.7069052062468, "blocks.1.ln.weight": 1.5857534408569336, "blocks.1.w1.weight": 30.581704417045803, "blocks.1.w1.bias": 32.64715538359668, "blocks.1.w2.weight": 51.04559112831385, "blocks.2.ln.weight": 1.1075904369354248, "blocks.2.w1.weight": 27.221029191801634, "blocks.2.w1.bias": 31.23130799360825, "blocks.2.w2.weight": 40.72448084896488, "blocks.3.ln.weight": 1.233646035194397, "blocks.3.w1.weight": 30.670509581621424, "blocks.3.w1.bias": 34.319449767073166, "blocks.3.w2.weight": 50.44485584477348, "out_ln.weight": 0.31939876079559326, "out_head.weight": 5.424347923413205, "out_head.bias": 2.5070306021804907 } } }, "123": { "fa": { "log": { "train_loss": [ 2.039442294845581, 1.953594453125, 1.9264128439712525, 1.9111677870941162, 1.9046263507843018, 1.8970699446868897, 1.8877645287322997, 1.8802119188690185, 1.8676571554565429, 1.8596859856796264, 1.8576147148895263, 1.8543415798950196, 1.847902306289673, 1.843341840286255, 1.8415791506576538, 1.8326364449691772, 1.8275398804473877, 1.825090225830078, 1.8180097577667236, 1.812808359451294, 1.8083131935882568, 1.806013644104004, 1.8015524674224854, 1.7926762564086913, 1.7879434857177734, 1.7820632962799072, 1.781419140357971, 1.7759368832397462, 1.7757835355377198, 1.7717899426651, 1.7707528903579712, 1.7696525680923463, 1.7655191495895386, 1.765033065109253, 1.762537513771057, 1.7627749864959716, 1.7591946435546875, 1.7589446157455444, 1.7533805700683593, 1.757075972213745, 1.7514215006256104, 1.7560174445343018, 1.7500310370254517, 1.7495898828125, 1.7477490761566161, 1.7467513186264039, 1.7485883990859985, 1.7423759655380249, 1.7408935341644287, 1.7417366515731811, 1.7416620874023439, 1.7395717266845703, 1.735324585494995, 1.7391719909667969, 1.7375017526245118, 1.738703854637146, 1.739165567626953, 1.7372404578018188, 1.7375502878189086, 1.740667166519165, 1.7426861660766602, 1.7352294305801392, 1.7360000601577759, 1.7363917623901368, 1.7359804382705688, 1.7362036960601808, 1.7375494842529298, 1.7357752603149414, 1.7346405282211304, 1.734609012107849, 1.7384431924057007, 1.7361973517227174, 1.7336053954696655, 1.7382006414794922, 1.7355592263031006, 1.7354922631072998, 1.738483149909973, 1.733718469810486, 1.7319189379882813, 1.7344261421203613, 1.731631244506836, 1.7336486722564697, 1.7326741513061523, 1.7326253693389893, 1.7323636251449586, 1.7339774234771728, 1.73317182472229, 1.7338639688491821, 1.7331051165008544, 1.7340733782196045, 1.7288542190170288, 1.732238768005371, 1.7312932516860962, 1.7317837997436523, 1.7301695737075806, 1.7338779425430297, 1.7309321548461913, 1.726007070274353, 1.7297403479385376, 1.7313430319213867 ], "train_acc": [ 0.25042, 0.28976, 0.30134, 0.30602, 0.3089, 0.31554, 0.31428, 0.3196, 0.32306, 0.32846, 0.33142, 0.33322, 0.33642, 0.33992, 0.34194, 0.34438, 0.34432, 0.34526, 0.34954, 0.35184, 0.35138, 0.35452, 0.35486, 0.35792, 0.35968, 0.36406, 0.36522, 0.36342, 0.3657, 0.36458, 0.36718, 0.36438, 0.3672, 0.37022, 0.37054, 0.36724, 0.36996, 0.37222, 0.3746, 0.37048, 0.37312, 0.37208, 0.37302, 0.37558, 0.37478, 0.37606, 0.37594, 0.37622, 0.37692, 0.37654, 0.37762, 0.37828, 0.38134, 0.37722, 0.37784, 0.37886, 0.37892, 0.37816, 0.38044, 0.37908, 0.37866, 0.37992, 0.38136, 0.38112, 0.38068, 0.37866, 0.38062, 0.38226, 0.38224, 0.38394, 0.37886, 0.38148, 0.38066, 0.37898, 0.3827, 0.38146, 0.38008, 0.38496, 0.38278, 0.3828, 0.38456, 0.38362, 0.38398, 0.38284, 0.384, 0.38284, 0.38282, 0.38388, 0.38298, 0.38384, 0.3847, 0.38326, 0.38218, 0.38316, 0.38288, 0.38104, 0.3823, 0.38442, 0.38372, 0.3814 ], "test_acc": [ 0.2905, 0.3333, 0.3424, 0.3445, 0.3473, 0.357, 0.3561, 0.3439, 0.3547, 0.3514, 0.3624, 0.3717, 0.3659, 0.3715, 0.3653, 0.3669, 0.3677, 0.375, 0.3807, 0.3801, 0.3731, 0.3794, 0.3873, 0.3816, 0.3903, 0.3866, 0.3876, 0.387, 0.3915, 0.3944, 0.3878, 0.391, 0.3973, 0.3913, 0.3949, 0.4015, 0.3969, 0.3971, 0.3933, 0.3937, 0.4026, 0.3957, 0.3986, 0.3994, 0.4041, 0.4033, 0.3987, 0.4023, 0.3982, 0.4046, 0.4073, 0.4061, 0.3998, 0.4057, 0.4036, 0.4066, 0.4057, 0.4056, 0.4099, 0.4087, 0.4031, 0.4052, 0.4102, 0.4108, 0.4056, 0.4083, 0.4111, 0.4113, 0.4088, 0.4048, 0.4085, 0.4104, 0.4085, 0.4067, 0.4074, 0.406, 0.4059, 0.4112, 0.4093, 0.407, 0.4077, 0.4078, 0.4096, 0.4083, 0.4103, 0.4093, 0.4092, 0.4094, 0.4095, 0.4093, 0.41, 0.409, 0.4071, 0.4087, 0.4098, 0.4095, 0.4103, 0.4095, 0.4099, 0.4099 ] }, "diagnostics": { "bp_cosine": [ 0.024554381147027016, 0.11956729739904404, -0.05824935808777809, 0.9959120750427246 ], "perturbation_rho": [ 0.04051800072193146, 0.000565994530916214, -0.01674405112862587, 0.03625570237636566 ], "nudging": { "0.001": [ -1.0242220014333725e-06, -8.98377038538456e-07, 1.8649734556674957e-07, -3.294786438345909e-06 ], "0.003": [ -2.9887305572628975e-06, -2.6676570996642113e-06, 6.059417501091957e-07, -1.0517891496419907e-05 ], "0.01": [ -1.013989094644785e-05, -9.021139703691006e-06, 1.9457656890153885e-06, -3.530189860612154e-05 ] }, "hidden_norms_per_layer": [ 4442.23876953125, 69271.0234375, 112683.53125, 377440.78125, 101219.984375 ], "bp_grad_norms_per_layer": [ 3.0517328923451714e-05, 3.3021829040080775e-06, 1.6336410908479593e-06, 1.6025945797082386e-06, 1.6025023796828464e-06 ] }, "drift": { "embed.weight": 42.23262803830075, "embed.bias": 38.89359718847897, "blocks.0.ln.weight": 1.485857367515564, "blocks.0.w1.weight": 16.185781545723177, "blocks.0.w1.bias": 19.38631244368407, "blocks.0.w2.weight": 67.24000322735762, "blocks.1.ln.weight": 1.1729528903961182, "blocks.1.w1.weight": 16.924164447681708, "blocks.1.w1.bias": 12.398522096155984, "blocks.1.w2.weight": 66.57045868925029, "blocks.2.ln.weight": 1.1481270790100098, "blocks.2.w1.weight": 22.87352078284913, "blocks.2.w1.bias": 15.551994064272593, "blocks.2.w2.weight": 47.0174765021604, "blocks.3.ln.weight": 1.3614349365234375, "blocks.3.w1.weight": 24.802445502073887, "blocks.3.w1.bias": 20.203860687494405, "blocks.3.w2.weight": 27.95273009401102, "out_ln.weight": 0.2712816894054413, "out_head.weight": 3.4626060309461333, "out_head.bias": 5.313953466040826 } } }, "456": { "fa": { "log": { "train_loss": [ 2.064060781517029, 1.9899321492004394, 1.9583305028533935, 1.9413242259979249, 1.9259093924713135, 1.9170702835845947, 1.9052985552215576, 1.896912885131836, 1.8825988665771485, 1.8796403802490234, 1.8680178726577759, 1.866754577331543, 1.8631378329849244, 1.8581646213150025, 1.8511347687530517, 1.8506925588226317, 1.8502174087905883, 1.844791806640625, 1.8447570569229126, 1.8405440747833253, 1.8362063940048219, 1.8338028798675536, 1.8322235885238647, 1.8271099829483033, 1.8259497284698487, 1.8257087524032594, 1.8204508585357666, 1.8167411252593995, 1.8126173525619507, 1.8123734192276002, 1.8087152871322631, 1.808808218383789, 1.8022823331069946, 1.801023843383789, 1.7965255283355712, 1.7960807333755493, 1.7931187894439697, 1.7941291955947876, 1.7897003564453124, 1.7906446847534179, 1.786394164466858, 1.7862309146881103, 1.780618618774414, 1.7832628304672242, 1.7785604644012452, 1.7788331238174437, 1.7817785488510132, 1.7777097594833373, 1.7799998865509032, 1.775255680809021, 1.7771116664886475, 1.7775196334075927, 1.7734333945465088, 1.774940083694458, 1.7707776821517944, 1.7724536269378661, 1.7712063220214844, 1.769450744857788, 1.7644718740463257, 1.7703942450332641, 1.7682801098251342, 1.7650428762817383, 1.766692326889038, 1.7640820398330688, 1.7642735467147828, 1.7657033821868897, 1.7645520711517333, 1.7599635735702515, 1.7630397510528564, 1.7610415447616576, 1.7589880530548097, 1.759702002029419, 1.758202407836914, 1.7584852575683594, 1.758759799156189, 1.7612190747833252, 1.756975512008667, 1.7578368276977538, 1.752756251296997, 1.7538298551177978, 1.7545775293350219, 1.7533795291137695, 1.7553060709381103, 1.7546167678833007, 1.7510459091186523, 1.7534167892074586, 1.7509777270889282, 1.7524606351089478, 1.753954182395935, 1.7540196291732788, 1.7530623047637939, 1.754902084274292, 1.7526578115844726, 1.7541147797012329, 1.7511920746612548, 1.7532148589324952, 1.7491467144393922, 1.7507730041885377, 1.7531463625335693, 1.7500363696670531 ], "train_acc": [ 0.24014, 0.26772, 0.28264, 0.29302, 0.29948, 0.30404, 0.30992, 0.31306, 0.3199, 0.31706, 0.32588, 0.32474, 0.32728, 0.32896, 0.33068, 0.332, 0.33344, 0.3358, 0.33592, 0.33646, 0.33824, 0.34346, 0.34112, 0.3446, 0.3442, 0.34498, 0.34916, 0.35224, 0.3488, 0.35114, 0.35106, 0.35238, 0.35462, 0.35262, 0.35602, 0.35642, 0.3596, 0.35778, 0.35798, 0.35972, 0.36258, 0.36078, 0.36174, 0.36244, 0.36306, 0.3641, 0.3633, 0.361, 0.36384, 0.36622, 0.36642, 0.3651, 0.36634, 0.36576, 0.3673, 0.36726, 0.36696, 0.36972, 0.3705, 0.36848, 0.36996, 0.36794, 0.37034, 0.37048, 0.37012, 0.367, 0.37118, 0.37072, 0.37212, 0.37374, 0.37076, 0.37256, 0.37136, 0.37392, 0.37394, 0.3732, 0.37276, 0.37222, 0.37412, 0.3723, 0.37526, 0.37592, 0.37682, 0.37498, 0.37556, 0.37602, 0.3759, 0.37684, 0.37452, 0.37624, 0.3739, 0.37434, 0.37596, 0.37428, 0.37492, 0.3748, 0.37806, 0.37718, 0.37634, 0.37502 ], "test_acc": [ 0.2713, 0.3034, 0.3137, 0.3223, 0.3204, 0.3317, 0.3372, 0.3338, 0.3448, 0.3422, 0.3584, 0.3723, 0.3648, 0.363, 0.3547, 0.3679, 0.3611, 0.3653, 0.3704, 0.3666, 0.3724, 0.3691, 0.3744, 0.3743, 0.379, 0.375, 0.3703, 0.3688, 0.3839, 0.3808, 0.3808, 0.3799, 0.3901, 0.3821, 0.3861, 0.388, 0.3872, 0.3823, 0.3851, 0.3872, 0.3816, 0.3883, 0.3914, 0.3866, 0.3824, 0.3861, 0.3912, 0.3831, 0.3882, 0.39, 0.3935, 0.3951, 0.3927, 0.3947, 0.3931, 0.3904, 0.3849, 0.3965, 0.389, 0.3957, 0.3993, 0.3929, 0.3939, 0.3988, 0.3972, 0.3919, 0.3956, 0.3937, 0.3964, 0.3968, 0.3954, 0.3934, 0.3957, 0.3954, 0.3983, 0.399, 0.3964, 0.3988, 0.3968, 0.3999, 0.3998, 0.3988, 0.3981, 0.3991, 0.3994, 0.4001, 0.3957, 0.3991, 0.3996, 0.3992, 0.4004, 0.3989, 0.3985, 0.4004, 0.4008, 0.3998, 0.4001, 0.3995, 0.3999, 0.3996 ] }, "diagnostics": { "bp_cosine": [ -0.005567306652665138, 0.07410226762294769, -0.08782696723937988, 0.9968396425247192 ], "perturbation_rho": [ 0.018982190638780594, 0.020260581746697426, -0.010329723358154297, -0.0005609926301985979 ], "nudging": { "0.001": [ 1.0007061064243317e-06, -3.9103906601667404e-07, 1.1315569281578064e-07, -1.5826663002371788e-06 ], "0.003": [ 3.3027026802301407e-06, -1.0563526302576065e-06, 3.9511360228061676e-07, -5.659414455294609e-06 ], "0.01": [ 1.0776100680232048e-05, -3.261142410337925e-06, 1.505366526544094e-06, -1.979817170649767e-05 ] }, "hidden_norms_per_layer": [ 7183.7138671875, 54252.28125, 433092.46875, 853070.375, 358308.375 ], "bp_grad_norms_per_layer": [ 2.274825965287164e-05, 2.2719700609741267e-06, 1.0948514272968168e-06, 1.0902091389652924e-06, 1.0879763294724398e-06 ] }, "drift": { "embed.weight": 59.198994919141114, "embed.bias": 39.04210511940659, "blocks.0.ln.weight": 1.5643459558486938, "blocks.0.w1.weight": 17.61955302910138, "blocks.0.w1.bias": 14.864856243639734, "blocks.0.w2.weight": 72.0693062056265, "blocks.1.ln.weight": 1.3596134185791016, "blocks.1.w1.weight": 23.46545214362022, "blocks.1.w1.bias": 20.737719695924945, "blocks.1.w2.weight": 57.54218956802357, "blocks.2.ln.weight": 1.0050276517868042, "blocks.2.w1.weight": 26.292893266385775, "blocks.2.w1.bias": 30.330843617032436, "blocks.2.w2.weight": 38.29821365284518, "blocks.3.ln.weight": 1.097004771232605, "blocks.3.w1.weight": 25.15473199291234, "blocks.3.w1.bias": 27.34892428441179, "blocks.3.w2.weight": 48.94715322109553, "out_ln.weight": 0.27024972438812256, "out_head.weight": 4.837433858659456, "out_head.bias": 1.4275285869872485 } } }, "config": { "dataset": "cifar10", "d_hidden": 256, "num_blocks": 4, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 42, 123, 456 ], "gpu": 0, "output_dir": "results/fa_main_audit", "methods": [ "fa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }