{ "8": { "dfa": { "log": { "train_loss": [ 2.0461414054870604, 2.028953609237671, 2.0224830960845948, 2.0189640741348267, 2.0186043047332762, 2.011939255371094, 2.00884051902771, 2.006375752105713, 2.0061196725463866, 2.0044810569763185, 2.000473762359619, 1.999425143661499, 1.9991976582336426, 1.9983828188323975, 1.9999516902160646, 2.000131714401245, 2.000538674583435, 1.999087513999939, 1.9965772060394287, 1.9952695233154296, 1.9958783276367187, 1.9935351610565186, 1.9946063667297362, 1.9927719008636475, 1.9930043865203857, 1.992498685836792, 1.9923327257537842, 1.9919360898208618, 1.9922407612609863, 1.992235760192871, 1.992523240623474, 1.9913750788116455, 1.9934618493652343, 1.9923072975921632, 1.991889149017334, 1.9904881185913086, 1.9916703072357178, 1.9886171953582763, 1.9906551904296874, 1.9912475842285156, 1.9906490882873535, 1.9897464477920532, 1.9902090267562866, 1.98889538230896, 1.9899030431365967, 1.9914473651885987, 1.987290951499939, 1.9882332851409912, 1.987876655883789, 1.986627554321289, 1.9874235430526734, 1.985631577758789, 1.9859224739074708, 1.984819174156189, 1.9877312922668458, 1.9880256802749634, 1.9883026748657227, 1.9880133050918578, 1.9872900528717041, 1.9861614239501952, 1.9879061701202392, 1.986334129486084, 1.9889874462509156, 1.9848816363143922, 1.985108938598633, 1.9852813848114013, 1.9847304062652589, 1.9842171102142334, 1.986599141769409, 1.9858817081451416, 1.9852649099349975, 1.982235690460205, 1.9838326638793946, 1.9827596533966065, 1.9836663906097411, 1.9844815605163575, 1.9842618350982666, 1.984488549156189, 1.9830066680908203, 1.9835596384048462, 1.9822921755981446, 1.9845924890899658, 1.9827096743392945, 1.9821208544158935, 1.983244455909729, 1.9823134091567993, 1.9837292085266114, 1.9827219149017334, 1.9828275063323975, 1.9811715400695802, 1.9821106326675415, 1.9830516720199585, 1.9831754531097412, 1.9825017529296876, 1.9844729486465453, 1.9823845765686035, 1.9825008573913574, 1.9817371285247802, 1.9809684440612794, 1.981824859008789 ], "train_acc": [ 0.24566, 0.25216, 0.25672, 0.2583, 0.25908, 0.2611, 0.26292, 0.26504, 0.26436, 0.26372, 0.26838, 0.2684, 0.26774, 0.26886, 0.26864, 0.26928, 0.26802, 0.26984, 0.27068, 0.27056, 0.27002, 0.27018, 0.27034, 0.27138, 0.27238, 0.27266, 0.27208, 0.27464, 0.27406, 0.27306, 0.27278, 0.27354, 0.27164, 0.27506, 0.27494, 0.27682, 0.27244, 0.2749, 0.27302, 0.2745, 0.2736, 0.27382, 0.27478, 0.27344, 0.27582, 0.2732, 0.27662, 0.27616, 0.2763, 0.27742, 0.27642, 0.27984, 0.2777, 0.28112, 0.27754, 0.27344, 0.2769, 0.27664, 0.27734, 0.27754, 0.27784, 0.27642, 0.27598, 0.2796, 0.27964, 0.27868, 0.27864, 0.27868, 0.27826, 0.27986, 0.27616, 0.2817, 0.28024, 0.27688, 0.28002, 0.27942, 0.27838, 0.2787, 0.27856, 0.28034, 0.27972, 0.27722, 0.27992, 0.28172, 0.27796, 0.2775, 0.28122, 0.2803, 0.27958, 0.27936, 0.28062, 0.2791, 0.2797, 0.28202, 0.27898, 0.27894, 0.27866, 0.27832, 0.28, 0.28114 ], "test_acc": [ 0.2641, 0.2447, 0.2423, 0.2586, 0.2666, 0.2868, 0.2779, 0.27, 0.2886, 0.2704, 0.2846, 0.2825, 0.2801, 0.2912, 0.277, 0.2834, 0.2838, 0.2802, 0.2793, 0.2883, 0.2871, 0.2825, 0.288, 0.2913, 0.2813, 0.2931, 0.2994, 0.3001, 0.2753, 0.2966, 0.2996, 0.2965, 0.2835, 0.3002, 0.2979, 0.2783, 0.3017, 0.2848, 0.2846, 0.2928, 0.2956, 0.2705, 0.2811, 0.292, 0.2763, 0.2834, 0.2837, 0.2949, 0.2998, 0.2894, 0.2853, 0.2921, 0.2986, 0.2918, 0.2933, 0.28, 0.2988, 0.2925, 0.2828, 0.2875, 0.2985, 0.2927, 0.2922, 0.3016, 0.2947, 0.2952, 0.2936, 0.2923, 0.2992, 0.2968, 0.2915, 0.2992, 0.2941, 0.2969, 0.2936, 0.2972, 0.2964, 0.2928, 0.2958, 0.2973, 0.2958, 0.2971, 0.2983, 0.2983, 0.2951, 0.2963, 0.2953, 0.2964, 0.2963, 0.293, 0.2951, 0.2967, 0.2967, 0.297, 0.2966, 0.2967, 0.2967, 0.2966, 0.2966, 0.2967 ] }, "diagnostics": { "bp_cosine": [ 0.3839848041534424, -0.0006596383173018694 ], "perturbation_rho": [ 0.02412901259958744, 0.0 ], "nudging": { "0.001": [ -4.284083843231201e-07, 0.0 ], "0.003": [ -1.3029202818870544e-06, 0.0 ], "0.01": [ -4.258938133716583e-06, 0.0 ] }, "hidden_norms_per_layer": [ 53606.07421875, 782741952.0, 4561426432.0 ], "bp_grad_norms_per_layer": [ 3.0959373020778003e-07, 3.211692578553027e-10, 3.2110258896267396e-10 ] }, "drift": { "embed.weight": 322.14716880304843, "embed.bias": 253.7663922411994, "blocks.0.ln.weight": 9.639264948834146, "blocks.0.w1.weight": 278.73838749620353, "blocks.0.w1.bias": 250.4325839565606, "blocks.0.w2.weight": 488.7145731499842, "blocks.1.ln.weight": 9.351844341907716, "blocks.1.w1.weight": 376.1230199590697, "blocks.1.w1.bias": 376.4920228948829, "blocks.1.w2.weight": 403.36194320458816, "out_ln.weight": 0.513534701987637, "out_head.weight": 7.742896807554914, "out_head.bias": 1.1408249446090957 } }, "fa": { "log": { "train_loss": [ 2.0653204177856446, 1.9681754495239259, 1.9207439241790771, 1.8943786935806275, 1.8802625274276734, 1.8628883916473389, 1.8490794301605225, 1.8400364615249634, 1.8355530837249756, 1.8266534114837647, 1.8170614450454712, 1.8170341843414306, 1.809728816757202, 1.80435710231781, 1.8044258756256104, 1.7987670265960694, 1.7999644842147826, 1.7953315704345703, 1.7825802756118774, 1.7845099126434327, 1.7779603283691405, 1.7730702184677125, 1.7695367748260498, 1.7647147689056397, 1.7608037928009033, 1.7535330474090576, 1.75540680393219, 1.7487119026947022, 1.7451758492279053, 1.745663233718872, 1.7409377331924438, 1.7372819427871704, 1.7388353146743774, 1.7410107398605346, 1.7357459603881835, 1.7290400104522705, 1.7318879638290405, 1.729545888900757, 1.7291300962066651, 1.733487999343872, 1.7302352466583253, 1.7331863732147217, 1.7339300806045532, 1.7359314554595948, 1.7347373684310914, 1.7375746230316162, 1.7313235457611085, 1.7353338851165772, 1.73820286403656, 1.7340232833862306, 1.7341221398925781, 1.7339955667114257, 1.7339833393096924, 1.7300079647064208, 1.7303287143707275, 1.7298947993469238, 1.7274299069213868, 1.7319763919067384, 1.7264507590103149, 1.7299312719726563, 1.7262817291641235, 1.7270497384262085, 1.7246126723098756, 1.7255360033798217, 1.7196656997680664, 1.7214281465911865, 1.7198693132781981, 1.7217327685546875, 1.7179188094329834, 1.7154542624664306, 1.7195643279266357, 1.7149108078384399, 1.7153279098510743, 1.7153327802276612, 1.7094103066253663, 1.7162176602554322, 1.7122739435195924, 1.7128758419418335, 1.708295757408142, 1.7086283514785767, 1.7106998838043213, 1.711903858909607, 1.7090504042434693, 1.7111234002304077, 1.7090101749420166, 1.7079448748779298, 1.707335115890503, 1.7080174974822997, 1.705443286972046, 1.7056840801239013, 1.708050958175659, 1.7072754711151124, 1.7059114752960205, 1.7063753726959228, 1.7061457764434815, 1.7009761544418336, 1.707751445274353, 1.7066948248291016, 1.7041513320922852, 1.7030947677612305 ], "train_acc": [ 0.24824, 0.29, 0.30804, 0.32064, 0.32604, 0.33114, 0.33818, 0.3373, 0.34064, 0.3462, 0.34982, 0.34634, 0.35334, 0.35346, 0.35488, 0.3554, 0.35676, 0.35738, 0.36206, 0.36144, 0.36364, 0.3671, 0.36916, 0.3698, 0.37032, 0.3709, 0.37188, 0.3757, 0.37546, 0.37376, 0.37888, 0.37908, 0.37828, 0.37822, 0.37984, 0.3791, 0.38144, 0.38286, 0.37966, 0.3797, 0.38152, 0.38084, 0.3812, 0.3809, 0.38156, 0.382, 0.38494, 0.38258, 0.38066, 0.3824, 0.38058, 0.38342, 0.3823, 0.38198, 0.38534, 0.38368, 0.38524, 0.38594, 0.38536, 0.38514, 0.38676, 0.38838, 0.38778, 0.38664, 0.39118, 0.38748, 0.39154, 0.3882, 0.38852, 0.39078, 0.38918, 0.39202, 0.39086, 0.39128, 0.39242, 0.3935, 0.39422, 0.39322, 0.39388, 0.39516, 0.39496, 0.39414, 0.39428, 0.39522, 0.39426, 0.3953, 0.39628, 0.39662, 0.39662, 0.39608, 0.39646, 0.39568, 0.39606, 0.39558, 0.3961, 0.3992, 0.39438, 0.39786, 0.39626, 0.39922 ], "test_acc": [ 0.297, 0.3142, 0.3407, 0.3409, 0.3537, 0.3628, 0.3482, 0.3626, 0.3557, 0.351, 0.3614, 0.3693, 0.363, 0.3681, 0.374, 0.3756, 0.3778, 0.3795, 0.3757, 0.3742, 0.3801, 0.3732, 0.3782, 0.3805, 0.3718, 0.3786, 0.3914, 0.3924, 0.3797, 0.3967, 0.3891, 0.3829, 0.3811, 0.3967, 0.3876, 0.3862, 0.3945, 0.3851, 0.3807, 0.3871, 0.3924, 0.3941, 0.3823, 0.392, 0.3942, 0.3908, 0.3979, 0.3954, 0.4003, 0.401, 0.3938, 0.3938, 0.3997, 0.3943, 0.4069, 0.4012, 0.4056, 0.408, 0.4037, 0.3996, 0.4115, 0.4098, 0.4062, 0.4083, 0.4115, 0.4094, 0.4147, 0.4109, 0.4101, 0.4084, 0.4112, 0.4114, 0.4127, 0.4113, 0.407, 0.4126, 0.4167, 0.4132, 0.4156, 0.4138, 0.4122, 0.4128, 0.417, 0.4138, 0.4128, 0.4136, 0.4137, 0.4132, 0.4153, 0.4136, 0.4123, 0.413, 0.4134, 0.4142, 0.4155, 0.4155, 0.4142, 0.4147, 0.4149, 0.4146 ] }, "diagnostics": { "bp_cosine": [ 0.02496020682156086, 0.9624444246292114 ], "perturbation_rho": [ -0.018970193341374397, 0.1267668902873993 ], "nudging": { "0.001": [ -2.1758460206910968e-06, -7.471287972293794e-06 ], "0.003": [ -6.601490895263851e-06, -2.2840846213512123e-05 ], "0.01": [ -2.1907704649493098e-05, -7.614441710757092e-05 ] }, "hidden_norms_per_layer": [ 6420.08984375, 205601.1875, 92651.546875 ], "bp_grad_norms_per_layer": [ 2.9750526664429344e-05, 2.456108632031828e-06, 2.075838210657821e-06 ] }, "drift": { "embed.weight": 37.110060620728056, "embed.bias": 24.00213600327038, "blocks.0.ln.weight": 1.3952106680756078, "blocks.0.w1.weight": 19.29938322080228, "blocks.0.w1.bias": 17.715456046599957, "blocks.0.w2.weight": 54.87838247174745, "blocks.1.ln.weight": 1.0669201771550085, "blocks.1.w1.weight": 18.224214324200183, "blocks.1.w1.bias": 17.474148202150594, "blocks.1.w2.weight": 31.754151778532563, "out_ln.weight": 0.42931707858608786, "out_head.weight": 4.036471355678216, "out_head.bias": 7.088871139191845 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 8 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L2_seed8", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }