{ "0": { "dfa": { "log": { "train_loss": [ 2.0753555574798583, 2.0437081289672854, 2.031278556365967, 2.027659920578003, 2.0243590501403808, 2.0202790953826906, 2.0175082940673827, 2.015957561340332, 2.016036532974243, 2.013858056335449, 2.0126232041931154, 2.006905050048828, 2.0110664825439453, 2.0065614931488036, 2.007456555709839, 2.0070649071502684, 2.0075456425476075, 2.004424341583252, 2.005271594772339, 2.0039944921875, 2.0024667238998415, 2.000112854309082, 1.9993625988769532, 2.002483249664307, 2.0039204889678954, 1.9985878760528564, 2.0006166967010497, 2.0003138301086425, 1.9996023558807372, 1.9986100010681151, 1.99738998298645, 1.9980814916229248, 1.996693759994507, 2.0003671773529055, 1.9974340956878662, 1.9980345281982421, 1.9958612198638916, 1.9961950925445557, 1.9993210222625732, 1.9953513426971436, 1.9962950857925414, 1.9969137393951415, 1.9964947815704346, 1.9980549166870116, 1.9973483322525025, 1.9953596134185791, 1.995900859451294, 1.9963403786849976, 1.9947577867126465, 1.996345650177002, 1.9976896784210205, 1.9959460092163086, 1.9935208990478515, 1.9943153414154053, 1.9918208218765259, 1.9932028875350951, 1.9944638661956786, 1.995019360809326, 1.9929348825073243, 1.9962419706726073, 1.9949486227035522, 1.991672697906494, 1.9935600751495361, 1.9919422644424438, 1.994082801437378, 1.9919944891738892, 1.9940126430511476, 1.9923382126617433, 1.9926940571594238, 1.9947953038024901, 1.993876279335022, 1.992678325843811, 1.992137566757202, 1.9900086630630494, 1.9903694836044312, 1.9928425230407716, 1.9906801569366455, 1.9912908507919311, 1.9918341095352172, 1.9906631398773194, 1.9910551013183593, 1.9912693448257446, 1.9916500932312011, 1.992011311416626, 1.9930540170669555, 1.9900453987121582, 1.9914034769058226, 1.9921153451156617, 1.9884680337142944, 1.9897785013198852, 1.9896507069396974, 1.9915314351654052, 1.9887127932357789, 1.9907834010314942, 1.990130773010254, 1.9915763851547241, 1.9891119548797607, 1.9894035186386108, 1.9906070321273803, 1.990175763015747 ], "train_acc": [ 0.23202, 0.24612, 0.2534, 0.25296, 0.25586, 0.25736, 0.26078, 0.25968, 0.26376, 0.26194, 0.26464, 0.26644, 0.26328, 0.26692, 0.26742, 0.26744, 0.26808, 0.2689, 0.26662, 0.26898, 0.27116, 0.27066, 0.27046, 0.2737, 0.26932, 0.27098, 0.27496, 0.2742, 0.27396, 0.27362, 0.27356, 0.27542, 0.2752, 0.27348, 0.27492, 0.2737, 0.27614, 0.27596, 0.27528, 0.27582, 0.27624, 0.27556, 0.27432, 0.27686, 0.27726, 0.278, 0.27874, 0.27706, 0.27906, 0.27922, 0.27678, 0.27996, 0.27996, 0.27956, 0.27936, 0.27786, 0.27958, 0.27888, 0.2801, 0.2786, 0.28002, 0.281, 0.28102, 0.27928, 0.27852, 0.2814, 0.28026, 0.28168, 0.28254, 0.27894, 0.28102, 0.28146, 0.27998, 0.28272, 0.28324, 0.28034, 0.28126, 0.28156, 0.28228, 0.28094, 0.28084, 0.28196, 0.28344, 0.28236, 0.28084, 0.28244, 0.2821, 0.28254, 0.28398, 0.2826, 0.28278, 0.28214, 0.28376, 0.28172, 0.28234, 0.28182, 0.28146, 0.28132, 0.2826, 0.28366 ], "test_acc": [ 0.2527, 0.2731, 0.2652, 0.2735, 0.2758, 0.2862, 0.2692, 0.2901, 0.2963, 0.2897, 0.2793, 0.2945, 0.2734, 0.3044, 0.2915, 0.2965, 0.2975, 0.2951, 0.3018, 0.2954, 0.2868, 0.2943, 0.3068, 0.2639, 0.3007, 0.303, 0.3009, 0.3059, 0.3024, 0.2876, 0.2984, 0.2926, 0.3024, 0.3034, 0.2906, 0.3054, 0.2978, 0.2872, 0.3036, 0.3052, 0.2874, 0.3045, 0.3028, 0.2949, 0.2981, 0.3047, 0.3073, 0.2937, 0.3078, 0.2894, 0.3098, 0.2913, 0.2897, 0.306, 0.3075, 0.302, 0.3025, 0.2982, 0.2983, 0.31, 0.3071, 0.3013, 0.309, 0.3042, 0.3009, 0.2958, 0.3024, 0.3013, 0.3055, 0.3016, 0.3041, 0.3077, 0.3023, 0.3111, 0.308, 0.3005, 0.3051, 0.3101, 0.3103, 0.3006, 0.3025, 0.3034, 0.3043, 0.3082, 0.3011, 0.3069, 0.3051, 0.3023, 0.3033, 0.3051, 0.3041, 0.3044, 0.3029, 0.3047, 0.3047, 0.3048, 0.3056, 0.3056, 0.3053, 0.3053 ] }, "diagnostics": { "bp_cosine": [ 0.3933757543563843, -0.00033686644746921957, -0.00029227498453110456, 0.00023268867516890168, -0.00033252357388846576, -0.0006308911251835525 ], "perturbation_rho": [ -0.005786933470517397, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -4.791654646396637e-07, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.2507662177085876e-06, 0.0, 0.0, -3.725290298461914e-09, 0.0, 0.0 ], "0.01": [ -4.01865690946579e-06, 0.0, 1.862645149230957e-09, -3.725290298461914e-09, 0.0, 0.0 ] }, "hidden_norms_per_layer": [ 52006.18359375, 1299919104.0, 4471346176.0, 5541193216.0, 6115124736.0, 6220777984.0, 7776075776.0 ], "bp_grad_norms_per_layer": [ 2.7690890647136257e-07, 2.9755062302960766e-10, 2.9703242643286387e-10, 2.9693505987360425e-10, 2.969274826014612e-10, 2.96939195454371e-10, 2.9694927072831945e-10 ] }, "drift": { "embed.weight": 330.18669911453446, "embed.bias": 275.0701726252062, "blocks.0.ln.weight": 9.87127425013801, "blocks.0.w1.weight": 288.2752398777733, "blocks.0.w1.bias": 276.1693244742186, "blocks.0.w2.weight": 476.3482702241823, "blocks.1.ln.weight": 9.208131003871356, "blocks.1.w1.weight": 379.93945965650295, "blocks.1.w1.bias": 370.165908360661, "blocks.1.w2.weight": 391.3759720182112, "blocks.2.ln.weight": 9.291829925999405, "blocks.2.w1.weight": 372.47037498699524, "blocks.2.w1.bias": 340.94957924841253, "blocks.2.w2.weight": 343.62414266271355, "blocks.3.ln.weight": 9.704848817987399, "blocks.3.w1.weight": 334.76567440579134, "blocks.3.w1.bias": 307.03384934243365, "blocks.3.w2.weight": 310.86785550010995, "blocks.4.ln.weight": 6.86934636896043, "blocks.4.w1.weight": 263.30065941816594, "blocks.4.w1.bias": 243.63618296008045, "blocks.4.w2.weight": 243.60310044137827, "blocks.5.ln.weight": 10.060319390509356, "blocks.5.w1.weight": 402.62899842011797, "blocks.5.w1.bias": 374.4871410963097, "blocks.5.w2.weight": 379.02482222844293, "out_ln.weight": 0.614063493216844, "out_head.weight": 8.991195841592733, "out_head.bias": 0.8181543795651063 } }, "fa": { "log": { "train_loss": [ 2.0268119436264036, 1.9347526413726808, 1.9036040418243407, 1.8875383782958985, 1.8758800409317016, 1.8637015169525146, 1.8550788135147094, 1.8481883679580688, 1.8380642176055908, 1.831563844680786, 1.82749318901062, 1.814368692855835, 1.817901651649475, 1.8037349676895142, 1.8005951739883423, 1.7895659107208253, 1.7900659426879884, 1.781074461402893, 1.7845501969146729, 1.776343214149475, 1.7684208422470094, 1.7643969812774658, 1.7617348025894164, 1.7578030713653565, 1.7565854375457763, 1.7562964432525634, 1.7528118307113647, 1.7484837558364867, 1.743814429550171, 1.7366932116699219, 1.7326225136566162, 1.728937064590454, 1.7266727477645873, 1.7240253580474854, 1.7245794469833373, 1.7228408333969116, 1.7203827739715576, 1.711478896446228, 1.7089925986099244, 1.7088872208023071, 1.7068994373321533, 1.7094496100234986, 1.7018463577270508, 1.7043216220855713, 1.6993152593231202, 1.6993111734771729, 1.6920886862182618, 1.6940990381622314, 1.6973865487670898, 1.693602544631958, 1.6929154531478883, 1.6890407666397094, 1.685359003982544, 1.684633869857788, 1.6784778961181641, 1.6846174112701415, 1.6849634936904907, 1.6800030670928956, 1.6778543420410157, 1.6783534344482423, 1.6748548553848266, 1.675967246170044, 1.674832339515686, 1.6731126987075806, 1.6737006020355225, 1.670804006958008, 1.6716182923126222, 1.6689927773284912, 1.6716524493026734, 1.6704032614517212, 1.6676370931625366, 1.6686026779174805, 1.6649452212142943, 1.6682810161972046, 1.6657524144744873, 1.666575444908142, 1.6638936541748046, 1.6632415933609008, 1.6630835901641845, 1.6650469580078124, 1.661507155380249, 1.6635552446746826, 1.6633718565368651, 1.6654531225204467, 1.660396284713745, 1.6597816809463501, 1.6641134811019898, 1.6597988692855834, 1.6597074938583374, 1.6637430121612549, 1.657964035987854, 1.6597277429580688, 1.65512205078125, 1.66050142578125, 1.6606662057495116, 1.6582156159210204, 1.657457571105957, 1.6597890829086304, 1.6602586605834961, 1.6589343154525757 ], "train_acc": [ 0.2612, 0.30246, 0.31784, 0.3241, 0.32576, 0.33054, 0.33502, 0.33912, 0.34148, 0.34222, 0.34698, 0.34792, 0.34712, 0.35504, 0.35516, 0.35796, 0.35952, 0.36286, 0.36188, 0.36396, 0.36778, 0.36878, 0.3676, 0.36954, 0.37154, 0.36936, 0.37584, 0.3732, 0.37446, 0.37702, 0.37832, 0.38196, 0.37868, 0.3824, 0.38276, 0.38352, 0.38208, 0.3852, 0.3863, 0.38682, 0.38838, 0.38784, 0.3886, 0.38966, 0.38966, 0.39112, 0.39534, 0.39184, 0.39354, 0.39498, 0.39364, 0.39514, 0.3952, 0.39942, 0.40118, 0.39886, 0.3962, 0.39814, 0.39946, 0.40066, 0.39902, 0.40112, 0.40356, 0.40358, 0.40162, 0.40426, 0.40428, 0.4024, 0.40284, 0.40386, 0.4073, 0.4049, 0.40354, 0.40386, 0.40588, 0.4046, 0.40704, 0.40718, 0.40888, 0.405, 0.41078, 0.40724, 0.40814, 0.40858, 0.40918, 0.40666, 0.40436, 0.41216, 0.40734, 0.40822, 0.40996, 0.40958, 0.411, 0.40964, 0.40704, 0.40942, 0.41122, 0.40922, 0.40942, 0.40982 ], "test_acc": [ 0.3205, 0.3401, 0.3549, 0.3534, 0.3599, 0.3678, 0.3633, 0.3657, 0.3754, 0.3736, 0.3895, 0.3818, 0.3742, 0.3765, 0.383, 0.3823, 0.3883, 0.4012, 0.3985, 0.3927, 0.3954, 0.3928, 0.3965, 0.3899, 0.4035, 0.4001, 0.4034, 0.4104, 0.4022, 0.4106, 0.3951, 0.4038, 0.4094, 0.4181, 0.4124, 0.4094, 0.4171, 0.417, 0.4163, 0.418, 0.4157, 0.4251, 0.4269, 0.4201, 0.4151, 0.4222, 0.4264, 0.4171, 0.4209, 0.4171, 0.4187, 0.4239, 0.4214, 0.4154, 0.4241, 0.4166, 0.424, 0.4208, 0.4265, 0.427, 0.4223, 0.4248, 0.4301, 0.4312, 0.4273, 0.4313, 0.4304, 0.4296, 0.426, 0.4255, 0.4306, 0.4314, 0.4315, 0.4326, 0.4331, 0.432, 0.432, 0.4294, 0.4335, 0.433, 0.437, 0.4319, 0.4304, 0.4327, 0.4321, 0.4319, 0.4333, 0.4357, 0.4315, 0.4337, 0.434, 0.4346, 0.4342, 0.4334, 0.4336, 0.4328, 0.434, 0.4344, 0.434, 0.434 ] }, "diagnostics": { "bp_cosine": [ 0.020984500646591187, 0.06538723409175873, -0.02862982451915741, -0.14415404200553894, -0.12824469804763794, 0.9942382574081421 ], "perturbation_rho": [ 0.04626474529504776, 0.00916149839758873, 0.02606651559472084, -0.0706678107380867, 0.0447549931704998, -0.07931974530220032 ], "nudging": { "0.001": [ -2.3448956198990345e-06, -6.940681487321854e-07, 9.400537237524986e-08, 4.384201020002365e-07, 2.918532118201256e-07, -2.525397576391697e-06 ], "0.003": [ -7.02321995049715e-06, -2.0685838535428047e-06, 3.417953848838806e-07, 1.5673576854169369e-06, 1.2195087037980556e-06, -9.568408131599426e-06 ], "0.01": [ -2.358935307711363e-05, -7.018155883997679e-06, 9.208451956510544e-07, 4.6023051254451275e-06, 4.1344319470226765e-06, -3.3148215152323246e-05 ] }, "hidden_norms_per_layer": [ 3922.13720703125, 49122.51171875, 264047.5, 465089.875, 831614.3125, 1037417.9375, 282876.625 ], "bp_grad_norms_per_layer": [ 3.9657443267060444e-05, 4.083395651832689e-06, 1.3594802794614225e-06, 1.2777863958035596e-06, 1.2765268593284418e-06, 1.2795584325431264e-06, 1.2760270919898176e-06 ] }, "drift": { "embed.weight": 31.47039846350604, "embed.bias": 18.02217544364072, "blocks.0.ln.weight": 0.9789876040215849, "blocks.0.w1.weight": 13.428105491977634, "blocks.0.w1.bias": 11.014509469722494, "blocks.0.w2.weight": 44.375832792200086, "blocks.1.ln.weight": 0.9256838094480255, "blocks.1.w1.weight": 16.049693958454462, "blocks.1.w1.bias": 12.671067703031834, "blocks.1.w2.weight": 46.940642430560914, "blocks.2.ln.weight": 0.768237594938939, "blocks.2.w1.weight": 16.878210463024953, "blocks.2.w1.bias": 14.246556953188842, "blocks.2.w2.weight": 45.47089120587146, "blocks.3.ln.weight": 0.6449156612044069, "blocks.3.w1.weight": 17.300866761556396, "blocks.3.w1.bias": 17.793175424183687, "blocks.3.w2.weight": 34.146538375073234, "blocks.4.ln.weight": 0.536074289047981, "blocks.4.w1.weight": 15.870552255415648, "blocks.4.w1.bias": 17.679587984495768, "blocks.4.w2.weight": 27.222411899497516, "blocks.5.ln.weight": 0.5977975068115631, "blocks.5.w1.weight": 18.813068681696937, "blocks.5.w1.bias": 22.173876530236612, "blocks.5.w2.weight": 27.925157214653215, "out_ln.weight": 0.29706709348499905, "out_head.weight": 4.788666797102501, "out_head.bias": 2.266760510860064 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 6, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 0 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L6_seed0", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }