{ "0": { "dfa": { "log": { "train_loss": [ 2.062894982070923, 2.042903160247803, 2.0362783416748047, 2.0289835427093506, 2.0305548177719115, 2.027372160644531, 2.0264537405395506, 2.024415637550354, 2.0239928167343137, 2.0210681298828126, 2.0223728131103518, 2.0176786605072023, 2.0183338179016115, 2.015661160888672, 2.017801855773926, 2.0157006243896483, 2.013551385803223, 2.013131450958252, 2.012682000961304, 2.0142799925231936, 2.010995005722046, 2.01094291557312, 2.010355429763794, 2.00825265914917, 2.0103073081207277, 2.0115878075790405, 2.00740104183197, 2.008656568450928, 2.007300491104126, 2.0068678036499024, 2.0060133220672607, 2.005689826889038, 2.0071374508666993, 2.0041723249053955, 2.007439960021973, 2.004801420516968, 2.007543896255493, 2.008051019935608, 2.0040309619140624, 2.002984625930786, 2.0036395249176024, 2.0038933919906614, 2.000672343521118, 2.002527554702759, 2.0040715547180175, 2.002382646026611, 2.002094281616211, 2.0012509018707276, 2.0035453020477294, 2.0021117819213865, 2.0006714540863038, 2.0024239098739622, 2.000547568016052, 2.0004410552978515, 2.000826226043701, 1.9995253698730469, 2.0001726056671143, 2.0008310513687135, 1.998274679107666, 1.9978595404052735, 1.9991289748382568, 1.9976552139663697, 1.9974908544540406, 1.9972500681304932, 1.9982564139556884, 1.9990739729309082, 1.9982671169281006, 1.9968176255035401, 1.9985010131072998, 1.997684263381958, 1.9971537530517578, 1.9961954132843018, 1.9972638996124268, 1.9965271125793458, 1.9960845895385741, 1.9970510581970216, 1.9964770040512085, 1.9966202107238769, 1.99665422416687, 1.9977766342163086, 1.9974106648254395, 1.9950730167007447, 1.9971654697418213, 1.995940417022705, 1.9962149201202393, 1.9963797412109374, 1.9944206412506102, 1.9952468407440185, 1.9964326373291015, 1.99426823387146, 1.9950427423477173, 1.9937485892105102, 1.995298335914612, 1.9937747159194947, 1.99329125541687, 1.9960021032333375, 1.9957950158309936, 1.9929876937103272, 1.994628695678711, 1.9954896281433105 ], "train_acc": [ 0.2387, 0.24782, 0.24834, 0.255, 0.2542, 0.25346, 0.2542, 0.25464, 0.25776, 0.25884, 0.25932, 0.26184, 0.26154, 0.2615, 0.26154, 0.26214, 0.26598, 0.26548, 0.26678, 0.26396, 0.2672, 0.2662, 0.26618, 0.26934, 0.2649, 0.26488, 0.26854, 0.2669, 0.26922, 0.27032, 0.2688, 0.26942, 0.26852, 0.2698, 0.2708, 0.27092, 0.27064, 0.2683, 0.27222, 0.2735, 0.27254, 0.26794, 0.27416, 0.27154, 0.2709, 0.2735, 0.27234, 0.2735, 0.2704, 0.27326, 0.27246, 0.2728, 0.27374, 0.2747, 0.27344, 0.2739, 0.2744, 0.27318, 0.27582, 0.27816, 0.27576, 0.27492, 0.27696, 0.27608, 0.27436, 0.27578, 0.27502, 0.27806, 0.274, 0.27654, 0.27598, 0.27728, 0.2783, 0.27636, 0.27394, 0.27612, 0.2788, 0.27772, 0.27614, 0.27662, 0.27458, 0.27506, 0.27614, 0.2755, 0.27668, 0.27622, 0.27808, 0.27856, 0.27796, 0.27642, 0.27808, 0.28, 0.27782, 0.27638, 0.27682, 0.2774, 0.27772, 0.27642, 0.27804, 0.27828 ], "test_acc": [ 0.2555, 0.2749, 0.2689, 0.2689, 0.2829, 0.2478, 0.2839, 0.2723, 0.2772, 0.2879, 0.2743, 0.2663, 0.2681, 0.2905, 0.2902, 0.284, 0.2788, 0.2919, 0.2851, 0.2912, 0.2889, 0.2929, 0.2868, 0.2687, 0.2855, 0.304, 0.292, 0.2903, 0.2882, 0.2887, 0.2923, 0.2995, 0.2973, 0.2915, 0.2914, 0.2869, 0.2737, 0.2922, 0.2898, 0.2812, 0.2924, 0.3001, 0.305, 0.2996, 0.2954, 0.3002, 0.2926, 0.2858, 0.3015, 0.2967, 0.2964, 0.2897, 0.3042, 0.286, 0.294, 0.2986, 0.2865, 0.3013, 0.2935, 0.2824, 0.2985, 0.2908, 0.3008, 0.2949, 0.3059, 0.289, 0.2914, 0.305, 0.2975, 0.3007, 0.3019, 0.3009, 0.2996, 0.2976, 0.2945, 0.2986, 0.3022, 0.2991, 0.2976, 0.2988, 0.2988, 0.2979, 0.2974, 0.298, 0.3014, 0.2972, 0.3003, 0.2981, 0.3005, 0.3031, 0.3026, 0.3007, 0.3004, 0.2997, 0.3016, 0.3003, 0.2993, 0.2995, 0.3002, 0.3001 ] }, "diagnostics": { "bp_cosine": [ 0.38934820890426636, -0.0007739475695416331 ], "perturbation_rho": [ -0.011460170149803162, 0.0 ], "nudging": { "0.001": [ -4.163011908531189e-07, 0.0 ], "0.003": [ -1.0598450899124146e-06, 0.0 ], "0.01": [ -3.500375896692276e-06, 0.0 ] }, "hidden_norms_per_layer": [ 52784.04296875, 1514456960.0, 4954951168.0 ], "bp_grad_norms_per_layer": [ 2.3542017402178317e-07, 3.12540243685433e-10, 3.13137349383652e-10 ] }, "drift": { "embed.weight": 333.9178900630863, "embed.bias": 277.5308018858926, "blocks.0.ln.weight": 9.301640363801488, "blocks.0.w1.weight": 311.12199748150937, "blocks.0.w1.bias": 280.3822361773791, "blocks.0.w2.weight": 500.10543177407226, "blocks.1.ln.weight": 9.416271027168449, "blocks.1.w1.weight": 397.745772813683, "blocks.1.w1.bias": 381.1405085841875, "blocks.1.w2.weight": 396.08258246162814, "out_ln.weight": 0.5525577953421494, "out_head.weight": 8.092380783169268, "out_head.bias": 3.6707232448212266 } }, "fa": { "log": { "train_loss": [ 2.074207492980957, 1.9848071645736693, 1.943194331741333, 1.915086039428711, 1.8987552841186524, 1.8773444555282592, 1.8620493222808838, 1.8454281293106078, 1.843613411216736, 1.8376456963348389, 1.8340519763946532, 1.8251803881072999, 1.8269455047607421, 1.825891435623169, 1.8311459658432008, 1.8294941538238525, 1.8284651235580445, 1.8239954425811769, 1.824907121887207, 1.826982011680603, 1.8236070413970946, 1.8217376638412475, 1.82049068069458, 1.8151681272125244, 1.8155477234649657, 1.8134433920288087, 1.806967512512207, 1.8068813376235962, 1.801505942955017, 1.8042971012115478, 1.800074999961853, 1.7939591689300538, 1.792923740272522, 1.7907480084991456, 1.7882287372589112, 1.7897650888824463, 1.7839135689926147, 1.7830314935302733, 1.7808781423187257, 1.7737779104614257, 1.7762451565933228, 1.7733127856826782, 1.7701874697875977, 1.7670377206802368, 1.7671197887802124, 1.7665505773162842, 1.7623907526016236, 1.7633579796600343, 1.7624771506500243, 1.7620069681167603, 1.7585726612091064, 1.7578929253387452, 1.7546437027740478, 1.7530586669921875, 1.7568175424575805, 1.7472540600585937, 1.7497945638656616, 1.7486419037246703, 1.7454212425994873, 1.7467387356948854, 1.742750499343872, 1.7459785363006592, 1.7462484993743896, 1.7419252165985109, 1.7439173141479491, 1.7400725153350831, 1.7417476744842528, 1.7432426296234131, 1.7410478344726563, 1.735186776046753, 1.7373164199447633, 1.7379439109039307, 1.7370698404312135, 1.7362006621932984, 1.7366024084091187, 1.734513318862915, 1.7316589307403565, 1.734174518661499, 1.7326682236480713, 1.7339326565170288, 1.734504469909668, 1.728739596824646, 1.7321637844848632, 1.7324034854125976, 1.7288938723754883, 1.7308405535888671, 1.7306951354980469, 1.7300820154190064, 1.7285541592788696, 1.7268984225845336, 1.727956399230957, 1.724655009765625, 1.7292626781845093, 1.7271040807723999, 1.7264983687973023, 1.7272509225845336, 1.7300393019104003, 1.7276934866714477, 1.7269879544067384, 1.72983638671875 ], "train_acc": [ 0.24412, 0.28062, 0.29426, 0.30988, 0.31292, 0.32326, 0.32948, 0.33612, 0.33972, 0.34158, 0.34404, 0.34674, 0.34434, 0.34662, 0.3424, 0.3445, 0.34358, 0.34696, 0.34462, 0.3454, 0.34674, 0.3471, 0.34642, 0.34934, 0.34898, 0.35068, 0.35258, 0.3542, 0.35448, 0.35074, 0.354, 0.35526, 0.35522, 0.35664, 0.36026, 0.36056, 0.36136, 0.35988, 0.3653, 0.3664, 0.36336, 0.36712, 0.36668, 0.36956, 0.36908, 0.36934, 0.3731, 0.36976, 0.36908, 0.3699, 0.37166, 0.37488, 0.3728, 0.37648, 0.37234, 0.3769, 0.3778, 0.37956, 0.37994, 0.37854, 0.3793, 0.38058, 0.3788, 0.3813, 0.3811, 0.38082, 0.3786, 0.38008, 0.37906, 0.383, 0.3824, 0.38106, 0.38238, 0.38434, 0.37922, 0.3843, 0.38626, 0.38438, 0.38332, 0.38316, 0.3814, 0.3837, 0.38628, 0.3838, 0.38572, 0.38528, 0.3855, 0.38382, 0.38534, 0.38696, 0.3866, 0.38526, 0.38498, 0.38372, 0.38534, 0.38782, 0.38812, 0.38732, 0.38564, 0.38654 ], "test_acc": [ 0.2891, 0.3185, 0.3279, 0.3405, 0.3535, 0.3324, 0.3578, 0.3568, 0.3611, 0.368, 0.3716, 0.3657, 0.3624, 0.37, 0.3642, 0.3776, 0.3742, 0.3629, 0.3623, 0.3785, 0.3689, 0.3538, 0.3593, 0.3592, 0.3713, 0.3788, 0.3722, 0.3675, 0.3747, 0.3758, 0.3671, 0.3866, 0.3809, 0.3827, 0.3781, 0.3711, 0.375, 0.3801, 0.3829, 0.3886, 0.3844, 0.3859, 0.3842, 0.3854, 0.3855, 0.3871, 0.3835, 0.3874, 0.3931, 0.3825, 0.3856, 0.3901, 0.3877, 0.3854, 0.3894, 0.3873, 0.3886, 0.3982, 0.3923, 0.3881, 0.3883, 0.3901, 0.3907, 0.3926, 0.3942, 0.3933, 0.3851, 0.3912, 0.393, 0.3928, 0.3961, 0.3907, 0.3876, 0.3881, 0.3875, 0.3885, 0.3909, 0.3893, 0.394, 0.3959, 0.3886, 0.3945, 0.3932, 0.3919, 0.3906, 0.3944, 0.3939, 0.3946, 0.3923, 0.393, 0.3929, 0.3923, 0.3915, 0.3948, 0.3934, 0.3929, 0.3932, 0.3936, 0.394, 0.3938 ] }, "diagnostics": { "bp_cosine": [ 0.017680617049336433, 0.8765696287155151 ], "perturbation_rho": [ -0.00557959359139204, 0.06313759833574295 ], "nudging": { "0.001": [ -2.048211172223091e-06, -3.955443389713764e-06 ], "0.003": [ -6.195507012307644e-06, -1.213036011904478e-05 ], "0.01": [ -2.056185621768236e-05, -4.089018329977989e-05 ] }, "hidden_norms_per_layer": [ 5668.7490234375, 427742.1875, 626308.1875 ], "bp_grad_norms_per_layer": [ 2.2485837689600885e-05, 1.0125075959876995e-06, 7.618949666721164e-07 ] }, "drift": { "embed.weight": 43.36126831717888, "embed.bias": 11.647761057592673, "blocks.0.ln.weight": 1.7734721493198804, "blocks.0.w1.weight": 28.788589686086883, "blocks.0.w1.bias": 16.981347027161885, "blocks.0.w2.weight": 61.91338151396999, "blocks.1.ln.weight": 1.2975357664484612, "blocks.1.w1.weight": 23.055782710684934, "blocks.1.w1.bias": 17.973225870539384, "blocks.1.w2.weight": 38.08861834310624, "out_ln.weight": 0.38876131505924627, "out_head.weight": 5.716507111968003, "out_head.bias": 4.553337714995325 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 0 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L2_seed0", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }