diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed0/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed0/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed0/results_cifar10.json b/results/fa_dfa_d512_L2_seed0/results_cifar10.json new file mode 100644 index 0000000..7d68e48 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed0/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "0": { + "dfa": { + "log": { + "train_loss": [ + 2.062894982070923, + 2.042903160247803, + 2.0362783416748047, + 2.0289835427093506, + 2.0305548177719115, + 2.027372160644531, + 2.0264537405395506, + 2.024415637550354, + 2.0239928167343137, + 2.0210681298828126, + 2.0223728131103518, + 2.0176786605072023, + 2.0183338179016115, + 2.015661160888672, + 2.017801855773926, + 2.0157006243896483, + 2.013551385803223, + 2.013131450958252, + 2.012682000961304, + 2.0142799925231936, + 2.010995005722046, + 2.01094291557312, + 2.010355429763794, + 2.00825265914917, + 2.0103073081207277, + 2.0115878075790405, + 2.00740104183197, + 2.008656568450928, + 2.007300491104126, + 2.0068678036499024, + 2.0060133220672607, + 2.005689826889038, + 2.0071374508666993, + 2.0041723249053955, + 2.007439960021973, + 2.004801420516968, + 2.007543896255493, + 2.008051019935608, + 2.0040309619140624, + 2.002984625930786, + 2.0036395249176024, + 2.0038933919906614, + 2.000672343521118, + 2.002527554702759, + 2.0040715547180175, + 2.002382646026611, + 2.002094281616211, + 2.0012509018707276, + 2.0035453020477294, + 2.0021117819213865, + 2.0006714540863038, + 2.0024239098739622, + 2.000547568016052, + 2.0004410552978515, + 2.000826226043701, + 1.9995253698730469, + 2.0001726056671143, + 2.0008310513687135, + 1.998274679107666, + 1.9978595404052735, + 1.9991289748382568, + 1.9976552139663697, + 1.9974908544540406, + 1.9972500681304932, + 1.9982564139556884, + 1.9990739729309082, + 1.9982671169281006, + 1.9968176255035401, + 1.9985010131072998, + 1.997684263381958, + 1.9971537530517578, + 1.9961954132843018, + 1.9972638996124268, + 1.9965271125793458, + 1.9960845895385741, + 1.9970510581970216, + 1.9964770040512085, + 1.9966202107238769, + 1.99665422416687, + 1.9977766342163086, + 1.9974106648254395, + 1.9950730167007447, + 1.9971654697418213, + 1.995940417022705, + 1.9962149201202393, + 1.9963797412109374, + 1.9944206412506102, + 1.9952468407440185, + 1.9964326373291015, + 1.99426823387146, + 1.9950427423477173, + 1.9937485892105102, + 1.995298335914612, + 1.9937747159194947, + 1.99329125541687, + 1.9960021032333375, + 1.9957950158309936, + 1.9929876937103272, + 1.994628695678711, + 1.9954896281433105 + ], + "train_acc": [ + 0.2387, + 0.24782, + 0.24834, + 0.255, + 0.2542, + 0.25346, + 0.2542, + 0.25464, + 0.25776, + 0.25884, + 0.25932, + 0.26184, + 0.26154, + 0.2615, + 0.26154, + 0.26214, + 0.26598, + 0.26548, + 0.26678, + 0.26396, + 0.2672, + 0.2662, + 0.26618, + 0.26934, + 0.2649, + 0.26488, + 0.26854, + 0.2669, + 0.26922, + 0.27032, + 0.2688, + 0.26942, + 0.26852, + 0.2698, + 0.2708, + 0.27092, + 0.27064, + 0.2683, + 0.27222, + 0.2735, + 0.27254, + 0.26794, + 0.27416, + 0.27154, + 0.2709, + 0.2735, + 0.27234, + 0.2735, + 0.2704, + 0.27326, + 0.27246, + 0.2728, + 0.27374, + 0.2747, + 0.27344, + 0.2739, + 0.2744, + 0.27318, + 0.27582, + 0.27816, + 0.27576, + 0.27492, + 0.27696, + 0.27608, + 0.27436, + 0.27578, + 0.27502, + 0.27806, + 0.274, + 0.27654, + 0.27598, + 0.27728, + 0.2783, + 0.27636, + 0.27394, + 0.27612, + 0.2788, + 0.27772, + 0.27614, + 0.27662, + 0.27458, + 0.27506, + 0.27614, + 0.2755, + 0.27668, + 0.27622, + 0.27808, + 0.27856, + 0.27796, + 0.27642, + 0.27808, + 0.28, + 0.27782, + 0.27638, + 0.27682, + 0.2774, + 0.27772, + 0.27642, + 0.27804, + 0.27828 + ], + "test_acc": [ + 0.2555, + 0.2749, + 0.2689, + 0.2689, + 0.2829, + 0.2478, + 0.2839, + 0.2723, + 0.2772, + 0.2879, + 0.2743, + 0.2663, + 0.2681, + 0.2905, + 0.2902, + 0.284, + 0.2788, + 0.2919, + 0.2851, + 0.2912, + 0.2889, + 0.2929, + 0.2868, + 0.2687, + 0.2855, + 0.304, + 0.292, + 0.2903, + 0.2882, + 0.2887, + 0.2923, + 0.2995, + 0.2973, + 0.2915, + 0.2914, + 0.2869, + 0.2737, + 0.2922, + 0.2898, + 0.2812, + 0.2924, + 0.3001, + 0.305, + 0.2996, + 0.2954, + 0.3002, + 0.2926, + 0.2858, + 0.3015, + 0.2967, + 0.2964, + 0.2897, + 0.3042, + 0.286, + 0.294, + 0.2986, + 0.2865, + 0.3013, + 0.2935, + 0.2824, + 0.2985, + 0.2908, + 0.3008, + 0.2949, + 0.3059, + 0.289, + 0.2914, + 0.305, + 0.2975, + 0.3007, + 0.3019, + 0.3009, + 0.2996, + 0.2976, + 0.2945, + 0.2986, + 0.3022, + 0.2991, + 0.2976, + 0.2988, + 0.2988, + 0.2979, + 0.2974, + 0.298, + 0.3014, + 0.2972, + 0.3003, + 0.2981, + 0.3005, + 0.3031, + 0.3026, + 0.3007, + 0.3004, + 0.2997, + 0.3016, + 0.3003, + 0.2993, + 0.2995, + 0.3002, + 0.3001 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.38934820890426636, + -0.0007739475695416331 + ], + "perturbation_rho": [ + -0.011460170149803162, + 0.0 + ], + "nudging": { + "0.001": [ + -4.163011908531189e-07, + 0.0 + ], + "0.003": [ + -1.0598450899124146e-06, + 0.0 + ], + "0.01": [ + -3.500375896692276e-06, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 52784.04296875, + 1514456960.0, + 4954951168.0 + ], + "bp_grad_norms_per_layer": [ + 2.3542017402178317e-07, + 3.12540243685433e-10, + 3.13137349383652e-10 + ] + }, + "drift": { + "embed.weight": 333.9178900630863, + "embed.bias": 277.5308018858926, + "blocks.0.ln.weight": 9.301640363801488, + "blocks.0.w1.weight": 311.12199748150937, + "blocks.0.w1.bias": 280.3822361773791, + "blocks.0.w2.weight": 500.10543177407226, + "blocks.1.ln.weight": 9.416271027168449, + "blocks.1.w1.weight": 397.745772813683, + "blocks.1.w1.bias": 381.1405085841875, + "blocks.1.w2.weight": 396.08258246162814, + "out_ln.weight": 0.5525577953421494, + "out_head.weight": 8.092380783169268, + "out_head.bias": 3.6707232448212266 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.074207492980957, + 1.9848071645736693, + 1.943194331741333, + 1.915086039428711, + 1.8987552841186524, + 1.8773444555282592, + 1.8620493222808838, + 1.8454281293106078, + 1.843613411216736, + 1.8376456963348389, + 1.8340519763946532, + 1.8251803881072999, + 1.8269455047607421, + 1.825891435623169, + 1.8311459658432008, + 1.8294941538238525, + 1.8284651235580445, + 1.8239954425811769, + 1.824907121887207, + 1.826982011680603, + 1.8236070413970946, + 1.8217376638412475, + 1.82049068069458, + 1.8151681272125244, + 1.8155477234649657, + 1.8134433920288087, + 1.806967512512207, + 1.8068813376235962, + 1.801505942955017, + 1.8042971012115478, + 1.800074999961853, + 1.7939591689300538, + 1.792923740272522, + 1.7907480084991456, + 1.7882287372589112, + 1.7897650888824463, + 1.7839135689926147, + 1.7830314935302733, + 1.7808781423187257, + 1.7737779104614257, + 1.7762451565933228, + 1.7733127856826782, + 1.7701874697875977, + 1.7670377206802368, + 1.7671197887802124, + 1.7665505773162842, + 1.7623907526016236, + 1.7633579796600343, + 1.7624771506500243, + 1.7620069681167603, + 1.7585726612091064, + 1.7578929253387452, + 1.7546437027740478, + 1.7530586669921875, + 1.7568175424575805, + 1.7472540600585937, + 1.7497945638656616, + 1.7486419037246703, + 1.7454212425994873, + 1.7467387356948854, + 1.742750499343872, + 1.7459785363006592, + 1.7462484993743896, + 1.7419252165985109, + 1.7439173141479491, + 1.7400725153350831, + 1.7417476744842528, + 1.7432426296234131, + 1.7410478344726563, + 1.735186776046753, + 1.7373164199447633, + 1.7379439109039307, + 1.7370698404312135, + 1.7362006621932984, + 1.7366024084091187, + 1.734513318862915, + 1.7316589307403565, + 1.734174518661499, + 1.7326682236480713, + 1.7339326565170288, + 1.734504469909668, + 1.728739596824646, + 1.7321637844848632, + 1.7324034854125976, + 1.7288938723754883, + 1.7308405535888671, + 1.7306951354980469, + 1.7300820154190064, + 1.7285541592788696, + 1.7268984225845336, + 1.727956399230957, + 1.724655009765625, + 1.7292626781845093, + 1.7271040807723999, + 1.7264983687973023, + 1.7272509225845336, + 1.7300393019104003, + 1.7276934866714477, + 1.7269879544067384, + 1.72983638671875 + ], + "train_acc": [ + 0.24412, + 0.28062, + 0.29426, + 0.30988, + 0.31292, + 0.32326, + 0.32948, + 0.33612, + 0.33972, + 0.34158, + 0.34404, + 0.34674, + 0.34434, + 0.34662, + 0.3424, + 0.3445, + 0.34358, + 0.34696, + 0.34462, + 0.3454, + 0.34674, + 0.3471, + 0.34642, + 0.34934, + 0.34898, + 0.35068, + 0.35258, + 0.3542, + 0.35448, + 0.35074, + 0.354, + 0.35526, + 0.35522, + 0.35664, + 0.36026, + 0.36056, + 0.36136, + 0.35988, + 0.3653, + 0.3664, + 0.36336, + 0.36712, + 0.36668, + 0.36956, + 0.36908, + 0.36934, + 0.3731, + 0.36976, + 0.36908, + 0.3699, + 0.37166, + 0.37488, + 0.3728, + 0.37648, + 0.37234, + 0.3769, + 0.3778, + 0.37956, + 0.37994, + 0.37854, + 0.3793, + 0.38058, + 0.3788, + 0.3813, + 0.3811, + 0.38082, + 0.3786, + 0.38008, + 0.37906, + 0.383, + 0.3824, + 0.38106, + 0.38238, + 0.38434, + 0.37922, + 0.3843, + 0.38626, + 0.38438, + 0.38332, + 0.38316, + 0.3814, + 0.3837, + 0.38628, + 0.3838, + 0.38572, + 0.38528, + 0.3855, + 0.38382, + 0.38534, + 0.38696, + 0.3866, + 0.38526, + 0.38498, + 0.38372, + 0.38534, + 0.38782, + 0.38812, + 0.38732, + 0.38564, + 0.38654 + ], + "test_acc": [ + 0.2891, + 0.3185, + 0.3279, + 0.3405, + 0.3535, + 0.3324, + 0.3578, + 0.3568, + 0.3611, + 0.368, + 0.3716, + 0.3657, + 0.3624, + 0.37, + 0.3642, + 0.3776, + 0.3742, + 0.3629, + 0.3623, + 0.3785, + 0.3689, + 0.3538, + 0.3593, + 0.3592, + 0.3713, + 0.3788, + 0.3722, + 0.3675, + 0.3747, + 0.3758, + 0.3671, + 0.3866, + 0.3809, + 0.3827, + 0.3781, + 0.3711, + 0.375, + 0.3801, + 0.3829, + 0.3886, + 0.3844, + 0.3859, + 0.3842, + 0.3854, + 0.3855, + 0.3871, + 0.3835, + 0.3874, + 0.3931, + 0.3825, + 0.3856, + 0.3901, + 0.3877, + 0.3854, + 0.3894, + 0.3873, + 0.3886, + 0.3982, + 0.3923, + 0.3881, + 0.3883, + 0.3901, + 0.3907, + 0.3926, + 0.3942, + 0.3933, + 0.3851, + 0.3912, + 0.393, + 0.3928, + 0.3961, + 0.3907, + 0.3876, + 0.3881, + 0.3875, + 0.3885, + 0.3909, + 0.3893, + 0.394, + 0.3959, + 0.3886, + 0.3945, + 0.3932, + 0.3919, + 0.3906, + 0.3944, + 0.3939, + 0.3946, + 0.3923, + 0.393, + 0.3929, + 0.3923, + 0.3915, + 0.3948, + 0.3934, + 0.3929, + 0.3932, + 0.3936, + 0.394, + 0.3938 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.017680617049336433, + 0.8765696287155151 + ], + "perturbation_rho": [ + -0.00557959359139204, + 0.06313759833574295 + ], + "nudging": { + "0.001": [ + -2.048211172223091e-06, + -3.955443389713764e-06 + ], + "0.003": [ + -6.195507012307644e-06, + -1.213036011904478e-05 + ], + "0.01": [ + -2.056185621768236e-05, + -4.089018329977989e-05 + ] + }, + "hidden_norms_per_layer": [ + 5668.7490234375, + 427742.1875, + 626308.1875 + ], + "bp_grad_norms_per_layer": [ + 2.2485837689600885e-05, + 1.0125075959876995e-06, + 7.618949666721164e-07 + ] + }, + "drift": { + "embed.weight": 43.36126831717888, + "embed.bias": 11.647761057592673, + "blocks.0.ln.weight": 1.7734721493198804, + "blocks.0.w1.weight": 28.788589686086883, + "blocks.0.w1.bias": 16.981347027161885, + "blocks.0.w2.weight": 61.91338151396999, + "blocks.1.ln.weight": 1.2975357664484612, + "blocks.1.w1.weight": 23.055782710684934, + "blocks.1.w1.bias": 17.973225870539384, + "blocks.1.w2.weight": 38.08861834310624, + "out_ln.weight": 0.38876131505924627, + "out_head.weight": 5.716507111968003, + "out_head.bias": 4.553337714995325 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 0 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed0", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
