diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed9/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed9/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed9/results_cifar10.json b/results/fa_dfa_d512_L2_seed9/results_cifar10.json new file mode 100644 index 0000000..f8f63d4 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed9/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "9": { + "dfa": { + "log": { + "train_loss": [ + 2.0386180068206787, + 2.0063905084228515, + 2.0115847008895873, + 2.0072783072662355, + 2.0072200788116454, + 2.007624338607788, + 2.004089120826721, + 2.004089771194458, + 1.9991737648010255, + 1.9998447619247437, + 1.9991543921661377, + 2.0006776647186277, + 1.9984499712371826, + 1.9943631922149658, + 1.994661587486267, + 1.993870899658203, + 1.9933709629821776, + 1.9952729042816162, + 1.9926185557556153, + 1.9912919250488281, + 1.9926570781707764, + 1.9911886741638183, + 1.9924334022521972, + 1.9887267460632325, + 1.9918579584121705, + 1.990792886352539, + 1.9901814585113526, + 1.9899697443008424, + 1.989364903640747, + 1.9860043600463868, + 1.9868051830291749, + 1.9893270887756347, + 1.9876267849349976, + 1.9893067332458496, + 1.9857772846221924, + 1.9837282821655273, + 1.9841915615081787, + 1.9825071751403809, + 1.9810244177246095, + 1.9853471765136719, + 1.9825159663391114, + 1.9842312357330323, + 1.9828273846817017, + 1.9831989236450196, + 1.9810442190551758, + 1.9819502600479126, + 1.981037528152466, + 1.9779154906845093, + 1.9809581425476075, + 1.9797189464569092, + 1.9827272113037109, + 1.9808893032073975, + 1.9813728839111329, + 1.9781295204925538, + 1.9786987835311889, + 1.9786434796905517, + 1.9790834701919555, + 1.9781043656921387, + 1.9786688150024414, + 1.9782110293579103, + 1.9773203885269166, + 1.9758285034942626, + 1.977617745285034, + 1.97553291305542, + 1.975182448425293, + 1.9747401064682006, + 1.9758236003875733, + 1.9758562586212158, + 1.9762433794403076, + 1.9765984790420532, + 1.9761512882232666, + 1.9743927758407593, + 1.9739378618621826, + 1.9728027178192138, + 1.9720366858673095, + 1.9760308059692382, + 1.9740920357513427, + 1.9741222943115235, + 1.9719459004974365, + 1.9733767440032959, + 1.9732320972061157, + 1.9731594284057616, + 1.9734650510025025, + 1.9740613651275636, + 1.970825253868103, + 1.97225927734375, + 1.9708090161132812, + 1.972899548110962, + 1.9718735347747802, + 1.9716896154785157, + 1.9735381398010254, + 1.970859426651001, + 1.970537699661255, + 1.9716636752700805, + 1.971408115081787, + 1.97217986328125, + 1.9708149477767944, + 1.9725973287582397, + 1.970340883255005, + 1.970512617111206 + ], + "train_acc": [ + 0.2506, + 0.26582, + 0.26488, + 0.26812, + 0.2673, + 0.26874, + 0.26924, + 0.27152, + 0.2706, + 0.2732, + 0.27076, + 0.26982, + 0.27112, + 0.27538, + 0.27152, + 0.27576, + 0.27424, + 0.2737, + 0.27522, + 0.27654, + 0.27548, + 0.27776, + 0.27694, + 0.27644, + 0.2755, + 0.27554, + 0.27802, + 0.2774, + 0.2763, + 0.27872, + 0.27982, + 0.27564, + 0.27854, + 0.27758, + 0.27964, + 0.28212, + 0.28362, + 0.28318, + 0.28196, + 0.28094, + 0.28112, + 0.28024, + 0.28322, + 0.28244, + 0.28272, + 0.28128, + 0.28152, + 0.28524, + 0.28126, + 0.28276, + 0.28214, + 0.28506, + 0.2806, + 0.28196, + 0.2851, + 0.2821, + 0.28354, + 0.28526, + 0.28296, + 0.28452, + 0.28764, + 0.28686, + 0.28512, + 0.28712, + 0.28588, + 0.28462, + 0.28596, + 0.2847, + 0.28546, + 0.2833, + 0.2868, + 0.28714, + 0.285, + 0.2887, + 0.28604, + 0.28332, + 0.28698, + 0.28862, + 0.2851, + 0.2889, + 0.29026, + 0.28762, + 0.28606, + 0.2889, + 0.28878, + 0.29028, + 0.2883, + 0.28902, + 0.2895, + 0.28942, + 0.29002, + 0.29058, + 0.28932, + 0.28564, + 0.286, + 0.28974, + 0.28982, + 0.28878, + 0.2885, + 0.2891 + ], + "test_acc": [ + 0.2683, + 0.295, + 0.2917, + 0.2896, + 0.2953, + 0.2912, + 0.311, + 0.2938, + 0.2849, + 0.2891, + 0.2916, + 0.3049, + 0.3017, + 0.3203, + 0.3102, + 0.2822, + 0.286, + 0.3035, + 0.3098, + 0.3009, + 0.3053, + 0.3044, + 0.302, + 0.2901, + 0.3166, + 0.3038, + 0.2909, + 0.2941, + 0.3023, + 0.2937, + 0.3143, + 0.2817, + 0.289, + 0.3074, + 0.3052, + 0.3025, + 0.3089, + 0.3155, + 0.3068, + 0.3125, + 0.3145, + 0.3012, + 0.3152, + 0.315, + 0.3013, + 0.3054, + 0.3112, + 0.2904, + 0.3169, + 0.2959, + 0.3056, + 0.3098, + 0.3101, + 0.3139, + 0.309, + 0.2991, + 0.3182, + 0.3204, + 0.2996, + 0.3108, + 0.3082, + 0.3162, + 0.3227, + 0.3027, + 0.3098, + 0.2966, + 0.309, + 0.3138, + 0.3095, + 0.302, + 0.3007, + 0.3096, + 0.3111, + 0.3052, + 0.3121, + 0.3254, + 0.3128, + 0.3127, + 0.3042, + 0.3189, + 0.3148, + 0.3064, + 0.3145, + 0.3172, + 0.3148, + 0.3157, + 0.3164, + 0.3148, + 0.3139, + 0.3147, + 0.315, + 0.3137, + 0.3139, + 0.3151, + 0.3161, + 0.3159, + 0.3157, + 0.3154, + 0.3157, + 0.3156 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4173116087913513, + -0.0009379963739775121 + ], + "perturbation_rho": [ + 0.029962807893753052, + 0.0 + ], + "nudging": { + "0.001": [ + -5.238689482212067e-07, + 0.0 + ], + "0.003": [ + -1.4784745872020721e-06, + 1.862645149230957e-09 + ], + "0.01": [ + -4.835892468690872e-06, + -4.6566128730773926e-09 + ] + }, + "hidden_norms_per_layer": [ + 52101.48828125, + 755819456.0, + 2329725696.0 + ], + "bp_grad_norms_per_layer": [ + 3.256158436215628e-07, + 4.5803447146219867e-10, + 4.584113644234833e-10 + ] + }, + "drift": { + "embed.weight": 314.4915524892561, + "embed.bias": 242.71554547665664, + "blocks.0.ln.weight": 9.316701961843108, + "blocks.0.w1.weight": 260.9170515894993, + "blocks.0.w1.bias": 217.2580939372968, + "blocks.0.w2.weight": 445.91774813193825, + "blocks.1.ln.weight": 8.403039866788982, + "blocks.1.w1.weight": 293.10409601703697, + "blocks.1.w1.bias": 296.0137857555933, + "blocks.1.w2.weight": 322.56673718802114, + "out_ln.weight": 0.438240662386626, + "out_head.weight": 7.216506109788919, + "out_head.bias": 4.092364299645094 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.059632821121216, + 1.969141392288208, + 1.9324101000595093, + 1.8976149897003174, + 1.8789895468902589, + 1.8676787176513672, + 1.86150774559021, + 1.8536200240707397, + 1.8464182161712646, + 1.843310608215332, + 1.8476687601470947, + 1.8471106829452515, + 1.8417246197128296, + 1.838934436569214, + 1.8480940073013306, + 1.841720523109436, + 1.8359926760482788, + 1.8341460582733153, + 1.8318497580718993, + 1.8298718184661866, + 1.8337750116729736, + 1.8297588416290282, + 1.8286794381332399, + 1.8261895336532592, + 1.8255341546630859, + 1.8234506717300416, + 1.8259339986801149, + 1.821055384902954, + 1.8205125164794922, + 1.8167257778549195, + 1.8076189421081543, + 1.8187879995727538, + 1.8171783072662353, + 1.8175717837524414, + 1.8142739019775391, + 1.8160600145721435, + 1.8160681335449218, + 1.8097417612075806, + 1.8152825867080689, + 1.8145546726226807, + 1.814115087852478, + 1.8139980951690673, + 1.8110767394256593, + 1.8108615531158447, + 1.8082058542633057, + 1.806761900253296, + 1.8031038238143922, + 1.8006043545150756, + 1.8022277898406982, + 1.8031743975067138, + 1.8007837707138061, + 1.8021138620758057, + 1.8031328768920898, + 1.7993617374038697, + 1.7992449984359742, + 1.7986480782699585, + 1.7985403269195557, + 1.7962297436141967, + 1.7968010370254517, + 1.795757841835022, + 1.7965225546646117, + 1.7958138821792602, + 1.7978459465789796, + 1.795165989151001, + 1.79601362575531, + 1.7981088857269287, + 1.7986928964233397, + 1.796389625015259, + 1.7948159000015258, + 1.795204453163147, + 1.7975346917724608, + 1.7945230379486083, + 1.794725383377075, + 1.7934243726348877, + 1.7920495998382568, + 1.7969142938995362, + 1.7927454508209228, + 1.7913766479110718, + 1.792234444503784, + 1.7971493310928344, + 1.7925569116210938, + 1.794579433517456, + 1.7918265099716186, + 1.7970994007110597, + 1.7937700403213501, + 1.79378436958313, + 1.7918543418121338, + 1.7927718152618408, + 1.792527283859253, + 1.7904213320922853, + 1.791894981842041, + 1.7942055084228516, + 1.7854851037597657, + 1.7892465375518798, + 1.7894356133651734, + 1.792232000427246, + 1.7908443558120728, + 1.7891317191314697, + 1.7882942892456055, + 1.7879403518295287 + ], + "train_acc": [ + 0.24674, + 0.28878, + 0.30256, + 0.31774, + 0.32412, + 0.32786, + 0.33236, + 0.33536, + 0.33926, + 0.34026, + 0.33958, + 0.33756, + 0.34346, + 0.34348, + 0.33962, + 0.34076, + 0.34474, + 0.34456, + 0.34354, + 0.34714, + 0.3452, + 0.347, + 0.34758, + 0.34994, + 0.34704, + 0.34678, + 0.34878, + 0.35086, + 0.3489, + 0.35086, + 0.354, + 0.35062, + 0.35238, + 0.35012, + 0.35416, + 0.3535, + 0.35234, + 0.3533, + 0.35412, + 0.35204, + 0.35228, + 0.35076, + 0.35398, + 0.35318, + 0.35272, + 0.3529, + 0.3562, + 0.35708, + 0.35474, + 0.35498, + 0.35806, + 0.35614, + 0.3567, + 0.359, + 0.35654, + 0.3578, + 0.35942, + 0.35754, + 0.36092, + 0.35994, + 0.36174, + 0.36086, + 0.36242, + 0.36584, + 0.36354, + 0.36262, + 0.3625, + 0.35902, + 0.36222, + 0.36288, + 0.36128, + 0.36226, + 0.36288, + 0.36458, + 0.36242, + 0.36178, + 0.3654, + 0.36442, + 0.3654, + 0.36446, + 0.36594, + 0.36486, + 0.36312, + 0.36548, + 0.36586, + 0.3661, + 0.36682, + 0.36846, + 0.3665, + 0.36726, + 0.3648, + 0.36732, + 0.36906, + 0.36904, + 0.36968, + 0.36782, + 0.3685, + 0.36574, + 0.36768, + 0.36662 + ], + "test_acc": [ + 0.2753, + 0.3239, + 0.3396, + 0.3381, + 0.3497, + 0.3518, + 0.3631, + 0.3416, + 0.3506, + 0.3507, + 0.3488, + 0.3577, + 0.3492, + 0.3608, + 0.3625, + 0.3672, + 0.3648, + 0.373, + 0.3637, + 0.3675, + 0.3612, + 0.3701, + 0.3614, + 0.3567, + 0.3695, + 0.3672, + 0.3684, + 0.3628, + 0.3779, + 0.3671, + 0.3748, + 0.3768, + 0.3622, + 0.3679, + 0.3684, + 0.3674, + 0.365, + 0.365, + 0.3596, + 0.3633, + 0.3614, + 0.3725, + 0.3516, + 0.3689, + 0.3514, + 0.356, + 0.3549, + 0.3407, + 0.3627, + 0.3489, + 0.3519, + 0.3524, + 0.3578, + 0.3532, + 0.3396, + 0.3532, + 0.3527, + 0.3599, + 0.3532, + 0.3571, + 0.3569, + 0.3491, + 0.3603, + 0.3561, + 0.3594, + 0.3522, + 0.3517, + 0.3523, + 0.3618, + 0.3583, + 0.3522, + 0.3556, + 0.3617, + 0.3617, + 0.362, + 0.3692, + 0.3621, + 0.3631, + 0.3579, + 0.3653, + 0.3655, + 0.3626, + 0.3669, + 0.3689, + 0.3658, + 0.3664, + 0.3649, + 0.3635, + 0.3656, + 0.3676, + 0.3651, + 0.3669, + 0.3663, + 0.3669, + 0.3663, + 0.3667, + 0.3665, + 0.3667, + 0.3662, + 0.3661 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.005262219812721014, + 0.9548712968826294 + ], + "perturbation_rho": [ + 0.014450715854763985, + 0.06202582269906998 + ], + "nudging": { + "0.001": [ + 1.9065337255597115e-06, + -7.555587217211723e-06 + ], + "0.003": [ + 5.672394763678312e-06, + -2.293300349265337e-05 + ], + "0.01": [ + 1.8914113752543926e-05, + -7.650378393009305e-05 + ] + }, + "hidden_norms_per_layer": [ + 4985.0673828125, + 267249.8125, + 166942.46875 + ], + "bp_grad_norms_per_layer": [ + 2.8030346584273502e-05, + 1.5286594816643628e-06, + 1.4554038898495492e-06 + ] + }, + "drift": { + "embed.weight": 30.89122351236108, + "embed.bias": 29.388918157004504, + "blocks.0.ln.weight": 1.5688009803019956, + "blocks.0.w1.weight": 22.80179549488676, + "blocks.0.w1.bias": 19.927274930467597, + "blocks.0.w2.weight": 66.38185851388366, + "blocks.1.ln.weight": 1.1343783166936168, + "blocks.1.w1.weight": 17.613374844897635, + "blocks.1.w1.bias": 9.480317921179704, + "blocks.1.w2.weight": 41.63261375754297, + "out_ln.weight": 0.4189237920059734, + "out_head.weight": 4.914939575481723, + "out_head.bias": 17.20838803283335 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 9 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed9", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
