{ "4": { "dfa": { "log": { "train_loss": [ 2.0741304068756103, 2.052452068710327, 2.0495207961273194, 2.0484457649230956, 2.045468647079468, 2.0459753023529053, 2.0450184237670896, 2.0391295627593995, 2.0377573050689697, 2.0382228170394896, 2.0312761193466184, 2.0324994396591185, 2.0278026767730712, 2.0305476247787477, 2.0286661254119873, 2.029820890045166, 2.0290051824188233, 2.0265300660705567, 2.025750561065674, 2.027355994720459, 2.0275561265563966, 2.023750612411499, 2.025079263343811, 2.025395411605835, 2.0240028636932372, 2.022815622253418, 2.0226645655822755, 2.022443874359131, 2.022390442466736, 2.023733573875427, 2.0224531535339354, 2.0227799210357666, 2.0218398332214353, 2.020151731872559, 2.021256269683838, 2.0194612783432007, 2.018333575744629, 2.0183729624938964, 2.0209142852020263, 2.022426343536377, 2.018248730201721, 2.0204831772613527, 2.0188777527618407, 2.0191313500213623, 2.0171565660858155, 2.0189703364562988, 2.0182820797729493, 2.0170327036285403, 2.0180798105239868, 2.0163722726821898, 2.0178759913635256, 2.017920862388611, 2.015365661468506, 2.0167020557403563, 2.0157576428985595, 2.0196311264801023, 2.0176754986190795, 2.017508302345276, 2.0164641773223875, 2.016444677734375, 2.0168316576385497, 2.0152849128723145, 2.015149051208496, 2.0158757721710203, 2.016044344520569, 2.0154035729217528, 2.012803511734009, 2.0160995071792605, 2.015346680755615, 2.0140808686828615, 2.0151058874893186, 2.0144621922302246, 2.0154705238342285, 2.0149063832092287, 2.0115139068603516, 2.0131744523620605, 2.0158527814483644, 2.0125201052474977, 2.0122518685913087, 2.0132210369873045, 2.0136120219421385, 2.0142880089950563, 2.013032984085083, 2.011840599975586, 2.0118305902862548, 2.012003014450073, 2.011992978248596, 2.0092738487243653, 2.0135212693023683, 2.010035700378418, 2.011592872314453, 2.010264990081787, 2.0128248121643066, 2.0130243259048464, 2.0120003854751585, 2.011955912322998, 2.011813560256958, 2.0142602909851073, 2.0124067852020264, 2.0116278426742555 ], "train_acc": [ 0.23226, 0.2375, 0.23894, 0.2411, 0.24176, 0.24224, 0.24692, 0.24654, 0.24822, 0.24668, 0.25084, 0.24936, 0.2519, 0.24896, 0.25208, 0.25194, 0.2549, 0.25158, 0.25292, 0.25402, 0.25358, 0.2561, 0.25688, 0.25572, 0.25782, 0.25752, 0.2589, 0.25694, 0.2558, 0.25686, 0.25668, 0.259, 0.2579, 0.25902, 0.25906, 0.25856, 0.26018, 0.2611, 0.25834, 0.26182, 0.26058, 0.25944, 0.26134, 0.25952, 0.26058, 0.2594, 0.26156, 0.26526, 0.26156, 0.2652, 0.26178, 0.26122, 0.2618, 0.26384, 0.26214, 0.26386, 0.26256, 0.2644, 0.26262, 0.2629, 0.26074, 0.26266, 0.2634, 0.26182, 0.26266, 0.26396, 0.26654, 0.2633, 0.2613, 0.26562, 0.26356, 0.26384, 0.26406, 0.26388, 0.26606, 0.26592, 0.265, 0.26578, 0.268, 0.2666, 0.26434, 0.2666, 0.26418, 0.26448, 0.26558, 0.2644, 0.26708, 0.26714, 0.2644, 0.2675, 0.26548, 0.26528, 0.26508, 0.26738, 0.26266, 0.2658, 0.26572, 0.26576, 0.26514, 0.2658 ], "test_acc": [ 0.2469, 0.2437, 0.255, 0.2587, 0.2612, 0.2707, 0.2697, 0.2504, 0.279, 0.2707, 0.2664, 0.2693, 0.2715, 0.2832, 0.2849, 0.2633, 0.2682, 0.2874, 0.2852, 0.2671, 0.273, 0.2819, 0.2654, 0.2763, 0.279, 0.2924, 0.281, 0.2755, 0.2706, 0.2758, 0.2812, 0.2801, 0.2847, 0.2684, 0.2679, 0.2819, 0.2548, 0.2726, 0.2794, 0.2838, 0.2834, 0.2788, 0.283, 0.2721, 0.2782, 0.2742, 0.2817, 0.2752, 0.2722, 0.2812, 0.2797, 0.2792, 0.2799, 0.2747, 0.2879, 0.2769, 0.2842, 0.2793, 0.2857, 0.2797, 0.2793, 0.283, 0.2889, 0.2789, 0.2748, 0.2811, 0.2814, 0.2775, 0.282, 0.2787, 0.2862, 0.2861, 0.2788, 0.2763, 0.272, 0.2788, 0.2818, 0.2839, 0.2865, 0.2837, 0.2898, 0.2814, 0.2784, 0.2823, 0.2852, 0.2835, 0.2848, 0.2846, 0.2821, 0.2809, 0.2812, 0.2826, 0.2818, 0.2832, 0.2834, 0.2832, 0.2838, 0.2838, 0.2838, 0.2837 ] }, "diagnostics": { "bp_cosine": [ 0.337674617767334, 0.0006247189012356102, 0.0002945333835668862, -7.626566366525367e-05, -0.00035525468410924077, 4.714205351774581e-05 ], "perturbation_rho": [ 0.005920294672250748, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -3.096647560596466e-07, 0.0, 0.0, 0.0, 9.313225746154785e-10, 0.0 ], "0.003": [ -9.313225746154785e-07, 9.313225746154785e-10, 0.0, 0.0, 9.313225746154785e-10, 0.0 ], "0.01": [ -2.87545844912529e-06, 0.0, 0.0, 9.313225746154785e-10, 9.313225746154785e-10, 0.0 ] }, "hidden_norms_per_layer": [ 58616.81640625, 1590750592.0, 3689531648.0, 5549292544.0, 7886680064.0, 9552689152.0, 9643235328.0 ], "bp_grad_norms_per_layer": [ 1.978580996819801e-07, 1.773336893995392e-10, 1.7791043638304416e-10, 1.7622008019468893e-10, 1.761738255279255e-10, 1.7640035265831244e-10, 1.7640640337379665e-10 ] }, "drift": { "embed.weight": 352.51471697650226, "embed.bias": 269.49001616797665, "blocks.0.ln.weight": 9.43372656624646, "blocks.0.w1.weight": 313.54087904771035, "blocks.0.w1.bias": 290.62855542890503, "blocks.0.w2.weight": 505.8716937587808, "blocks.1.ln.weight": 8.808169542950294, "blocks.1.w1.weight": 358.5357409826361, "blocks.1.w1.bias": 345.5274778587847, "blocks.1.w2.weight": 349.75977929168596, "blocks.2.ln.weight": 9.276124324101515, "blocks.2.w1.weight": 395.6550378108265, "blocks.2.w1.bias": 371.0546436106137, "blocks.2.w2.weight": 375.3367421271525, "blocks.3.ln.weight": 10.24244368106198, "blocks.3.w1.weight": 420.44883795775684, "blocks.3.w1.bias": 397.1721710589656, "blocks.3.w2.weight": 405.8311891944568, "blocks.4.ln.weight": 10.577140914534366, "blocks.4.w1.weight": 436.864273411592, "blocks.4.w1.bias": 406.9723932351042, "blocks.4.w2.weight": 404.6446833274338, "blocks.5.ln.weight": 7.782034028860308, "blocks.5.w1.weight": 310.2471895048895, "blocks.5.w1.bias": 297.2855707982679, "blocks.5.w2.weight": 270.3724536312007, "out_ln.weight": 0.5880164032165464, "out_head.weight": 8.450568347443314, "out_head.bias": 0.7740018910126388 } }, "fa": { "log": { "train_loss": [ 2.038021390991211, 1.9517871558380127, 1.923053580093384, 1.9045403602600097, 1.8952905172729493, 1.8863004998397828, 1.8793055545043946, 1.868332847251892, 1.860797550354004, 1.8578368386077881, 1.8483906720352172, 1.8424116570663451, 1.8290137046051025, 1.8305858782577515, 1.823958169631958, 1.8175954293823242, 1.8124929406356811, 1.8102095357513428, 1.8039513228607178, 1.8015951740264893, 1.7953115439605714, 1.7889242324447632, 1.7881110052871705, 1.7843929150390625, 1.7783852965545655, 1.777275090942383, 1.7724220377349853, 1.7673138269424438, 1.7659701934814453, 1.7594620475006104, 1.753105486755371, 1.7537677935028075, 1.7502301782989502, 1.743755245666504, 1.7426675580596924, 1.7381902320098876, 1.7371277405548096, 1.7380020862197876, 1.7344951665878297, 1.732631077194214, 1.7297903375244141, 1.7305091592025756, 1.72773092628479, 1.7255595262908936, 1.7265567044067383, 1.7226529630279541, 1.7242008368301391, 1.7205993241119384, 1.714460986251831, 1.7183882989501953, 1.7157616848373414, 1.7143050561141968, 1.711619351425171, 1.712949155960083, 1.7116730854797364, 1.7097789264297485, 1.7088176770401, 1.7031783606338502, 1.705644631690979, 1.702429769935608, 1.7007943072891236, 1.6994391622924805, 1.698121346435547, 1.6975506435775758, 1.6984819930648805, 1.6961595495224, 1.6988952493286134, 1.700139475479126, 1.698183412246704, 1.6925607485580445, 1.6942372484970092, 1.695046120262146, 1.6923927303695678, 1.6946959600448608, 1.6924981302261353, 1.688026438217163, 1.6864081888580322, 1.6876143859863282, 1.687906523399353, 1.6851787896347046, 1.6870249395370482, 1.6865479514312745, 1.6857007721710204, 1.686013254776001, 1.685618132247925, 1.6866127777099609, 1.682880577697754, 1.6817467867660523, 1.6864028040695191, 1.683715857887268, 1.6836617621612548, 1.6802171184921264, 1.6822573038101196, 1.6837931204223633, 1.6831412961196899, 1.6796661951065064, 1.682324230041504, 1.6844535943222045, 1.6789856439590454, 1.680855456161499 ], "train_acc": [ 0.2477, 0.28914, 0.30422, 0.30836, 0.31314, 0.31906, 0.3247, 0.32558, 0.33112, 0.33134, 0.33596, 0.33794, 0.34382, 0.34438, 0.3429, 0.3491, 0.34826, 0.351, 0.35252, 0.3536, 0.35608, 0.36104, 0.35948, 0.36006, 0.36364, 0.36444, 0.36608, 0.367, 0.36846, 0.36866, 0.37048, 0.37416, 0.37428, 0.37498, 0.37714, 0.37884, 0.37872, 0.3782, 0.381, 0.38058, 0.3804, 0.38016, 0.38418, 0.38552, 0.38428, 0.3811, 0.38204, 0.38364, 0.38758, 0.38694, 0.38588, 0.38568, 0.388, 0.38704, 0.39158, 0.38884, 0.38912, 0.38936, 0.39034, 0.39182, 0.39316, 0.3944, 0.39182, 0.39272, 0.39394, 0.39482, 0.39348, 0.39242, 0.39554, 0.3963, 0.39508, 0.39252, 0.39634, 0.39332, 0.39612, 0.39644, 0.39648, 0.39668, 0.3985, 0.3995, 0.39528, 0.39904, 0.39988, 0.39688, 0.39954, 0.39648, 0.4014, 0.39972, 0.39808, 0.4019, 0.39968, 0.40222, 0.39884, 0.39954, 0.39804, 0.40034, 0.39982, 0.39856, 0.40168, 0.4006 ], "test_acc": [ 0.2942, 0.311, 0.3308, 0.342, 0.3419, 0.3528, 0.3504, 0.3462, 0.3605, 0.367, 0.3696, 0.3674, 0.3716, 0.3801, 0.3769, 0.3624, 0.3792, 0.3785, 0.3758, 0.3779, 0.3853, 0.3821, 0.3816, 0.3891, 0.3866, 0.3936, 0.3896, 0.3908, 0.397, 0.3971, 0.4013, 0.4023, 0.393, 0.3983, 0.3977, 0.3969, 0.3982, 0.405, 0.4014, 0.4089, 0.4078, 0.3985, 0.4063, 0.4039, 0.4008, 0.4096, 0.4111, 0.4059, 0.4128, 0.4079, 0.4066, 0.4115, 0.407, 0.4156, 0.4156, 0.4208, 0.4164, 0.4206, 0.4124, 0.4186, 0.4142, 0.4123, 0.4105, 0.4153, 0.4198, 0.4192, 0.419, 0.4198, 0.4202, 0.417, 0.4233, 0.4224, 0.4164, 0.4183, 0.4193, 0.4178, 0.4189, 0.4232, 0.4184, 0.4206, 0.4223, 0.4222, 0.417, 0.4199, 0.421, 0.4202, 0.4181, 0.4177, 0.4214, 0.4186, 0.4201, 0.4189, 0.4221, 0.4205, 0.4194, 0.42, 0.4203, 0.4199, 0.4196, 0.4195 ] }, "diagnostics": { "bp_cosine": [ 0.015272621065378189, 0.05551045760512352, 0.03781959414482117, -0.09142173081636429, -0.12766994535923004, 0.9957026839256287 ], "perturbation_rho": [ -0.044239602982997894, 0.018639111891388893, -0.002674652263522148, -0.024060344323515892, -0.007919290103018284, -0.016996072605252266 ], "nudging": { "0.001": [ -2.239597961306572e-06, -6.057089194655418e-07, -1.341104507446289e-07, 1.417938619852066e-07, 1.6426201909780502e-07, -1.8667196854948997e-06 ], "0.003": [ -6.492482498288155e-06, -1.5690457075834274e-06, -4.0302984416484833e-07, 5.105976015329361e-07, 7.660128176212311e-07, -6.384681910276413e-06 ], "0.01": [ -2.1643005311489105e-05, -5.265465006232262e-06, -1.4334218576550484e-06, 2.071727067232132e-06, 2.557528205215931e-06, -2.2026244550943375e-05 ] }, "hidden_norms_per_layer": [ 5698.91357421875, 74089.609375, 464746.75, 571451.9375, 1133723.625, 1542811.875, 774708.375 ], "bp_grad_norms_per_layer": [ 3.8776230212533846e-05, 3.033989969480899e-06, 9.73796886682976e-07, 8.570191312173847e-07, 8.443464594165562e-07, 8.415062779931759e-07, 8.336798487107444e-07 ] }, "drift": { "embed.weight": 39.486431642766554, "embed.bias": 14.997056918535808, "blocks.0.ln.weight": 1.193207647495217, "blocks.0.w1.weight": 15.819034065039398, "blocks.0.w1.bias": 13.818478530432463, "blocks.0.w2.weight": 51.89139321984625, "blocks.1.ln.weight": 1.0430825935788601, "blocks.1.w1.weight": 19.906462986471904, "blocks.1.w1.bias": 13.39027258705086, "blocks.1.w2.weight": 46.62053425901664, "blocks.2.ln.weight": 0.7864666972877575, "blocks.2.w1.weight": 18.270196046735624, "blocks.2.w1.bias": 12.944067249835973, "blocks.2.w2.weight": 49.53460850460699, "blocks.3.ln.weight": 0.64141877927046, "blocks.3.w1.weight": 20.764880942811217, "blocks.3.w1.bias": 20.679665524082093, "blocks.3.w2.weight": 25.665386885036355, "blocks.4.ln.weight": 0.5680829244316266, "blocks.4.w1.weight": 20.078876458586997, "blocks.4.w1.bias": 21.20100063860491, "blocks.4.w2.weight": 30.60469406190784, "blocks.5.ln.weight": 0.6546824348706847, "blocks.5.w1.weight": 18.8873912461224, "blocks.5.w1.bias": 18.79210459184489, "blocks.5.w2.weight": 45.45712755218628, "out_ln.weight": 0.3591377698736513, "out_head.weight": 6.323626106875271, "out_head.bias": 0.8856670357666573 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 6, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 4 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L6_seed4", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }