{ "2": { "dfa": { "log": { "train_loss": [ 2.058412809791565, 2.0388552247619627, 2.0358241034317017, 2.027553281555176, 2.030367368774414, 2.027717582397461, 2.023588889923096, 2.022263825721741, 2.0241731433105468, 2.0235239835357666, 2.023893345298767, 2.0222612105560303, 2.028809658164978, 2.023522481994629, 2.023535331993103, 2.022634300880432, 2.0261124728393556, 2.027209746055603, 2.024631557235718, 2.0272511472320556, 2.0248798042297365, 2.0252146803283693, 2.021958327026367, 2.0255450409317017, 2.0234208207702635, 2.0240782318496704, 2.0233148418807985, 2.022000389137268, 2.024022118911743, 2.023005671234131, 2.0231490325927735, 2.024285191497803, 2.0222519898986815, 2.023439755783081, 2.023540186843872, 2.0246322383117676, 2.0237508728027342, 2.024476735076904, 2.0262484502410887, 2.0244761968612672, 2.023149300994873, 2.0230725455093386, 2.0237448512268066, 2.0239054921722412, 2.0238359395980834, 2.0231575259399412, 2.022854585723877, 2.022712833328247, 2.022943268432617, 2.023613681335449, 2.022585965042114, 2.0229795806503295, 2.0224396421051027, 2.024438477630615, 2.0226136851501466, 2.0218412887191772, 2.020350592918396, 2.021553417892456, 2.0207389210510254, 2.022400696411133, 2.0226713175201416, 2.0205454586029052, 2.022753714904785, 2.0204339378356932, 2.0214138391113283, 2.019458531036377, 2.018622496871948, 2.0211455561828613, 2.020830050392151, 2.0200049672698976, 2.0226647985839845, 2.020451495361328, 2.0213021927642822, 2.018636092834473, 2.0201395918273928, 2.0197924830627443, 2.0189465530395507, 2.0179246043395995, 2.0190702261352538, 2.018002661895752, 2.0188750094604493, 2.0186908027648927, 2.018660167617798, 2.016986283912659, 2.016896242828369, 2.0198894203948976, 2.0182291090393067, 2.0168725957870484, 2.0189685047912596, 2.0170926274108885, 2.0171643753814696, 2.0170515134429934, 2.017839207763672, 2.0162586155700684, 2.016942921524048, 2.0172505876159668, 2.016627454185486, 2.01472389213562, 2.016936295089722, 2.0162249319458008 ], "train_acc": [ 0.24042, 0.24948, 0.25212, 0.25448, 0.25656, 0.25446, 0.26134, 0.2625, 0.25946, 0.26152, 0.26086, 0.26258, 0.2591, 0.25878, 0.25972, 0.2621, 0.26092, 0.25914, 0.25866, 0.25816, 0.26052, 0.25714, 0.26258, 0.25996, 0.26152, 0.2614, 0.2641, 0.26338, 0.26254, 0.26234, 0.26476, 0.26218, 0.2652, 0.26612, 0.2645, 0.26434, 0.26412, 0.26428, 0.26476, 0.26552, 0.26592, 0.2645, 0.26798, 0.26322, 0.26514, 0.2651, 0.26806, 0.26828, 0.26474, 0.26502, 0.26398, 0.26496, 0.26396, 0.265, 0.26866, 0.26958, 0.2685, 0.26846, 0.26926, 0.27102, 0.26792, 0.26856, 0.26608, 0.26824, 0.27114, 0.26984, 0.2685, 0.26856, 0.26812, 0.26898, 0.26946, 0.26888, 0.26992, 0.2687, 0.2679, 0.2708, 0.26838, 0.27112, 0.27018, 0.26964, 0.27128, 0.27114, 0.27024, 0.27024, 0.27036, 0.271, 0.27062, 0.27166, 0.27026, 0.27294, 0.2727, 0.27276, 0.27036, 0.27272, 0.26992, 0.26996, 0.2709, 0.27316, 0.2732, 0.27336 ], "test_acc": [ 0.278, 0.2738, 0.2583, 0.2773, 0.2658, 0.2783, 0.2681, 0.2957, 0.2671, 0.2647, 0.287, 0.2846, 0.284, 0.287, 0.2724, 0.2925, 0.2763, 0.2711, 0.2614, 0.277, 0.2817, 0.2791, 0.2834, 0.2821, 0.2641, 0.2764, 0.2963, 0.2882, 0.3005, 0.2923, 0.2579, 0.2889, 0.2999, 0.2958, 0.2739, 0.2984, 0.286, 0.2643, 0.2829, 0.2919, 0.292, 0.2875, 0.2932, 0.2778, 0.2753, 0.291, 0.2955, 0.3014, 0.2887, 0.2856, 0.2937, 0.2946, 0.298, 0.2932, 0.3005, 0.2989, 0.2924, 0.2977, 0.2922, 0.2876, 0.2943, 0.2844, 0.3003, 0.2952, 0.2881, 0.2821, 0.2934, 0.28, 0.2958, 0.2933, 0.2923, 0.2941, 0.2872, 0.2946, 0.2966, 0.2962, 0.2915, 0.2969, 0.2988, 0.2968, 0.2991, 0.2972, 0.297, 0.2955, 0.2973, 0.2994, 0.2959, 0.2962, 0.3, 0.2971, 0.2977, 0.2962, 0.2963, 0.2955, 0.2959, 0.2964, 0.2962, 0.2963, 0.2968, 0.2968 ] }, "diagnostics": { "bp_cosine": [ 0.3571905195713043, -2.4819419195409864e-05 ], "perturbation_rho": [ -0.020394116640090942, 0.0 ], "nudging": { "0.001": [ -3.2084062695503235e-07, 0.0 ], "0.003": [ -8.596107363700867e-07, 0.0 ], "0.01": [ -2.905726432800293e-06, 0.0 ] }, "hidden_norms_per_layer": [ 53198.71875, 2227773184.0, 5250976256.0 ], "bp_grad_norms_per_layer": [ 2.0440073456029495e-07, 3.7151820508896094e-10, 3.7148767395578375e-10 ] }, "drift": { "embed.weight": 342.0501862953785, "embed.bias": 318.0357815319326, "blocks.0.ln.weight": 9.910735164962347, "blocks.0.w1.weight": 324.42259888737226, "blocks.0.w1.bias": 352.6779805020607, "blocks.0.w2.weight": 492.2710513712036, "blocks.1.ln.weight": 9.723967303148715, "blocks.1.w1.weight": 403.31369239097415, "blocks.1.w1.bias": 386.0984329662907, "blocks.1.w2.weight": 397.9343379416526, "out_ln.weight": 0.5056100406607513, "out_head.weight": 8.24905668320801, "out_head.bias": 2.0933992602399067 } }, "fa": { "log": { "train_loss": [ 2.063060122451782, 1.9739086376571655, 1.9282753707504272, 1.8921499670410156, 1.8799907299804688, 1.8701481190490723, 1.8541997326660156, 1.8432505453109742, 1.8392359512710572, 1.8295656701278686, 1.8286965405273437, 1.8275740008163452, 1.82835955909729, 1.8276023639297485, 1.8295053287506104, 1.8279134408569335, 1.8347502783966065, 1.8358594959259034, 1.832546812095642, 1.8375971967315674, 1.8337256093978882, 1.8388268453598022, 1.8368015246200562, 1.8367653689956664, 1.837699118347168, 1.8374284832763672, 1.8332337552642821, 1.8305227688217163, 1.8352981665802002, 1.8384290933227538, 1.8319619774627685, 1.8331132510375976, 1.8284437879180908, 1.8323823754882813, 1.8337605920791626, 1.8296470736312866, 1.824372737045288, 1.8253158220672607, 1.8254631029891968, 1.8240845959472656, 1.819489220275879, 1.8196685235214234, 1.8173167004013062, 1.8210680514526367, 1.812099649734497, 1.8139883127212524, 1.810353461265564, 1.8109969634246825, 1.808874561843872, 1.8115904225158692, 1.8089021768188476, 1.8070925519561767, 1.807039188232422, 1.8048222934341431, 1.8031300540924071, 1.8039923257446289, 1.8042795065307617, 1.8037835544586183, 1.8002930462646485, 1.8007701531982423, 1.8004488678359984, 1.8029598141098022, 1.8020868547821045, 1.7990351900482178, 1.8022524103546143, 1.7987030548477172, 1.7969628913116455, 1.7972235089874267, 1.7918564282226563, 1.7940529309082032, 1.7972945267105103, 1.7940796615219117, 1.7942549993133545, 1.7947112902450562, 1.7927878363037109, 1.7915658866119384, 1.7944716805267333, 1.790445680809021, 1.7891779144668578, 1.789405579185486, 1.7867662616729736, 1.7887766037368775, 1.7875445496368407, 1.7851270193862916, 1.7886884448623657, 1.786267046775818, 1.785640559425354, 1.7853610308074952, 1.7856942657470702, 1.7871524771499634, 1.7883876535797119, 1.782026519203186, 1.786798097305298, 1.7790444551849365, 1.7840377599334716, 1.787256519126892, 1.7822379702758788, 1.7822947565460205, 1.7829025159072875, 1.7819519442749023 ], "train_acc": [ 0.24228, 0.28314, 0.30214, 0.31828, 0.32302, 0.3277, 0.33338, 0.33888, 0.34066, 0.34536, 0.34814, 0.34648, 0.34716, 0.34526, 0.3462, 0.3422, 0.343, 0.34162, 0.3438, 0.34388, 0.34354, 0.33854, 0.34312, 0.34176, 0.34514, 0.34304, 0.34458, 0.34162, 0.34348, 0.34098, 0.34374, 0.34488, 0.34328, 0.34504, 0.34414, 0.34548, 0.34552, 0.34848, 0.34836, 0.34802, 0.34918, 0.346, 0.34986, 0.3473, 0.3515, 0.3527, 0.3532, 0.35212, 0.35068, 0.34998, 0.3505, 0.3565, 0.35392, 0.35556, 0.35556, 0.35462, 0.3548, 0.35674, 0.35552, 0.35848, 0.35704, 0.35594, 0.35598, 0.35716, 0.35818, 0.35842, 0.35966, 0.35968, 0.36022, 0.36082, 0.3571, 0.3612, 0.3604, 0.3607, 0.3602, 0.36134, 0.35734, 0.36262, 0.36352, 0.35916, 0.36462, 0.3617, 0.3608, 0.3617, 0.36106, 0.36262, 0.36296, 0.36354, 0.36138, 0.36132, 0.36446, 0.36452, 0.36388, 0.3645, 0.36378, 0.36342, 0.36496, 0.36556, 0.36274, 0.36546 ], "test_acc": [ 0.2954, 0.3137, 0.3295, 0.3474, 0.3551, 0.3544, 0.3515, 0.3694, 0.3633, 0.3479, 0.3744, 0.3726, 0.371, 0.3618, 0.3649, 0.3685, 0.3658, 0.3704, 0.3504, 0.3729, 0.3578, 0.3685, 0.3676, 0.3643, 0.3562, 0.3486, 0.3732, 0.3624, 0.3693, 0.341, 0.3467, 0.3544, 0.3679, 0.3526, 0.3593, 0.3647, 0.3604, 0.3662, 0.3632, 0.3644, 0.3628, 0.3598, 0.3564, 0.3633, 0.3531, 0.3607, 0.3616, 0.3636, 0.3514, 0.3488, 0.3408, 0.3522, 0.3651, 0.3408, 0.3548, 0.3504, 0.3469, 0.3507, 0.3515, 0.3434, 0.3548, 0.351, 0.351, 0.3545, 0.3487, 0.3467, 0.3492, 0.3439, 0.346, 0.3357, 0.332, 0.3387, 0.3546, 0.3415, 0.3458, 0.3451, 0.3477, 0.342, 0.3446, 0.3427, 0.3426, 0.3423, 0.3481, 0.3467, 0.3443, 0.3437, 0.3466, 0.3459, 0.3448, 0.3458, 0.3433, 0.3461, 0.3479, 0.3447, 0.3452, 0.3467, 0.3461, 0.3467, 0.3464, 0.3464 ] }, "diagnostics": { "bp_cosine": [ 0.01565447635948658, 0.9284564256668091 ], "perturbation_rho": [ 0.08889118582010269, 0.1751367598772049 ], "nudging": { "0.001": [ -8.567003533244133e-07, -7.14592169970274e-06 ], "0.003": [ -2.5028130039572716e-06, -2.1490384824573994e-05 ], "0.01": [ -8.566654287278652e-06, -7.176969666033983e-05 ] }, "hidden_norms_per_layer": [ 5015.7705078125, 205831.875, 281989.59375 ], "bp_grad_norms_per_layer": [ 1.882538890640717e-05, 8.274267884189612e-07, 8.043497246035258e-07 ] }, "drift": { "embed.weight": 31.381319271594045, "embed.bias": 16.70881646410694, "blocks.0.ln.weight": 1.5550725713952875, "blocks.0.w1.weight": 29.555012389084762, "blocks.0.w1.bias": 17.153011809958922, "blocks.0.w2.weight": 62.82184507015774, "blocks.1.ln.weight": 1.2734634249220895, "blocks.1.w1.weight": 21.575349693350912, "blocks.1.w1.bias": 10.895115401942027, "blocks.1.w2.weight": 35.67159460439069, "out_ln.weight": 0.4183849023916904, "out_head.weight": 4.1274562698411295, "out_head.bias": 12.873937810986282 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 2 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L2_seed2", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }