summaryrefslogtreecommitdiff
path: root/results/fa_dfa_d512_L2_seed2/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_dfa_d512_L2_seed2/results_cifar10.json')
-rw-r--r--results/fa_dfa_d512_L2_seed2/results_cifar10.json749
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed2/results_cifar10.json b/results/fa_dfa_d512_L2_seed2/results_cifar10.json
new file mode 100644
index 0000000..35785f5
--- /dev/null
+++ b/results/fa_dfa_d512_L2_seed2/results_cifar10.json
@@ -0,0 +1,749 @@
+{
+ "2": {
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.058412809791565,
+ 2.0388552247619627,
+ 2.0358241034317017,
+ 2.027553281555176,
+ 2.030367368774414,
+ 2.027717582397461,
+ 2.023588889923096,
+ 2.022263825721741,
+ 2.0241731433105468,
+ 2.0235239835357666,
+ 2.023893345298767,
+ 2.0222612105560303,
+ 2.028809658164978,
+ 2.023522481994629,
+ 2.023535331993103,
+ 2.022634300880432,
+ 2.0261124728393556,
+ 2.027209746055603,
+ 2.024631557235718,
+ 2.0272511472320556,
+ 2.0248798042297365,
+ 2.0252146803283693,
+ 2.021958327026367,
+ 2.0255450409317017,
+ 2.0234208207702635,
+ 2.0240782318496704,
+ 2.0233148418807985,
+ 2.022000389137268,
+ 2.024022118911743,
+ 2.023005671234131,
+ 2.0231490325927735,
+ 2.024285191497803,
+ 2.0222519898986815,
+ 2.023439755783081,
+ 2.023540186843872,
+ 2.0246322383117676,
+ 2.0237508728027342,
+ 2.024476735076904,
+ 2.0262484502410887,
+ 2.0244761968612672,
+ 2.023149300994873,
+ 2.0230725455093386,
+ 2.0237448512268066,
+ 2.0239054921722412,
+ 2.0238359395980834,
+ 2.0231575259399412,
+ 2.022854585723877,
+ 2.022712833328247,
+ 2.022943268432617,
+ 2.023613681335449,
+ 2.022585965042114,
+ 2.0229795806503295,
+ 2.0224396421051027,
+ 2.024438477630615,
+ 2.0226136851501466,
+ 2.0218412887191772,
+ 2.020350592918396,
+ 2.021553417892456,
+ 2.0207389210510254,
+ 2.022400696411133,
+ 2.0226713175201416,
+ 2.0205454586029052,
+ 2.022753714904785,
+ 2.0204339378356932,
+ 2.0214138391113283,
+ 2.019458531036377,
+ 2.018622496871948,
+ 2.0211455561828613,
+ 2.020830050392151,
+ 2.0200049672698976,
+ 2.0226647985839845,
+ 2.020451495361328,
+ 2.0213021927642822,
+ 2.018636092834473,
+ 2.0201395918273928,
+ 2.0197924830627443,
+ 2.0189465530395507,
+ 2.0179246043395995,
+ 2.0190702261352538,
+ 2.018002661895752,
+ 2.0188750094604493,
+ 2.0186908027648927,
+ 2.018660167617798,
+ 2.016986283912659,
+ 2.016896242828369,
+ 2.0198894203948976,
+ 2.0182291090393067,
+ 2.0168725957870484,
+ 2.0189685047912596,
+ 2.0170926274108885,
+ 2.0171643753814696,
+ 2.0170515134429934,
+ 2.017839207763672,
+ 2.0162586155700684,
+ 2.016942921524048,
+ 2.0172505876159668,
+ 2.016627454185486,
+ 2.01472389213562,
+ 2.016936295089722,
+ 2.0162249319458008
+ ],
+ "train_acc": [
+ 0.24042,
+ 0.24948,
+ 0.25212,
+ 0.25448,
+ 0.25656,
+ 0.25446,
+ 0.26134,
+ 0.2625,
+ 0.25946,
+ 0.26152,
+ 0.26086,
+ 0.26258,
+ 0.2591,
+ 0.25878,
+ 0.25972,
+ 0.2621,
+ 0.26092,
+ 0.25914,
+ 0.25866,
+ 0.25816,
+ 0.26052,
+ 0.25714,
+ 0.26258,
+ 0.25996,
+ 0.26152,
+ 0.2614,
+ 0.2641,
+ 0.26338,
+ 0.26254,
+ 0.26234,
+ 0.26476,
+ 0.26218,
+ 0.2652,
+ 0.26612,
+ 0.2645,
+ 0.26434,
+ 0.26412,
+ 0.26428,
+ 0.26476,
+ 0.26552,
+ 0.26592,
+ 0.2645,
+ 0.26798,
+ 0.26322,
+ 0.26514,
+ 0.2651,
+ 0.26806,
+ 0.26828,
+ 0.26474,
+ 0.26502,
+ 0.26398,
+ 0.26496,
+ 0.26396,
+ 0.265,
+ 0.26866,
+ 0.26958,
+ 0.2685,
+ 0.26846,
+ 0.26926,
+ 0.27102,
+ 0.26792,
+ 0.26856,
+ 0.26608,
+ 0.26824,
+ 0.27114,
+ 0.26984,
+ 0.2685,
+ 0.26856,
+ 0.26812,
+ 0.26898,
+ 0.26946,
+ 0.26888,
+ 0.26992,
+ 0.2687,
+ 0.2679,
+ 0.2708,
+ 0.26838,
+ 0.27112,
+ 0.27018,
+ 0.26964,
+ 0.27128,
+ 0.27114,
+ 0.27024,
+ 0.27024,
+ 0.27036,
+ 0.271,
+ 0.27062,
+ 0.27166,
+ 0.27026,
+ 0.27294,
+ 0.2727,
+ 0.27276,
+ 0.27036,
+ 0.27272,
+ 0.26992,
+ 0.26996,
+ 0.2709,
+ 0.27316,
+ 0.2732,
+ 0.27336
+ ],
+ "test_acc": [
+ 0.278,
+ 0.2738,
+ 0.2583,
+ 0.2773,
+ 0.2658,
+ 0.2783,
+ 0.2681,
+ 0.2957,
+ 0.2671,
+ 0.2647,
+ 0.287,
+ 0.2846,
+ 0.284,
+ 0.287,
+ 0.2724,
+ 0.2925,
+ 0.2763,
+ 0.2711,
+ 0.2614,
+ 0.277,
+ 0.2817,
+ 0.2791,
+ 0.2834,
+ 0.2821,
+ 0.2641,
+ 0.2764,
+ 0.2963,
+ 0.2882,
+ 0.3005,
+ 0.2923,
+ 0.2579,
+ 0.2889,
+ 0.2999,
+ 0.2958,
+ 0.2739,
+ 0.2984,
+ 0.286,
+ 0.2643,
+ 0.2829,
+ 0.2919,
+ 0.292,
+ 0.2875,
+ 0.2932,
+ 0.2778,
+ 0.2753,
+ 0.291,
+ 0.2955,
+ 0.3014,
+ 0.2887,
+ 0.2856,
+ 0.2937,
+ 0.2946,
+ 0.298,
+ 0.2932,
+ 0.3005,
+ 0.2989,
+ 0.2924,
+ 0.2977,
+ 0.2922,
+ 0.2876,
+ 0.2943,
+ 0.2844,
+ 0.3003,
+ 0.2952,
+ 0.2881,
+ 0.2821,
+ 0.2934,
+ 0.28,
+ 0.2958,
+ 0.2933,
+ 0.2923,
+ 0.2941,
+ 0.2872,
+ 0.2946,
+ 0.2966,
+ 0.2962,
+ 0.2915,
+ 0.2969,
+ 0.2988,
+ 0.2968,
+ 0.2991,
+ 0.2972,
+ 0.297,
+ 0.2955,
+ 0.2973,
+ 0.2994,
+ 0.2959,
+ 0.2962,
+ 0.3,
+ 0.2971,
+ 0.2977,
+ 0.2962,
+ 0.2963,
+ 0.2955,
+ 0.2959,
+ 0.2964,
+ 0.2962,
+ 0.2963,
+ 0.2968,
+ 0.2968
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.3571905195713043,
+ -2.4819419195409864e-05
+ ],
+ "perturbation_rho": [
+ -0.020394116640090942,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -3.2084062695503235e-07,
+ 0.0
+ ],
+ "0.003": [
+ -8.596107363700867e-07,
+ 0.0
+ ],
+ "0.01": [
+ -2.905726432800293e-06,
+ 0.0
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 53198.71875,
+ 2227773184.0,
+ 5250976256.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.0440073456029495e-07,
+ 3.7151820508896094e-10,
+ 3.7148767395578375e-10
+ ]
+ },
+ "drift": {
+ "embed.weight": 342.0501862953785,
+ "embed.bias": 318.0357815319326,
+ "blocks.0.ln.weight": 9.910735164962347,
+ "blocks.0.w1.weight": 324.42259888737226,
+ "blocks.0.w1.bias": 352.6779805020607,
+ "blocks.0.w2.weight": 492.2710513712036,
+ "blocks.1.ln.weight": 9.723967303148715,
+ "blocks.1.w1.weight": 403.31369239097415,
+ "blocks.1.w1.bias": 386.0984329662907,
+ "blocks.1.w2.weight": 397.9343379416526,
+ "out_ln.weight": 0.5056100406607513,
+ "out_head.weight": 8.24905668320801,
+ "out_head.bias": 2.0933992602399067
+ }
+ },
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.063060122451782,
+ 1.9739086376571655,
+ 1.9282753707504272,
+ 1.8921499670410156,
+ 1.8799907299804688,
+ 1.8701481190490723,
+ 1.8541997326660156,
+ 1.8432505453109742,
+ 1.8392359512710572,
+ 1.8295656701278686,
+ 1.8286965405273437,
+ 1.8275740008163452,
+ 1.82835955909729,
+ 1.8276023639297485,
+ 1.8295053287506104,
+ 1.8279134408569335,
+ 1.8347502783966065,
+ 1.8358594959259034,
+ 1.832546812095642,
+ 1.8375971967315674,
+ 1.8337256093978882,
+ 1.8388268453598022,
+ 1.8368015246200562,
+ 1.8367653689956664,
+ 1.837699118347168,
+ 1.8374284832763672,
+ 1.8332337552642821,
+ 1.8305227688217163,
+ 1.8352981665802002,
+ 1.8384290933227538,
+ 1.8319619774627685,
+ 1.8331132510375976,
+ 1.8284437879180908,
+ 1.8323823754882813,
+ 1.8337605920791626,
+ 1.8296470736312866,
+ 1.824372737045288,
+ 1.8253158220672607,
+ 1.8254631029891968,
+ 1.8240845959472656,
+ 1.819489220275879,
+ 1.8196685235214234,
+ 1.8173167004013062,
+ 1.8210680514526367,
+ 1.812099649734497,
+ 1.8139883127212524,
+ 1.810353461265564,
+ 1.8109969634246825,
+ 1.808874561843872,
+ 1.8115904225158692,
+ 1.8089021768188476,
+ 1.8070925519561767,
+ 1.807039188232422,
+ 1.8048222934341431,
+ 1.8031300540924071,
+ 1.8039923257446289,
+ 1.8042795065307617,
+ 1.8037835544586183,
+ 1.8002930462646485,
+ 1.8007701531982423,
+ 1.8004488678359984,
+ 1.8029598141098022,
+ 1.8020868547821045,
+ 1.7990351900482178,
+ 1.8022524103546143,
+ 1.7987030548477172,
+ 1.7969628913116455,
+ 1.7972235089874267,
+ 1.7918564282226563,
+ 1.7940529309082032,
+ 1.7972945267105103,
+ 1.7940796615219117,
+ 1.7942549993133545,
+ 1.7947112902450562,
+ 1.7927878363037109,
+ 1.7915658866119384,
+ 1.7944716805267333,
+ 1.790445680809021,
+ 1.7891779144668578,
+ 1.789405579185486,
+ 1.7867662616729736,
+ 1.7887766037368775,
+ 1.7875445496368407,
+ 1.7851270193862916,
+ 1.7886884448623657,
+ 1.786267046775818,
+ 1.785640559425354,
+ 1.7853610308074952,
+ 1.7856942657470702,
+ 1.7871524771499634,
+ 1.7883876535797119,
+ 1.782026519203186,
+ 1.786798097305298,
+ 1.7790444551849365,
+ 1.7840377599334716,
+ 1.787256519126892,
+ 1.7822379702758788,
+ 1.7822947565460205,
+ 1.7829025159072875,
+ 1.7819519442749023
+ ],
+ "train_acc": [
+ 0.24228,
+ 0.28314,
+ 0.30214,
+ 0.31828,
+ 0.32302,
+ 0.3277,
+ 0.33338,
+ 0.33888,
+ 0.34066,
+ 0.34536,
+ 0.34814,
+ 0.34648,
+ 0.34716,
+ 0.34526,
+ 0.3462,
+ 0.3422,
+ 0.343,
+ 0.34162,
+ 0.3438,
+ 0.34388,
+ 0.34354,
+ 0.33854,
+ 0.34312,
+ 0.34176,
+ 0.34514,
+ 0.34304,
+ 0.34458,
+ 0.34162,
+ 0.34348,
+ 0.34098,
+ 0.34374,
+ 0.34488,
+ 0.34328,
+ 0.34504,
+ 0.34414,
+ 0.34548,
+ 0.34552,
+ 0.34848,
+ 0.34836,
+ 0.34802,
+ 0.34918,
+ 0.346,
+ 0.34986,
+ 0.3473,
+ 0.3515,
+ 0.3527,
+ 0.3532,
+ 0.35212,
+ 0.35068,
+ 0.34998,
+ 0.3505,
+ 0.3565,
+ 0.35392,
+ 0.35556,
+ 0.35556,
+ 0.35462,
+ 0.3548,
+ 0.35674,
+ 0.35552,
+ 0.35848,
+ 0.35704,
+ 0.35594,
+ 0.35598,
+ 0.35716,
+ 0.35818,
+ 0.35842,
+ 0.35966,
+ 0.35968,
+ 0.36022,
+ 0.36082,
+ 0.3571,
+ 0.3612,
+ 0.3604,
+ 0.3607,
+ 0.3602,
+ 0.36134,
+ 0.35734,
+ 0.36262,
+ 0.36352,
+ 0.35916,
+ 0.36462,
+ 0.3617,
+ 0.3608,
+ 0.3617,
+ 0.36106,
+ 0.36262,
+ 0.36296,
+ 0.36354,
+ 0.36138,
+ 0.36132,
+ 0.36446,
+ 0.36452,
+ 0.36388,
+ 0.3645,
+ 0.36378,
+ 0.36342,
+ 0.36496,
+ 0.36556,
+ 0.36274,
+ 0.36546
+ ],
+ "test_acc": [
+ 0.2954,
+ 0.3137,
+ 0.3295,
+ 0.3474,
+ 0.3551,
+ 0.3544,
+ 0.3515,
+ 0.3694,
+ 0.3633,
+ 0.3479,
+ 0.3744,
+ 0.3726,
+ 0.371,
+ 0.3618,
+ 0.3649,
+ 0.3685,
+ 0.3658,
+ 0.3704,
+ 0.3504,
+ 0.3729,
+ 0.3578,
+ 0.3685,
+ 0.3676,
+ 0.3643,
+ 0.3562,
+ 0.3486,
+ 0.3732,
+ 0.3624,
+ 0.3693,
+ 0.341,
+ 0.3467,
+ 0.3544,
+ 0.3679,
+ 0.3526,
+ 0.3593,
+ 0.3647,
+ 0.3604,
+ 0.3662,
+ 0.3632,
+ 0.3644,
+ 0.3628,
+ 0.3598,
+ 0.3564,
+ 0.3633,
+ 0.3531,
+ 0.3607,
+ 0.3616,
+ 0.3636,
+ 0.3514,
+ 0.3488,
+ 0.3408,
+ 0.3522,
+ 0.3651,
+ 0.3408,
+ 0.3548,
+ 0.3504,
+ 0.3469,
+ 0.3507,
+ 0.3515,
+ 0.3434,
+ 0.3548,
+ 0.351,
+ 0.351,
+ 0.3545,
+ 0.3487,
+ 0.3467,
+ 0.3492,
+ 0.3439,
+ 0.346,
+ 0.3357,
+ 0.332,
+ 0.3387,
+ 0.3546,
+ 0.3415,
+ 0.3458,
+ 0.3451,
+ 0.3477,
+ 0.342,
+ 0.3446,
+ 0.3427,
+ 0.3426,
+ 0.3423,
+ 0.3481,
+ 0.3467,
+ 0.3443,
+ 0.3437,
+ 0.3466,
+ 0.3459,
+ 0.3448,
+ 0.3458,
+ 0.3433,
+ 0.3461,
+ 0.3479,
+ 0.3447,
+ 0.3452,
+ 0.3467,
+ 0.3461,
+ 0.3467,
+ 0.3464,
+ 0.3464
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.01565447635948658,
+ 0.9284564256668091
+ ],
+ "perturbation_rho": [
+ 0.08889118582010269,
+ 0.1751367598772049
+ ],
+ "nudging": {
+ "0.001": [
+ -8.567003533244133e-07,
+ -7.14592169970274e-06
+ ],
+ "0.003": [
+ -2.5028130039572716e-06,
+ -2.1490384824573994e-05
+ ],
+ "0.01": [
+ -8.566654287278652e-06,
+ -7.176969666033983e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 5015.7705078125,
+ 205831.875,
+ 281989.59375
+ ],
+ "bp_grad_norms_per_layer": [
+ 1.882538890640717e-05,
+ 8.274267884189612e-07,
+ 8.043497246035258e-07
+ ]
+ },
+ "drift": {
+ "embed.weight": 31.381319271594045,
+ "embed.bias": 16.70881646410694,
+ "blocks.0.ln.weight": 1.5550725713952875,
+ "blocks.0.w1.weight": 29.555012389084762,
+ "blocks.0.w1.bias": 17.153011809958922,
+ "blocks.0.w2.weight": 62.82184507015774,
+ "blocks.1.ln.weight": 1.2734634249220895,
+ "blocks.1.w1.weight": 21.575349693350912,
+ "blocks.1.w1.bias": 10.895115401942027,
+ "blocks.1.w2.weight": 35.67159460439069,
+ "out_ln.weight": 0.4183849023916904,
+ "out_head.weight": 4.1274562698411295,
+ "out_head.bias": 12.873937810986282
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 2,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 2
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_dfa_d512_L2_seed2",
+ "methods": [
+ "fa",
+ "dfa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file