summaryrefslogtreecommitdiff
path: root/results/fa_dfa_d512_L2_seed8/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_dfa_d512_L2_seed8/results_cifar10.json')
-rw-r--r--results/fa_dfa_d512_L2_seed8/results_cifar10.json749
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed8/results_cifar10.json b/results/fa_dfa_d512_L2_seed8/results_cifar10.json
new file mode 100644
index 0000000..ad4f8bf
--- /dev/null
+++ b/results/fa_dfa_d512_L2_seed8/results_cifar10.json
@@ -0,0 +1,749 @@
+{
+ "8": {
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.0461414054870604,
+ 2.028953609237671,
+ 2.0224830960845948,
+ 2.0189640741348267,
+ 2.0186043047332762,
+ 2.011939255371094,
+ 2.00884051902771,
+ 2.006375752105713,
+ 2.0061196725463866,
+ 2.0044810569763185,
+ 2.000473762359619,
+ 1.999425143661499,
+ 1.9991976582336426,
+ 1.9983828188323975,
+ 1.9999516902160646,
+ 2.000131714401245,
+ 2.000538674583435,
+ 1.999087513999939,
+ 1.9965772060394287,
+ 1.9952695233154296,
+ 1.9958783276367187,
+ 1.9935351610565186,
+ 1.9946063667297362,
+ 1.9927719008636475,
+ 1.9930043865203857,
+ 1.992498685836792,
+ 1.9923327257537842,
+ 1.9919360898208618,
+ 1.9922407612609863,
+ 1.992235760192871,
+ 1.992523240623474,
+ 1.9913750788116455,
+ 1.9934618493652343,
+ 1.9923072975921632,
+ 1.991889149017334,
+ 1.9904881185913086,
+ 1.9916703072357178,
+ 1.9886171953582763,
+ 1.9906551904296874,
+ 1.9912475842285156,
+ 1.9906490882873535,
+ 1.9897464477920532,
+ 1.9902090267562866,
+ 1.98889538230896,
+ 1.9899030431365967,
+ 1.9914473651885987,
+ 1.987290951499939,
+ 1.9882332851409912,
+ 1.987876655883789,
+ 1.986627554321289,
+ 1.9874235430526734,
+ 1.985631577758789,
+ 1.9859224739074708,
+ 1.984819174156189,
+ 1.9877312922668458,
+ 1.9880256802749634,
+ 1.9883026748657227,
+ 1.9880133050918578,
+ 1.9872900528717041,
+ 1.9861614239501952,
+ 1.9879061701202392,
+ 1.986334129486084,
+ 1.9889874462509156,
+ 1.9848816363143922,
+ 1.985108938598633,
+ 1.9852813848114013,
+ 1.9847304062652589,
+ 1.9842171102142334,
+ 1.986599141769409,
+ 1.9858817081451416,
+ 1.9852649099349975,
+ 1.982235690460205,
+ 1.9838326638793946,
+ 1.9827596533966065,
+ 1.9836663906097411,
+ 1.9844815605163575,
+ 1.9842618350982666,
+ 1.984488549156189,
+ 1.9830066680908203,
+ 1.9835596384048462,
+ 1.9822921755981446,
+ 1.9845924890899658,
+ 1.9827096743392945,
+ 1.9821208544158935,
+ 1.983244455909729,
+ 1.9823134091567993,
+ 1.9837292085266114,
+ 1.9827219149017334,
+ 1.9828275063323975,
+ 1.9811715400695802,
+ 1.9821106326675415,
+ 1.9830516720199585,
+ 1.9831754531097412,
+ 1.9825017529296876,
+ 1.9844729486465453,
+ 1.9823845765686035,
+ 1.9825008573913574,
+ 1.9817371285247802,
+ 1.9809684440612794,
+ 1.981824859008789
+ ],
+ "train_acc": [
+ 0.24566,
+ 0.25216,
+ 0.25672,
+ 0.2583,
+ 0.25908,
+ 0.2611,
+ 0.26292,
+ 0.26504,
+ 0.26436,
+ 0.26372,
+ 0.26838,
+ 0.2684,
+ 0.26774,
+ 0.26886,
+ 0.26864,
+ 0.26928,
+ 0.26802,
+ 0.26984,
+ 0.27068,
+ 0.27056,
+ 0.27002,
+ 0.27018,
+ 0.27034,
+ 0.27138,
+ 0.27238,
+ 0.27266,
+ 0.27208,
+ 0.27464,
+ 0.27406,
+ 0.27306,
+ 0.27278,
+ 0.27354,
+ 0.27164,
+ 0.27506,
+ 0.27494,
+ 0.27682,
+ 0.27244,
+ 0.2749,
+ 0.27302,
+ 0.2745,
+ 0.2736,
+ 0.27382,
+ 0.27478,
+ 0.27344,
+ 0.27582,
+ 0.2732,
+ 0.27662,
+ 0.27616,
+ 0.2763,
+ 0.27742,
+ 0.27642,
+ 0.27984,
+ 0.2777,
+ 0.28112,
+ 0.27754,
+ 0.27344,
+ 0.2769,
+ 0.27664,
+ 0.27734,
+ 0.27754,
+ 0.27784,
+ 0.27642,
+ 0.27598,
+ 0.2796,
+ 0.27964,
+ 0.27868,
+ 0.27864,
+ 0.27868,
+ 0.27826,
+ 0.27986,
+ 0.27616,
+ 0.2817,
+ 0.28024,
+ 0.27688,
+ 0.28002,
+ 0.27942,
+ 0.27838,
+ 0.2787,
+ 0.27856,
+ 0.28034,
+ 0.27972,
+ 0.27722,
+ 0.27992,
+ 0.28172,
+ 0.27796,
+ 0.2775,
+ 0.28122,
+ 0.2803,
+ 0.27958,
+ 0.27936,
+ 0.28062,
+ 0.2791,
+ 0.2797,
+ 0.28202,
+ 0.27898,
+ 0.27894,
+ 0.27866,
+ 0.27832,
+ 0.28,
+ 0.28114
+ ],
+ "test_acc": [
+ 0.2641,
+ 0.2447,
+ 0.2423,
+ 0.2586,
+ 0.2666,
+ 0.2868,
+ 0.2779,
+ 0.27,
+ 0.2886,
+ 0.2704,
+ 0.2846,
+ 0.2825,
+ 0.2801,
+ 0.2912,
+ 0.277,
+ 0.2834,
+ 0.2838,
+ 0.2802,
+ 0.2793,
+ 0.2883,
+ 0.2871,
+ 0.2825,
+ 0.288,
+ 0.2913,
+ 0.2813,
+ 0.2931,
+ 0.2994,
+ 0.3001,
+ 0.2753,
+ 0.2966,
+ 0.2996,
+ 0.2965,
+ 0.2835,
+ 0.3002,
+ 0.2979,
+ 0.2783,
+ 0.3017,
+ 0.2848,
+ 0.2846,
+ 0.2928,
+ 0.2956,
+ 0.2705,
+ 0.2811,
+ 0.292,
+ 0.2763,
+ 0.2834,
+ 0.2837,
+ 0.2949,
+ 0.2998,
+ 0.2894,
+ 0.2853,
+ 0.2921,
+ 0.2986,
+ 0.2918,
+ 0.2933,
+ 0.28,
+ 0.2988,
+ 0.2925,
+ 0.2828,
+ 0.2875,
+ 0.2985,
+ 0.2927,
+ 0.2922,
+ 0.3016,
+ 0.2947,
+ 0.2952,
+ 0.2936,
+ 0.2923,
+ 0.2992,
+ 0.2968,
+ 0.2915,
+ 0.2992,
+ 0.2941,
+ 0.2969,
+ 0.2936,
+ 0.2972,
+ 0.2964,
+ 0.2928,
+ 0.2958,
+ 0.2973,
+ 0.2958,
+ 0.2971,
+ 0.2983,
+ 0.2983,
+ 0.2951,
+ 0.2963,
+ 0.2953,
+ 0.2964,
+ 0.2963,
+ 0.293,
+ 0.2951,
+ 0.2967,
+ 0.2967,
+ 0.297,
+ 0.2966,
+ 0.2967,
+ 0.2967,
+ 0.2966,
+ 0.2966,
+ 0.2967
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.3839848041534424,
+ -0.0006596383173018694
+ ],
+ "perturbation_rho": [
+ 0.02412901259958744,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -4.284083843231201e-07,
+ 0.0
+ ],
+ "0.003": [
+ -1.3029202818870544e-06,
+ 0.0
+ ],
+ "0.01": [
+ -4.258938133716583e-06,
+ 0.0
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 53606.07421875,
+ 782741952.0,
+ 4561426432.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 3.0959373020778003e-07,
+ 3.211692578553027e-10,
+ 3.2110258896267396e-10
+ ]
+ },
+ "drift": {
+ "embed.weight": 322.14716880304843,
+ "embed.bias": 253.7663922411994,
+ "blocks.0.ln.weight": 9.639264948834146,
+ "blocks.0.w1.weight": 278.73838749620353,
+ "blocks.0.w1.bias": 250.4325839565606,
+ "blocks.0.w2.weight": 488.7145731499842,
+ "blocks.1.ln.weight": 9.351844341907716,
+ "blocks.1.w1.weight": 376.1230199590697,
+ "blocks.1.w1.bias": 376.4920228948829,
+ "blocks.1.w2.weight": 403.36194320458816,
+ "out_ln.weight": 0.513534701987637,
+ "out_head.weight": 7.742896807554914,
+ "out_head.bias": 1.1408249446090957
+ }
+ },
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.0653204177856446,
+ 1.9681754495239259,
+ 1.9207439241790771,
+ 1.8943786935806275,
+ 1.8802625274276734,
+ 1.8628883916473389,
+ 1.8490794301605225,
+ 1.8400364615249634,
+ 1.8355530837249756,
+ 1.8266534114837647,
+ 1.8170614450454712,
+ 1.8170341843414306,
+ 1.809728816757202,
+ 1.80435710231781,
+ 1.8044258756256104,
+ 1.7987670265960694,
+ 1.7999644842147826,
+ 1.7953315704345703,
+ 1.7825802756118774,
+ 1.7845099126434327,
+ 1.7779603283691405,
+ 1.7730702184677125,
+ 1.7695367748260498,
+ 1.7647147689056397,
+ 1.7608037928009033,
+ 1.7535330474090576,
+ 1.75540680393219,
+ 1.7487119026947022,
+ 1.7451758492279053,
+ 1.745663233718872,
+ 1.7409377331924438,
+ 1.7372819427871704,
+ 1.7388353146743774,
+ 1.7410107398605346,
+ 1.7357459603881835,
+ 1.7290400104522705,
+ 1.7318879638290405,
+ 1.729545888900757,
+ 1.7291300962066651,
+ 1.733487999343872,
+ 1.7302352466583253,
+ 1.7331863732147217,
+ 1.7339300806045532,
+ 1.7359314554595948,
+ 1.7347373684310914,
+ 1.7375746230316162,
+ 1.7313235457611085,
+ 1.7353338851165772,
+ 1.73820286403656,
+ 1.7340232833862306,
+ 1.7341221398925781,
+ 1.7339955667114257,
+ 1.7339833393096924,
+ 1.7300079647064208,
+ 1.7303287143707275,
+ 1.7298947993469238,
+ 1.7274299069213868,
+ 1.7319763919067384,
+ 1.7264507590103149,
+ 1.7299312719726563,
+ 1.7262817291641235,
+ 1.7270497384262085,
+ 1.7246126723098756,
+ 1.7255360033798217,
+ 1.7196656997680664,
+ 1.7214281465911865,
+ 1.7198693132781981,
+ 1.7217327685546875,
+ 1.7179188094329834,
+ 1.7154542624664306,
+ 1.7195643279266357,
+ 1.7149108078384399,
+ 1.7153279098510743,
+ 1.7153327802276612,
+ 1.7094103066253663,
+ 1.7162176602554322,
+ 1.7122739435195924,
+ 1.7128758419418335,
+ 1.708295757408142,
+ 1.7086283514785767,
+ 1.7106998838043213,
+ 1.711903858909607,
+ 1.7090504042434693,
+ 1.7111234002304077,
+ 1.7090101749420166,
+ 1.7079448748779298,
+ 1.707335115890503,
+ 1.7080174974822997,
+ 1.705443286972046,
+ 1.7056840801239013,
+ 1.708050958175659,
+ 1.7072754711151124,
+ 1.7059114752960205,
+ 1.7063753726959228,
+ 1.7061457764434815,
+ 1.7009761544418336,
+ 1.707751445274353,
+ 1.7066948248291016,
+ 1.7041513320922852,
+ 1.7030947677612305
+ ],
+ "train_acc": [
+ 0.24824,
+ 0.29,
+ 0.30804,
+ 0.32064,
+ 0.32604,
+ 0.33114,
+ 0.33818,
+ 0.3373,
+ 0.34064,
+ 0.3462,
+ 0.34982,
+ 0.34634,
+ 0.35334,
+ 0.35346,
+ 0.35488,
+ 0.3554,
+ 0.35676,
+ 0.35738,
+ 0.36206,
+ 0.36144,
+ 0.36364,
+ 0.3671,
+ 0.36916,
+ 0.3698,
+ 0.37032,
+ 0.3709,
+ 0.37188,
+ 0.3757,
+ 0.37546,
+ 0.37376,
+ 0.37888,
+ 0.37908,
+ 0.37828,
+ 0.37822,
+ 0.37984,
+ 0.3791,
+ 0.38144,
+ 0.38286,
+ 0.37966,
+ 0.3797,
+ 0.38152,
+ 0.38084,
+ 0.3812,
+ 0.3809,
+ 0.38156,
+ 0.382,
+ 0.38494,
+ 0.38258,
+ 0.38066,
+ 0.3824,
+ 0.38058,
+ 0.38342,
+ 0.3823,
+ 0.38198,
+ 0.38534,
+ 0.38368,
+ 0.38524,
+ 0.38594,
+ 0.38536,
+ 0.38514,
+ 0.38676,
+ 0.38838,
+ 0.38778,
+ 0.38664,
+ 0.39118,
+ 0.38748,
+ 0.39154,
+ 0.3882,
+ 0.38852,
+ 0.39078,
+ 0.38918,
+ 0.39202,
+ 0.39086,
+ 0.39128,
+ 0.39242,
+ 0.3935,
+ 0.39422,
+ 0.39322,
+ 0.39388,
+ 0.39516,
+ 0.39496,
+ 0.39414,
+ 0.39428,
+ 0.39522,
+ 0.39426,
+ 0.3953,
+ 0.39628,
+ 0.39662,
+ 0.39662,
+ 0.39608,
+ 0.39646,
+ 0.39568,
+ 0.39606,
+ 0.39558,
+ 0.3961,
+ 0.3992,
+ 0.39438,
+ 0.39786,
+ 0.39626,
+ 0.39922
+ ],
+ "test_acc": [
+ 0.297,
+ 0.3142,
+ 0.3407,
+ 0.3409,
+ 0.3537,
+ 0.3628,
+ 0.3482,
+ 0.3626,
+ 0.3557,
+ 0.351,
+ 0.3614,
+ 0.3693,
+ 0.363,
+ 0.3681,
+ 0.374,
+ 0.3756,
+ 0.3778,
+ 0.3795,
+ 0.3757,
+ 0.3742,
+ 0.3801,
+ 0.3732,
+ 0.3782,
+ 0.3805,
+ 0.3718,
+ 0.3786,
+ 0.3914,
+ 0.3924,
+ 0.3797,
+ 0.3967,
+ 0.3891,
+ 0.3829,
+ 0.3811,
+ 0.3967,
+ 0.3876,
+ 0.3862,
+ 0.3945,
+ 0.3851,
+ 0.3807,
+ 0.3871,
+ 0.3924,
+ 0.3941,
+ 0.3823,
+ 0.392,
+ 0.3942,
+ 0.3908,
+ 0.3979,
+ 0.3954,
+ 0.4003,
+ 0.401,
+ 0.3938,
+ 0.3938,
+ 0.3997,
+ 0.3943,
+ 0.4069,
+ 0.4012,
+ 0.4056,
+ 0.408,
+ 0.4037,
+ 0.3996,
+ 0.4115,
+ 0.4098,
+ 0.4062,
+ 0.4083,
+ 0.4115,
+ 0.4094,
+ 0.4147,
+ 0.4109,
+ 0.4101,
+ 0.4084,
+ 0.4112,
+ 0.4114,
+ 0.4127,
+ 0.4113,
+ 0.407,
+ 0.4126,
+ 0.4167,
+ 0.4132,
+ 0.4156,
+ 0.4138,
+ 0.4122,
+ 0.4128,
+ 0.417,
+ 0.4138,
+ 0.4128,
+ 0.4136,
+ 0.4137,
+ 0.4132,
+ 0.4153,
+ 0.4136,
+ 0.4123,
+ 0.413,
+ 0.4134,
+ 0.4142,
+ 0.4155,
+ 0.4155,
+ 0.4142,
+ 0.4147,
+ 0.4149,
+ 0.4146
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.02496020682156086,
+ 0.9624444246292114
+ ],
+ "perturbation_rho": [
+ -0.018970193341374397,
+ 0.1267668902873993
+ ],
+ "nudging": {
+ "0.001": [
+ -2.1758460206910968e-06,
+ -7.471287972293794e-06
+ ],
+ "0.003": [
+ -6.601490895263851e-06,
+ -2.2840846213512123e-05
+ ],
+ "0.01": [
+ -2.1907704649493098e-05,
+ -7.614441710757092e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 6420.08984375,
+ 205601.1875,
+ 92651.546875
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.9750526664429344e-05,
+ 2.456108632031828e-06,
+ 2.075838210657821e-06
+ ]
+ },
+ "drift": {
+ "embed.weight": 37.110060620728056,
+ "embed.bias": 24.00213600327038,
+ "blocks.0.ln.weight": 1.3952106680756078,
+ "blocks.0.w1.weight": 19.29938322080228,
+ "blocks.0.w1.bias": 17.715456046599957,
+ "blocks.0.w2.weight": 54.87838247174745,
+ "blocks.1.ln.weight": 1.0669201771550085,
+ "blocks.1.w1.weight": 18.224214324200183,
+ "blocks.1.w1.bias": 17.474148202150594,
+ "blocks.1.w2.weight": 31.754151778532563,
+ "out_ln.weight": 0.42931707858608786,
+ "out_head.weight": 4.036471355678216,
+ "out_head.bias": 7.088871139191845
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 2,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 8
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_dfa_d512_L2_seed8",
+ "methods": [
+ "fa",
+ "dfa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file