summaryrefslogtreecommitdiff
path: root/results/fa_dfa_d512_L2_seed7/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_dfa_d512_L2_seed7/results_cifar10.json')
-rw-r--r--results/fa_dfa_d512_L2_seed7/results_cifar10.json749
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed7/results_cifar10.json b/results/fa_dfa_d512_L2_seed7/results_cifar10.json
new file mode 100644
index 0000000..481338c
--- /dev/null
+++ b/results/fa_dfa_d512_L2_seed7/results_cifar10.json
@@ -0,0 +1,749 @@
+{
+ "7": {
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.055191882095337,
+ 2.043570478172302,
+ 2.0389851570892334,
+ 2.035236138343811,
+ 2.034318865890503,
+ 2.028933349571228,
+ 2.027525556945801,
+ 2.0267114724731443,
+ 2.0244813998031614,
+ 2.0217119938659667,
+ 2.0195889541625975,
+ 2.0210990812683107,
+ 2.0200074877166747,
+ 2.0166528286743164,
+ 2.0172128536224365,
+ 2.0116504791259766,
+ 2.0116141784667967,
+ 2.007682880592346,
+ 2.0073163960266114,
+ 2.0056607851791384,
+ 2.0035111226654054,
+ 2.0027661852264402,
+ 2.001486244812012,
+ 1.9986013162231446,
+ 1.997822530975342,
+ 1.994211967010498,
+ 1.9924970539093017,
+ 1.991006000213623,
+ 1.9917142455291748,
+ 1.9929195302581788,
+ 1.991425333518982,
+ 1.9895027528381348,
+ 1.9874201156997682,
+ 1.9884889245605468,
+ 1.986476892967224,
+ 1.9826913553237915,
+ 1.9848502500152587,
+ 1.982286188697815,
+ 1.9824313144683838,
+ 1.9826200205230713,
+ 1.9815959204864502,
+ 1.9807573030853272,
+ 1.9788639946746827,
+ 1.9796723455810548,
+ 1.976197322998047,
+ 1.9779787089538574,
+ 1.9767974209594728,
+ 1.9764958350372315,
+ 1.9774945835876465,
+ 1.9747930298614502,
+ 1.9727936906433106,
+ 1.9740131066131592,
+ 1.9746413722991942,
+ 1.9732583834838868,
+ 1.9723580028533936,
+ 1.9721147798919678,
+ 1.972632116394043,
+ 1.970795502243042,
+ 1.9690511889648437,
+ 1.9716948537826537,
+ 1.9707828464508057,
+ 1.9699502618026734,
+ 1.969847806854248,
+ 1.9696522138214112,
+ 1.9674137978744506,
+ 1.9683316724014281,
+ 1.96831518825531,
+ 1.9711441744613647,
+ 1.9686481335830688,
+ 1.9681067206573486,
+ 1.9675092895507813,
+ 1.9689227291107179,
+ 1.9677108968353272,
+ 1.9652254253387451,
+ 1.9658482390594483,
+ 1.9671778398895263,
+ 1.9676923946762086,
+ 1.9644599740219115,
+ 1.9651101944351197,
+ 1.9664753457260131,
+ 1.9669549044799806,
+ 1.9642051581573485,
+ 1.9663040605163575,
+ 1.9670575283432006,
+ 1.9643160835266114,
+ 1.9654435306167604,
+ 1.964134133644104,
+ 1.9641572988891602,
+ 1.9649527727508544,
+ 1.9648468869781495,
+ 1.9629023349380492,
+ 1.9663221743774415,
+ 1.9669214375305175,
+ 1.9649668531036377,
+ 1.9656098468780518,
+ 1.966679817123413,
+ 1.9638590016174315,
+ 1.9619427868270873,
+ 1.9663854665756226,
+ 1.966093027381897
+ ],
+ "train_acc": [
+ 0.24264,
+ 0.24694,
+ 0.24798,
+ 0.24876,
+ 0.25246,
+ 0.25632,
+ 0.25708,
+ 0.25698,
+ 0.25824,
+ 0.26182,
+ 0.2633,
+ 0.26056,
+ 0.26094,
+ 0.26186,
+ 0.26334,
+ 0.26518,
+ 0.26768,
+ 0.26548,
+ 0.26774,
+ 0.26878,
+ 0.2695,
+ 0.2733,
+ 0.26882,
+ 0.27458,
+ 0.2744,
+ 0.27714,
+ 0.27356,
+ 0.27912,
+ 0.27626,
+ 0.27554,
+ 0.2775,
+ 0.2796,
+ 0.27856,
+ 0.27752,
+ 0.27988,
+ 0.28044,
+ 0.28096,
+ 0.2833,
+ 0.28072,
+ 0.28224,
+ 0.28246,
+ 0.28386,
+ 0.28302,
+ 0.28622,
+ 0.28438,
+ 0.28368,
+ 0.28372,
+ 0.28316,
+ 0.28436,
+ 0.28636,
+ 0.28652,
+ 0.28768,
+ 0.2859,
+ 0.28832,
+ 0.28462,
+ 0.28838,
+ 0.2877,
+ 0.28634,
+ 0.28904,
+ 0.28846,
+ 0.28746,
+ 0.28738,
+ 0.2889,
+ 0.28872,
+ 0.28988,
+ 0.28838,
+ 0.2881,
+ 0.29144,
+ 0.28876,
+ 0.28998,
+ 0.29006,
+ 0.28796,
+ 0.28852,
+ 0.29134,
+ 0.29044,
+ 0.29064,
+ 0.28968,
+ 0.2908,
+ 0.28898,
+ 0.29126,
+ 0.28764,
+ 0.29144,
+ 0.2911,
+ 0.29084,
+ 0.29148,
+ 0.28904,
+ 0.29322,
+ 0.2902,
+ 0.2903,
+ 0.2903,
+ 0.29346,
+ 0.2899,
+ 0.28924,
+ 0.29046,
+ 0.28966,
+ 0.29182,
+ 0.2899,
+ 0.28986,
+ 0.2916,
+ 0.28824
+ ],
+ "test_acc": [
+ 0.2524,
+ 0.2673,
+ 0.2815,
+ 0.2506,
+ 0.2816,
+ 0.2711,
+ 0.2809,
+ 0.2844,
+ 0.2929,
+ 0.286,
+ 0.2744,
+ 0.289,
+ 0.2842,
+ 0.2845,
+ 0.2813,
+ 0.2816,
+ 0.2741,
+ 0.2919,
+ 0.2911,
+ 0.2705,
+ 0.2945,
+ 0.3034,
+ 0.2878,
+ 0.2798,
+ 0.2791,
+ 0.298,
+ 0.2976,
+ 0.293,
+ 0.2996,
+ 0.2971,
+ 0.3057,
+ 0.3087,
+ 0.3011,
+ 0.3061,
+ 0.3061,
+ 0.2919,
+ 0.3051,
+ 0.306,
+ 0.3078,
+ 0.3056,
+ 0.3019,
+ 0.3022,
+ 0.3075,
+ 0.3081,
+ 0.3008,
+ 0.2993,
+ 0.2992,
+ 0.3129,
+ 0.3147,
+ 0.2965,
+ 0.31,
+ 0.2998,
+ 0.3082,
+ 0.312,
+ 0.3096,
+ 0.3084,
+ 0.306,
+ 0.3072,
+ 0.308,
+ 0.3153,
+ 0.3089,
+ 0.3032,
+ 0.3083,
+ 0.3208,
+ 0.3021,
+ 0.3158,
+ 0.3101,
+ 0.3162,
+ 0.3125,
+ 0.3103,
+ 0.3118,
+ 0.309,
+ 0.3117,
+ 0.3098,
+ 0.3162,
+ 0.3136,
+ 0.3107,
+ 0.3074,
+ 0.3122,
+ 0.3141,
+ 0.3127,
+ 0.314,
+ 0.3129,
+ 0.3145,
+ 0.3133,
+ 0.3138,
+ 0.3131,
+ 0.3158,
+ 0.3159,
+ 0.3161,
+ 0.3141,
+ 0.3163,
+ 0.3165,
+ 0.3154,
+ 0.3163,
+ 0.3164,
+ 0.3155,
+ 0.3155,
+ 0.3157,
+ 0.3157
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.4341934025287628,
+ -0.0012890032958239317
+ ],
+ "perturbation_rho": [
+ -0.016353363171219826,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -6.253831088542938e-07,
+ 0.0
+ ],
+ "0.003": [
+ -1.7937272787094116e-06,
+ 1.862645149230957e-09
+ ],
+ "0.01": [
+ -6.007961928844452e-06,
+ 5.587935447692871e-09
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 51618.765625,
+ 586580544.0,
+ 3527968768.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 3.575926825760689e-07,
+ 3.2419492090873803e-10,
+ 3.250963664935824e-10
+ ]
+ },
+ "drift": {
+ "embed.weight": 305.91109235091693,
+ "embed.bias": 181.83596330336093,
+ "blocks.0.ln.weight": 10.507483299521725,
+ "blocks.0.w1.weight": 259.244642347064,
+ "blocks.0.w1.bias": 195.88858302375624,
+ "blocks.0.w2.weight": 487.57558684361754,
+ "blocks.1.ln.weight": 9.741938719661329,
+ "blocks.1.w1.weight": 370.35850714262523,
+ "blocks.1.w1.bias": 288.30321808565367,
+ "blocks.1.w2.weight": 411.72437143655895,
+ "out_ln.weight": 0.4751365199666905,
+ "out_head.weight": 6.958959988926819,
+ "out_head.bias": 2.336896476076589
+ }
+ },
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.065423551902771,
+ 1.959441243019104,
+ 1.922898962135315,
+ 1.8985358092498779,
+ 1.8807485336685181,
+ 1.8632725805664063,
+ 1.8535257900238038,
+ 1.8472118298339844,
+ 1.8383856839752197,
+ 1.8354701901626587,
+ 1.8370730047988892,
+ 1.837422192993164,
+ 1.8389883419036865,
+ 1.8328349654388427,
+ 1.8349895798110962,
+ 1.8335126385116578,
+ 1.8306356255722045,
+ 1.8322726831817626,
+ 1.8286183166885377,
+ 1.8288718432617188,
+ 1.8341219143295289,
+ 1.8368035592269898,
+ 1.836811799583435,
+ 1.836639772872925,
+ 1.8373656529998779,
+ 1.836424264526367,
+ 1.8352625201797486,
+ 1.835800665588379,
+ 1.832284771118164,
+ 1.833700514755249,
+ 1.8298065981674194,
+ 1.8254384775543213,
+ 1.821793406639099,
+ 1.8201812942123412,
+ 1.8183945245742799,
+ 1.8144645150375367,
+ 1.8105643741607667,
+ 1.809894971961975,
+ 1.804399468612671,
+ 1.8044112042999267,
+ 1.8014125130844116,
+ 1.8024961044311523,
+ 1.7954880487442018,
+ 1.798938335647583,
+ 1.790709694480896,
+ 1.7935989169311524,
+ 1.7944183544921875,
+ 1.7913234217071534,
+ 1.7892272469711303,
+ 1.7870802127838135,
+ 1.7874060748291016,
+ 1.7849993677139282,
+ 1.7821664669418336,
+ 1.784739924659729,
+ 1.7879353686523438,
+ 1.786940495300293,
+ 1.784608112564087,
+ 1.7870150913238525,
+ 1.7842396997070313,
+ 1.7843707611465454,
+ 1.7866798919296265,
+ 1.7842874060440064,
+ 1.7791111608886718,
+ 1.7806335921859742,
+ 1.7796328140640258,
+ 1.7788975708770751,
+ 1.7777235781097411,
+ 1.7809623500823974,
+ 1.7793159552764892,
+ 1.7774666768646241,
+ 1.7777468250274657,
+ 1.7797447577667236,
+ 1.7749399490356446,
+ 1.7782198504257203,
+ 1.7768975478744506,
+ 1.7724751330184936,
+ 1.7744919674682618,
+ 1.771957764816284,
+ 1.773150245323181,
+ 1.7745548120880128,
+ 1.7708911740112305,
+ 1.7687720165634155,
+ 1.7715272402191162,
+ 1.7657094653320313,
+ 1.7654507334899903,
+ 1.7671412448120116,
+ 1.7664664395904541,
+ 1.768566664352417,
+ 1.7679725888824462,
+ 1.7632778255844117,
+ 1.7664907150268554,
+ 1.7670541214370727,
+ 1.7653729449081421,
+ 1.7616971383666993,
+ 1.7609278664398194,
+ 1.7637566931915283,
+ 1.764719966506958,
+ 1.7616608474349975,
+ 1.7632052117538453,
+ 1.7648505276107789
+ ],
+ "train_acc": [
+ 0.24818,
+ 0.2905,
+ 0.3052,
+ 0.31584,
+ 0.32536,
+ 0.33246,
+ 0.33778,
+ 0.33886,
+ 0.33934,
+ 0.34248,
+ 0.3433,
+ 0.34108,
+ 0.33788,
+ 0.34122,
+ 0.3401,
+ 0.34124,
+ 0.3422,
+ 0.3437,
+ 0.34032,
+ 0.34338,
+ 0.33892,
+ 0.33994,
+ 0.3359,
+ 0.33762,
+ 0.33858,
+ 0.33796,
+ 0.33882,
+ 0.34338,
+ 0.34164,
+ 0.34066,
+ 0.34704,
+ 0.3459,
+ 0.34644,
+ 0.34698,
+ 0.34912,
+ 0.34876,
+ 0.3523,
+ 0.35206,
+ 0.35342,
+ 0.35536,
+ 0.35396,
+ 0.3552,
+ 0.35924,
+ 0.35432,
+ 0.35796,
+ 0.35682,
+ 0.35832,
+ 0.35936,
+ 0.36088,
+ 0.36014,
+ 0.36244,
+ 0.3632,
+ 0.36318,
+ 0.36202,
+ 0.36224,
+ 0.36138,
+ 0.36264,
+ 0.35992,
+ 0.3656,
+ 0.36372,
+ 0.3631,
+ 0.3644,
+ 0.3645,
+ 0.36648,
+ 0.36714,
+ 0.36738,
+ 0.3652,
+ 0.36398,
+ 0.36904,
+ 0.3683,
+ 0.36936,
+ 0.3682,
+ 0.36688,
+ 0.36788,
+ 0.3702,
+ 0.36986,
+ 0.36914,
+ 0.3728,
+ 0.3697,
+ 0.37158,
+ 0.37106,
+ 0.37164,
+ 0.37216,
+ 0.3765,
+ 0.37258,
+ 0.3718,
+ 0.37274,
+ 0.37224,
+ 0.3709,
+ 0.372,
+ 0.37362,
+ 0.3726,
+ 0.37316,
+ 0.37384,
+ 0.37496,
+ 0.37558,
+ 0.3719,
+ 0.37734,
+ 0.37454,
+ 0.37464
+ ],
+ "test_acc": [
+ 0.2781,
+ 0.3155,
+ 0.3352,
+ 0.3255,
+ 0.3405,
+ 0.3545,
+ 0.3621,
+ 0.3461,
+ 0.3528,
+ 0.3543,
+ 0.331,
+ 0.3589,
+ 0.3453,
+ 0.349,
+ 0.3481,
+ 0.3479,
+ 0.355,
+ 0.3516,
+ 0.347,
+ 0.3387,
+ 0.3431,
+ 0.3418,
+ 0.3297,
+ 0.3231,
+ 0.3156,
+ 0.3425,
+ 0.3359,
+ 0.3325,
+ 0.3627,
+ 0.3371,
+ 0.351,
+ 0.3523,
+ 0.3384,
+ 0.3573,
+ 0.3432,
+ 0.3522,
+ 0.3549,
+ 0.3581,
+ 0.361,
+ 0.3577,
+ 0.3477,
+ 0.3498,
+ 0.3374,
+ 0.3495,
+ 0.337,
+ 0.3531,
+ 0.3467,
+ 0.3464,
+ 0.3582,
+ 0.3339,
+ 0.3416,
+ 0.3402,
+ 0.3472,
+ 0.3388,
+ 0.3466,
+ 0.3442,
+ 0.3452,
+ 0.3515,
+ 0.3485,
+ 0.3612,
+ 0.3508,
+ 0.3437,
+ 0.3639,
+ 0.3558,
+ 0.3438,
+ 0.3503,
+ 0.3466,
+ 0.3499,
+ 0.3569,
+ 0.3508,
+ 0.3467,
+ 0.3479,
+ 0.3496,
+ 0.352,
+ 0.3543,
+ 0.3569,
+ 0.3474,
+ 0.344,
+ 0.3485,
+ 0.3519,
+ 0.3507,
+ 0.352,
+ 0.3534,
+ 0.3545,
+ 0.353,
+ 0.3563,
+ 0.3533,
+ 0.355,
+ 0.3552,
+ 0.357,
+ 0.354,
+ 0.3546,
+ 0.3545,
+ 0.3529,
+ 0.3537,
+ 0.3533,
+ 0.3535,
+ 0.3541,
+ 0.3539,
+ 0.3537
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.039823852479457855,
+ 0.9718431234359741
+ ],
+ "perturbation_rho": [
+ -0.031080063432455063,
+ 0.03366325423121452
+ ],
+ "nudging": {
+ "0.001": [
+ -2.9830262064933777e-06,
+ -5.972804501652718e-06
+ ],
+ "0.003": [
+ -8.938834071159363e-06,
+ -1.8277671188116074e-05
+ ],
+ "0.01": [
+ -3.016670234501362e-05,
+ -6.103678606450558e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 5119.443359375,
+ 277281.78125,
+ 221633.09375
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.112029142153915e-05,
+ 1.5214125141937984e-06,
+ 1.2520613381639123e-06
+ ]
+ },
+ "drift": {
+ "embed.weight": 32.21887870916367,
+ "embed.bias": 19.808534592837418,
+ "blocks.0.ln.weight": 1.571417962464522,
+ "blocks.0.w1.weight": 27.02065176792147,
+ "blocks.0.w1.bias": 18.826762362229086,
+ "blocks.0.w2.weight": 62.552517441341244,
+ "blocks.1.ln.weight": 1.2403307752162702,
+ "blocks.1.w1.weight": 19.856236759319962,
+ "blocks.1.w1.bias": 14.207741981198222,
+ "blocks.1.w2.weight": 38.602188965118806,
+ "out_ln.weight": 0.442837113470192,
+ "out_head.weight": 4.411774526619856,
+ "out_head.bias": 11.444358576141303
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 2,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 7
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_dfa_d512_L2_seed7",
+ "methods": [
+ "fa",
+ "dfa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file