summaryrefslogtreecommitdiff
path: root/results/fa_dfa_d512_L6_seed2/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_dfa_d512_L6_seed2/results_cifar10.json')
-rw-r--r--results/fa_dfa_d512_L6_seed2/results_cifar10.json837
1 files changed, 837 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L6_seed2/results_cifar10.json b/results/fa_dfa_d512_L6_seed2/results_cifar10.json
new file mode 100644
index 0000000..0d6122d
--- /dev/null
+++ b/results/fa_dfa_d512_L6_seed2/results_cifar10.json
@@ -0,0 +1,837 @@
+{
+ "2": {
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.0704764087677003,
+ 2.049675481185913,
+ 2.0393172933197024,
+ 2.0385254068756105,
+ 2.0333104403305056,
+ 2.037317512435913,
+ 2.035111841583252,
+ 2.033784921951294,
+ 2.0276396758270265,
+ 2.0287634895324707,
+ 2.0255478504943847,
+ 2.0249928087997437,
+ 2.0251559844207763,
+ 2.026155082015991,
+ 2.0227601895141603,
+ 2.0238794365692137,
+ 2.0220592249298095,
+ 2.0211007302474977,
+ 2.0220025036621094,
+ 2.0187504733657837,
+ 2.022589133682251,
+ 2.0209386083221434,
+ 2.022369726409912,
+ 2.019175484046936,
+ 2.0184574550628662,
+ 2.020228290786743,
+ 2.0170737294769285,
+ 2.0200500258636476,
+ 2.0192940770721437,
+ 2.017934571380615,
+ 2.018111932220459,
+ 2.019744345703125,
+ 2.0181864041137696,
+ 2.018692120895386,
+ 2.019279464416504,
+ 2.020759454421997,
+ 2.0175593240356444,
+ 2.0189450312805177,
+ 2.018363641014099,
+ 2.0204193601989746,
+ 2.018774921836853,
+ 2.020020353240967,
+ 2.020256604042053,
+ 2.018686157913208,
+ 2.017777068939209,
+ 2.01642233127594,
+ 2.0193701077270507,
+ 2.0175296588897704,
+ 2.0180459953308105,
+ 2.0163426136016844,
+ 2.0169748413085937,
+ 2.017522889404297,
+ 2.0171759409332277,
+ 2.0182337244415285,
+ 2.0202614056396486,
+ 2.0193526766967773,
+ 2.0176297589874266,
+ 2.0176475778961183,
+ 2.017951414642334,
+ 2.0159765984725952,
+ 2.0174861521911622,
+ 2.0162583628082276,
+ 2.0189596444702147,
+ 2.017551812057495,
+ 2.0174899821472168,
+ 2.017485563354492,
+ 2.0167667126464845,
+ 2.017466169166565,
+ 2.017418462524414,
+ 2.0175614359283447,
+ 2.016368521194458,
+ 2.017146753158569,
+ 2.016855639877319,
+ 2.016222254562378,
+ 2.016020330963135,
+ 2.0157443789672853,
+ 2.014490191497803,
+ 2.0179072814559937,
+ 2.0176085803985595,
+ 2.016617900123596,
+ 2.016193874168396,
+ 2.0163377814483643,
+ 2.017562115097046,
+ 2.017051735992432,
+ 2.015485999984741,
+ 2.0135854721450808,
+ 2.0146356997299195,
+ 2.0149522621154787,
+ 2.0146646865844726,
+ 2.0153391693878175,
+ 2.0160440145874023,
+ 2.0161946767425536,
+ 2.014449896469116,
+ 2.015591969642639,
+ 2.01485006980896,
+ 2.01346685836792,
+ 2.0139751796722414,
+ 2.0144011250305174,
+ 2.014900064163208,
+ 2.016459233779907
+ ],
+ "train_acc": [
+ 0.23802,
+ 0.24392,
+ 0.24906,
+ 0.25122,
+ 0.25396,
+ 0.25104,
+ 0.2552,
+ 0.25244,
+ 0.2577,
+ 0.25632,
+ 0.25834,
+ 0.2557,
+ 0.25944,
+ 0.25876,
+ 0.26044,
+ 0.25964,
+ 0.2593,
+ 0.26036,
+ 0.26106,
+ 0.26136,
+ 0.26018,
+ 0.25898,
+ 0.25858,
+ 0.2613,
+ 0.26334,
+ 0.26364,
+ 0.26186,
+ 0.26224,
+ 0.26166,
+ 0.26282,
+ 0.26364,
+ 0.26358,
+ 0.2645,
+ 0.26294,
+ 0.26592,
+ 0.26282,
+ 0.26398,
+ 0.26414,
+ 0.26538,
+ 0.26506,
+ 0.26578,
+ 0.26148,
+ 0.26312,
+ 0.26586,
+ 0.26478,
+ 0.26574,
+ 0.26416,
+ 0.26488,
+ 0.26366,
+ 0.26614,
+ 0.2656,
+ 0.26508,
+ 0.2675,
+ 0.26694,
+ 0.26532,
+ 0.26614,
+ 0.26596,
+ 0.26538,
+ 0.2652,
+ 0.26606,
+ 0.26698,
+ 0.26806,
+ 0.26674,
+ 0.26714,
+ 0.26704,
+ 0.26768,
+ 0.26714,
+ 0.2651,
+ 0.26544,
+ 0.26656,
+ 0.2676,
+ 0.26678,
+ 0.26898,
+ 0.26788,
+ 0.26736,
+ 0.2677,
+ 0.26732,
+ 0.26766,
+ 0.26812,
+ 0.2675,
+ 0.26916,
+ 0.26876,
+ 0.26754,
+ 0.26748,
+ 0.26802,
+ 0.27004,
+ 0.27052,
+ 0.2671,
+ 0.27224,
+ 0.26654,
+ 0.26818,
+ 0.26902,
+ 0.2691,
+ 0.26962,
+ 0.2702,
+ 0.26948,
+ 0.2712,
+ 0.27026,
+ 0.26876,
+ 0.26952
+ ],
+ "test_acc": [
+ 0.2537,
+ 0.2494,
+ 0.2765,
+ 0.2473,
+ 0.2851,
+ 0.2759,
+ 0.2702,
+ 0.2833,
+ 0.2841,
+ 0.2663,
+ 0.2858,
+ 0.2432,
+ 0.2894,
+ 0.2933,
+ 0.2938,
+ 0.2901,
+ 0.2777,
+ 0.2769,
+ 0.2907,
+ 0.2833,
+ 0.2973,
+ 0.2692,
+ 0.277,
+ 0.2841,
+ 0.2917,
+ 0.2694,
+ 0.2929,
+ 0.2737,
+ 0.2955,
+ 0.2877,
+ 0.2891,
+ 0.302,
+ 0.272,
+ 0.2931,
+ 0.2882,
+ 0.2806,
+ 0.2849,
+ 0.2989,
+ 0.2988,
+ 0.3036,
+ 0.2869,
+ 0.2951,
+ 0.3014,
+ 0.289,
+ 0.2834,
+ 0.2896,
+ 0.2887,
+ 0.2932,
+ 0.2855,
+ 0.2882,
+ 0.2846,
+ 0.3018,
+ 0.2981,
+ 0.3019,
+ 0.2846,
+ 0.2968,
+ 0.2915,
+ 0.2935,
+ 0.2912,
+ 0.2978,
+ 0.2989,
+ 0.2953,
+ 0.2999,
+ 0.292,
+ 0.2923,
+ 0.2856,
+ 0.2956,
+ 0.2993,
+ 0.2906,
+ 0.2931,
+ 0.2925,
+ 0.2948,
+ 0.2968,
+ 0.295,
+ 0.2965,
+ 0.3019,
+ 0.2889,
+ 0.2941,
+ 0.2958,
+ 0.2959,
+ 0.2955,
+ 0.2926,
+ 0.2921,
+ 0.2964,
+ 0.2981,
+ 0.2912,
+ 0.2982,
+ 0.2995,
+ 0.2958,
+ 0.2963,
+ 0.2965,
+ 0.2963,
+ 0.2947,
+ 0.2957,
+ 0.2953,
+ 0.2947,
+ 0.2953,
+ 0.2951,
+ 0.2949,
+ 0.295
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.3428037762641907,
+ -3.763916902244091e-05,
+ -0.0007522967061959207,
+ -0.00019637049990706146,
+ -0.0005234384443610907,
+ 0.00033836261718533933
+ ],
+ "perturbation_rho": [
+ -0.03871288150548935,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -3.3015385270118713e-07,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.003": [
+ -8.167698979377747e-07,
+ 0.0,
+ 0.0,
+ 0.0,
+ 1.862645149230957e-09,
+ 0.0
+ ],
+ "0.01": [
+ -2.7455389499664307e-06,
+ 0.0,
+ 0.0,
+ 1.862645149230957e-09,
+ 1.862645149230957e-09,
+ 0.0
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 53848.7734375,
+ 2442806016.0,
+ 5245538816.0,
+ 6828209664.0,
+ 7018600960.0,
+ 9658986496.0,
+ 9768150016.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.0601439132406085e-07,
+ 2.350288574870518e-10,
+ 2.3180254937749112e-10,
+ 2.322748937633179e-10,
+ 2.3222145040247e-10,
+ 2.3218917066802902e-10,
+ 2.321651759729093e-10
+ ]
+ },
+ "drift": {
+ "embed.weight": 347.726745764923,
+ "embed.bias": 320.686611820448,
+ "blocks.0.ln.weight": 9.997068770929598,
+ "blocks.0.w1.weight": 332.0183119830964,
+ "blocks.0.w1.bias": 361.6276454599223,
+ "blocks.0.w2.weight": 491.26444464340926,
+ "blocks.1.ln.weight": 9.760206175642947,
+ "blocks.1.w1.weight": 399.42793179083463,
+ "blocks.1.w1.bias": 382.1218468905457,
+ "blocks.1.w2.weight": 398.4896403314863,
+ "blocks.2.ln.weight": 9.863790992763134,
+ "blocks.2.w1.weight": 403.4218387582533,
+ "blocks.2.w1.bias": 369.67326277166103,
+ "blocks.2.w2.weight": 388.1030551430935,
+ "blocks.3.ln.weight": 7.7321395772148405,
+ "blocks.3.w1.weight": 284.159080804305,
+ "blocks.3.w1.bias": 261.08860693920894,
+ "blocks.3.w2.weight": 276.021700238577,
+ "blocks.4.ln.weight": 10.766653379169998,
+ "blocks.4.w1.weight": 441.4219333141434,
+ "blocks.4.w1.bias": 408.4716885612093,
+ "blocks.4.w2.weight": 432.48056855561003,
+ "blocks.5.ln.weight": 7.252784916283292,
+ "blocks.5.w1.weight": 280.38847615534195,
+ "blocks.5.w1.bias": 255.99327290804064,
+ "blocks.5.w2.weight": 255.63025547094998,
+ "out_ln.weight": 0.644730004333539,
+ "out_head.weight": 9.313913439210426,
+ "out_head.bias": 0.978185244031994
+ }
+ },
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.0382984645843507,
+ 1.9496157778167724,
+ 1.9119072325897217,
+ 1.8929361431121827,
+ 1.8775380432128905,
+ 1.8741492847442627,
+ 1.8671779189300537,
+ 1.860015816307068,
+ 1.8485039702987671,
+ 1.844084996986389,
+ 1.8363114721679688,
+ 1.8330332998275758,
+ 1.8273526552581787,
+ 1.825867492904663,
+ 1.821722242088318,
+ 1.8222067623519898,
+ 1.8212668908691407,
+ 1.8164310580825807,
+ 1.8167414797592163,
+ 1.8158153560638428,
+ 1.8170397219848633,
+ 1.8139575901031495,
+ 1.814438596458435,
+ 1.807250874671936,
+ 1.806480390663147,
+ 1.805527213973999,
+ 1.7998141473770142,
+ 1.8049808203125,
+ 1.8055741637420655,
+ 1.796914314918518,
+ 1.8009305011749268,
+ 1.797931548538208,
+ 1.7981645835113524,
+ 1.793643822402954,
+ 1.7937120150375365,
+ 1.7967921892929077,
+ 1.7892387997436523,
+ 1.785188671875,
+ 1.786605785293579,
+ 1.787917324485779,
+ 1.7853582260894776,
+ 1.7880721422576904,
+ 1.7864411516571046,
+ 1.7777207873916625,
+ 1.7769269942855834,
+ 1.777174091796875,
+ 1.7795673489761352,
+ 1.773414126586914,
+ 1.7774351581192016,
+ 1.7697969200897217,
+ 1.771698450050354,
+ 1.768428716278076,
+ 1.7676336987304688,
+ 1.765194714126587,
+ 1.7675122838974,
+ 1.7682551845932006,
+ 1.7667323706436158,
+ 1.7661600426864623,
+ 1.7620434980010986,
+ 1.7610514661026,
+ 1.7625030724716186,
+ 1.7606126858520508,
+ 1.760137271118164,
+ 1.7585180844879151,
+ 1.7585363976287842,
+ 1.7592174551010131,
+ 1.755930234375,
+ 1.7548912310791016,
+ 1.7563516518783568,
+ 1.7501784167099,
+ 1.7541064535522461,
+ 1.7512517785263062,
+ 1.7541993662261963,
+ 1.7516761654663087,
+ 1.7516398949813843,
+ 1.749719626121521,
+ 1.7497738579559325,
+ 1.752181930885315,
+ 1.7519074490356445,
+ 1.7518238845443725,
+ 1.7466175811004638,
+ 1.748845227355957,
+ 1.746575064430237,
+ 1.7496823914337158,
+ 1.7468877982330322,
+ 1.7439219277191162,
+ 1.7428745371246337,
+ 1.746016036453247,
+ 1.742904917678833,
+ 1.7454003299713134,
+ 1.7449493420028686,
+ 1.744745844039917,
+ 1.7438948041152955,
+ 1.7453510579681397,
+ 1.7438724200439453,
+ 1.7425698751068115,
+ 1.742772998123169,
+ 1.7421956006622314,
+ 1.7445682699966432,
+ 1.7442712462615966
+ ],
+ "train_acc": [
+ 0.25024,
+ 0.28724,
+ 0.30528,
+ 0.31264,
+ 0.32216,
+ 0.32208,
+ 0.32792,
+ 0.33064,
+ 0.3365,
+ 0.3396,
+ 0.34,
+ 0.34242,
+ 0.34468,
+ 0.34422,
+ 0.34752,
+ 0.34912,
+ 0.34524,
+ 0.34978,
+ 0.34856,
+ 0.3501,
+ 0.34806,
+ 0.35048,
+ 0.35214,
+ 0.35416,
+ 0.35338,
+ 0.35482,
+ 0.35432,
+ 0.35244,
+ 0.35388,
+ 0.35836,
+ 0.35712,
+ 0.3568,
+ 0.3591,
+ 0.36118,
+ 0.36208,
+ 0.35824,
+ 0.36296,
+ 0.3625,
+ 0.3616,
+ 0.3628,
+ 0.36246,
+ 0.36298,
+ 0.3605,
+ 0.36632,
+ 0.36574,
+ 0.36678,
+ 0.36478,
+ 0.3649,
+ 0.3662,
+ 0.36734,
+ 0.3665,
+ 0.36722,
+ 0.36714,
+ 0.3702,
+ 0.36908,
+ 0.37058,
+ 0.36998,
+ 0.36858,
+ 0.37244,
+ 0.37104,
+ 0.3722,
+ 0.37344,
+ 0.3726,
+ 0.37172,
+ 0.3741,
+ 0.37406,
+ 0.3731,
+ 0.37294,
+ 0.37284,
+ 0.37628,
+ 0.37682,
+ 0.37742,
+ 0.37544,
+ 0.37656,
+ 0.37632,
+ 0.37814,
+ 0.37808,
+ 0.37642,
+ 0.37748,
+ 0.37462,
+ 0.37968,
+ 0.37766,
+ 0.37704,
+ 0.37846,
+ 0.37784,
+ 0.379,
+ 0.37904,
+ 0.37854,
+ 0.38202,
+ 0.37828,
+ 0.37712,
+ 0.37962,
+ 0.38004,
+ 0.37898,
+ 0.3783,
+ 0.37898,
+ 0.38082,
+ 0.38006,
+ 0.37922,
+ 0.37846
+ ],
+ "test_acc": [
+ 0.3027,
+ 0.306,
+ 0.3365,
+ 0.3382,
+ 0.3465,
+ 0.3597,
+ 0.3579,
+ 0.3625,
+ 0.3757,
+ 0.3702,
+ 0.3663,
+ 0.3612,
+ 0.374,
+ 0.378,
+ 0.3778,
+ 0.3778,
+ 0.3807,
+ 0.3691,
+ 0.3833,
+ 0.3714,
+ 0.3788,
+ 0.3629,
+ 0.3794,
+ 0.382,
+ 0.3843,
+ 0.3732,
+ 0.3818,
+ 0.373,
+ 0.3819,
+ 0.3776,
+ 0.3882,
+ 0.3926,
+ 0.385,
+ 0.3853,
+ 0.3879,
+ 0.3927,
+ 0.3894,
+ 0.3945,
+ 0.3903,
+ 0.3924,
+ 0.3896,
+ 0.3941,
+ 0.3919,
+ 0.3888,
+ 0.3863,
+ 0.3927,
+ 0.3922,
+ 0.3903,
+ 0.3939,
+ 0.3828,
+ 0.3963,
+ 0.3935,
+ 0.3958,
+ 0.3971,
+ 0.4048,
+ 0.4003,
+ 0.3934,
+ 0.3945,
+ 0.395,
+ 0.3979,
+ 0.3908,
+ 0.3969,
+ 0.4012,
+ 0.3998,
+ 0.3987,
+ 0.3965,
+ 0.4025,
+ 0.3984,
+ 0.4038,
+ 0.3982,
+ 0.4015,
+ 0.4027,
+ 0.3997,
+ 0.4022,
+ 0.4045,
+ 0.4031,
+ 0.4028,
+ 0.4041,
+ 0.3998,
+ 0.4012,
+ 0.3998,
+ 0.3979,
+ 0.4026,
+ 0.401,
+ 0.4006,
+ 0.4048,
+ 0.4018,
+ 0.4009,
+ 0.4025,
+ 0.4024,
+ 0.4009,
+ 0.4036,
+ 0.4025,
+ 0.4022,
+ 0.4026,
+ 0.401,
+ 0.4018,
+ 0.401,
+ 0.4015,
+ 0.4016
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.02052094228565693,
+ 0.07671980559825897,
+ -0.10412630438804626,
+ -0.03588568791747093,
+ -0.07592153549194336,
+ 0.9841817617416382
+ ],
+ "perturbation_rho": [
+ -0.0499441958963871,
+ 0.03510870411992073,
+ 0.012152664363384247,
+ -0.01593763567507267,
+ -0.030490349978208542,
+ 0.01056537963449955
+ ],
+ "nudging": {
+ "0.001": [
+ -1.460895873606205e-06,
+ -1.8533319234848022e-07,
+ 8.102506399154663e-08,
+ 3.9814040064811707e-08,
+ 7.660128176212311e-08,
+ -1.0418007150292397e-06
+ ],
+ "0.003": [
+ -4.51505184173584e-06,
+ -7.73230567574501e-07,
+ 4.012836143374443e-07,
+ 1.9150320440530777e-07,
+ 2.3317988961935043e-07,
+ -3.8853613659739494e-06
+ ],
+ "0.01": [
+ -1.504761166870594e-05,
+ -2.689310349524021e-06,
+ 1.5775440260767937e-06,
+ 6.139744073152542e-07,
+ 9.952345862984657e-07,
+ -1.3828510418534279e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 7937.806640625,
+ 157942.125,
+ 845318.25,
+ 1734418.625,
+ 1908211.875,
+ 2166763.75,
+ 1424229.125
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.3930177121656016e-05,
+ 1.1552400565051357e-06,
+ 6.149262503640784e-07,
+ 6.002979375807627e-07,
+ 6.000758503432735e-07,
+ 5.996230356686283e-07,
+ 5.751607545789739e-07
+ ]
+ },
+ "drift": {
+ "embed.weight": 54.05447299340841,
+ "embed.bias": 16.031038115248215,
+ "blocks.0.ln.weight": 1.2416108593211508,
+ "blocks.0.w1.weight": 17.922589218376636,
+ "blocks.0.w1.bias": 14.956067338203475,
+ "blocks.0.w2.weight": 64.67351730215137,
+ "blocks.1.ln.weight": 1.1286859632363149,
+ "blocks.1.w1.weight": 23.71804846947617,
+ "blocks.1.w1.bias": 17.43068124645083,
+ "blocks.1.w2.weight": 41.38902946126262,
+ "blocks.2.ln.weight": 0.7406672335136909,
+ "blocks.2.w1.weight": 24.88918465627309,
+ "blocks.2.w1.bias": 25.668393301356875,
+ "blocks.2.w2.weight": 26.33124026065157,
+ "blocks.3.ln.weight": 0.5408212886770045,
+ "blocks.3.w1.weight": 19.746562187924944,
+ "blocks.3.w1.bias": 21.605426127504696,
+ "blocks.3.w2.weight": 26.408093498021923,
+ "blocks.4.ln.weight": 0.7373842468395975,
+ "blocks.4.w1.weight": 21.153183487980545,
+ "blocks.4.w1.bias": 21.145538252519305,
+ "blocks.4.w2.weight": 45.59224517841596,
+ "blocks.5.ln.weight": 0.8316077429831186,
+ "blocks.5.w1.weight": 20.11472175424346,
+ "blocks.5.w1.bias": 17.387776840886495,
+ "blocks.5.w2.weight": 81.52952222436008,
+ "out_ln.weight": 0.38061390763416836,
+ "out_head.weight": 7.016437743402715,
+ "out_head.bias": 0.6179754221306049
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 6,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 2
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_dfa_d512_L6_seed2",
+ "methods": [
+ "fa",
+ "dfa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file