summaryrefslogtreecommitdiff
path: root/results/fa_dfa_d512_L2_seed1/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_dfa_d512_L2_seed1/results_cifar10.json')
-rw-r--r--results/fa_dfa_d512_L2_seed1/results_cifar10.json749
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed1/results_cifar10.json b/results/fa_dfa_d512_L2_seed1/results_cifar10.json
new file mode 100644
index 0000000..0dd9e9b
--- /dev/null
+++ b/results/fa_dfa_d512_L2_seed1/results_cifar10.json
@@ -0,0 +1,749 @@
+{
+ "1": {
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.059094401855469,
+ 2.044447731781006,
+ 2.0331237268066404,
+ 2.029790968055725,
+ 2.0203696198272705,
+ 2.019836251373291,
+ 2.0172710887908933,
+ 2.0157542709350587,
+ 2.01279447265625,
+ 2.0095205695343017,
+ 2.0108920065689087,
+ 2.0079552867889405,
+ 2.0044708168792726,
+ 2.0045814642333983,
+ 2.008353828582764,
+ 2.0057097484970092,
+ 2.0044997080993654,
+ 2.008672186203003,
+ 2.007922875289917,
+ 2.005835166091919,
+ 2.0033903245544433,
+ 2.0044442585754396,
+ 2.002520341949463,
+ 2.00441702545166,
+ 2.0058324599456787,
+ 2.004086421432495,
+ 2.0051950196838377,
+ 2.0038982134246828,
+ 2.004509604110718,
+ 2.0052878368377685,
+ 2.002380726890564,
+ 2.004787947921753,
+ 2.0059314285278322,
+ 2.00248601272583,
+ 2.0011240525817873,
+ 2.0024265776062014,
+ 2.000450315246582,
+ 2.003341311035156,
+ 2.0023523516082764,
+ 2.0043818824768067,
+ 2.0009307250213624,
+ 1.9997900833129882,
+ 1.99952888671875,
+ 1.9998678870010376,
+ 2.000314803161621,
+ 2.0005521519470215,
+ 1.9993469972991944,
+ 2.0002477783966066,
+ 1.9992239441680908,
+ 2.000459006500244,
+ 1.999985199661255,
+ 1.9989831493377686,
+ 1.9985046770477295,
+ 1.999920511932373,
+ 2.001435203552246,
+ 1.999222763671875,
+ 1.9992314191436769,
+ 1.9978362256240845,
+ 1.9966827032470704,
+ 1.9963577353286743,
+ 1.9981027877807618,
+ 1.998446220703125,
+ 1.999375821762085,
+ 1.9966239959716796,
+ 1.9978697190856933,
+ 1.9981718766021728,
+ 1.9964544176864625,
+ 1.996339178161621,
+ 1.995297778892517,
+ 1.9981674702453613,
+ 1.9945542547988893,
+ 1.9964004328918457,
+ 1.9957070028686523,
+ 1.9959317153930665,
+ 1.996950538787842,
+ 1.9957062911987304,
+ 1.9937946883392335,
+ 1.9961785815429687,
+ 1.996840117225647,
+ 1.9966120117950439,
+ 1.9950081676483153,
+ 1.9959315377807618,
+ 1.9947433185195922,
+ 1.9953646588897704,
+ 1.9961627129745483,
+ 1.9956305498504638,
+ 1.9933074866104126,
+ 1.9939569332122802,
+ 1.9948224069213867,
+ 1.9938344969940185,
+ 1.9951542666625977,
+ 1.994460453224182,
+ 1.9951913018798828,
+ 1.992417700653076,
+ 1.9943852715682984,
+ 1.9950172023010253,
+ 1.9913645124816894,
+ 1.9934076538467407,
+ 1.993856616821289,
+ 1.9950498567962647
+ ],
+ "train_acc": [
+ 0.24538,
+ 0.2525,
+ 0.24984,
+ 0.25596,
+ 0.25824,
+ 0.26188,
+ 0.26018,
+ 0.26256,
+ 0.26788,
+ 0.26836,
+ 0.26572,
+ 0.26712,
+ 0.26946,
+ 0.2707,
+ 0.26872,
+ 0.26986,
+ 0.26942,
+ 0.26706,
+ 0.2688,
+ 0.26814,
+ 0.2714,
+ 0.26896,
+ 0.26966,
+ 0.27136,
+ 0.26994,
+ 0.27172,
+ 0.27024,
+ 0.2708,
+ 0.27018,
+ 0.27212,
+ 0.27326,
+ 0.2728,
+ 0.2694,
+ 0.27118,
+ 0.27332,
+ 0.2738,
+ 0.27492,
+ 0.27382,
+ 0.27348,
+ 0.27124,
+ 0.27338,
+ 0.27632,
+ 0.27474,
+ 0.27438,
+ 0.27608,
+ 0.27216,
+ 0.27472,
+ 0.27174,
+ 0.2764,
+ 0.27286,
+ 0.27426,
+ 0.27344,
+ 0.27646,
+ 0.27692,
+ 0.27348,
+ 0.27398,
+ 0.2745,
+ 0.27462,
+ 0.27702,
+ 0.2742,
+ 0.27524,
+ 0.27522,
+ 0.2742,
+ 0.27684,
+ 0.27522,
+ 0.2755,
+ 0.2759,
+ 0.27692,
+ 0.27698,
+ 0.27796,
+ 0.27768,
+ 0.27376,
+ 0.27822,
+ 0.2749,
+ 0.27752,
+ 0.2773,
+ 0.27838,
+ 0.27666,
+ 0.27632,
+ 0.27526,
+ 0.27792,
+ 0.27644,
+ 0.2755,
+ 0.27696,
+ 0.27616,
+ 0.27868,
+ 0.27898,
+ 0.27856,
+ 0.27766,
+ 0.27746,
+ 0.27564,
+ 0.27836,
+ 0.27742,
+ 0.27794,
+ 0.27654,
+ 0.277,
+ 0.28076,
+ 0.27934,
+ 0.27814,
+ 0.27694
+ ],
+ "test_acc": [
+ 0.2655,
+ 0.2561,
+ 0.2732,
+ 0.2647,
+ 0.2937,
+ 0.2959,
+ 0.2856,
+ 0.2952,
+ 0.2909,
+ 0.2903,
+ 0.2948,
+ 0.2937,
+ 0.2853,
+ 0.2983,
+ 0.2836,
+ 0.2904,
+ 0.2751,
+ 0.294,
+ 0.2826,
+ 0.2783,
+ 0.3006,
+ 0.2986,
+ 0.2981,
+ 0.2913,
+ 0.27,
+ 0.2959,
+ 0.2941,
+ 0.2893,
+ 0.2816,
+ 0.2762,
+ 0.2842,
+ 0.2888,
+ 0.294,
+ 0.3006,
+ 0.2761,
+ 0.2995,
+ 0.2824,
+ 0.2895,
+ 0.2918,
+ 0.2959,
+ 0.2896,
+ 0.2977,
+ 0.2867,
+ 0.2906,
+ 0.2955,
+ 0.2965,
+ 0.2819,
+ 0.2848,
+ 0.293,
+ 0.2901,
+ 0.2903,
+ 0.2893,
+ 0.2946,
+ 0.286,
+ 0.2811,
+ 0.2948,
+ 0.2884,
+ 0.2963,
+ 0.2914,
+ 0.2919,
+ 0.2882,
+ 0.2923,
+ 0.2964,
+ 0.3036,
+ 0.3028,
+ 0.2942,
+ 0.2974,
+ 0.286,
+ 0.2997,
+ 0.2913,
+ 0.2942,
+ 0.2914,
+ 0.295,
+ 0.2929,
+ 0.2945,
+ 0.2905,
+ 0.2979,
+ 0.3003,
+ 0.2997,
+ 0.295,
+ 0.2937,
+ 0.2884,
+ 0.2946,
+ 0.2959,
+ 0.2977,
+ 0.2996,
+ 0.2999,
+ 0.2952,
+ 0.297,
+ 0.2936,
+ 0.2981,
+ 0.2977,
+ 0.2982,
+ 0.2978,
+ 0.2979,
+ 0.2976,
+ 0.2983,
+ 0.2977,
+ 0.2978,
+ 0.2978
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.41370105743408203,
+ -0.001240116311237216
+ ],
+ "perturbation_rho": [
+ 0.015020761638879776,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -4.163011908531189e-07,
+ 0.0
+ ],
+ "0.003": [
+ -1.1897645890712738e-06,
+ 0.0
+ ],
+ "0.01": [
+ -3.778841346502304e-06,
+ 9.313225746154785e-10
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 56646.390625,
+ 1782275456.0,
+ 3970110464.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.493850104201556e-07,
+ 3.667711412358443e-10,
+ 3.6680619652784685e-10
+ ]
+ },
+ "drift": {
+ "embed.weight": 340.80661711332743,
+ "embed.bias": 276.58178672612297,
+ "blocks.0.ln.weight": 9.889068312709053,
+ "blocks.0.w1.weight": 318.9410688527977,
+ "blocks.0.w1.bias": 284.37318853440576,
+ "blocks.0.w2.weight": 489.2728313372279,
+ "blocks.1.ln.weight": 9.298819559476074,
+ "blocks.1.w1.weight": 366.2278399546544,
+ "blocks.1.w1.bias": 340.3854434800174,
+ "blocks.1.w2.weight": 341.5363762004093,
+ "out_ln.weight": 0.5301057051408113,
+ "out_head.weight": 8.039116173269838,
+ "out_head.bias": 2.5371126762269562
+ }
+ },
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.05515945022583,
+ 1.9500655529785156,
+ 1.9110925933456422,
+ 1.8819315839004516,
+ 1.8608471837615967,
+ 1.8478346523666382,
+ 1.8411366244125367,
+ 1.8377560669326782,
+ 1.8311604034805298,
+ 1.8246206870269774,
+ 1.8166842291641236,
+ 1.8113972366714477,
+ 1.8071093799209594,
+ 1.7970440604400635,
+ 1.7988952663803102,
+ 1.7952887838363647,
+ 1.7926777132415772,
+ 1.790428493423462,
+ 1.7899820502090453,
+ 1.7887613116836547,
+ 1.7811174698257446,
+ 1.781726747894287,
+ 1.782828377418518,
+ 1.7825099970245362,
+ 1.7798745111846923,
+ 1.7748807119369507,
+ 1.769409514427185,
+ 1.7675959386444091,
+ 1.7701947622680665,
+ 1.7674276565551759,
+ 1.7609349981307982,
+ 1.7605391665267944,
+ 1.762060026626587,
+ 1.7580202764129638,
+ 1.7636039975357056,
+ 1.7673666812133788,
+ 1.7655566649627685,
+ 1.7669985010147096,
+ 1.7656920331192016,
+ 1.7639919567108153,
+ 1.7634542723846436,
+ 1.7601457201766968,
+ 1.761037275123596,
+ 1.7602271603775024,
+ 1.7624055517578125,
+ 1.7582754214477538,
+ 1.7596718951416015,
+ 1.7575918433380127,
+ 1.757328048439026,
+ 1.7560129935455322,
+ 1.7593553677749634,
+ 1.75662100856781,
+ 1.7546059392547608,
+ 1.7581290004730226,
+ 1.7570533187103272,
+ 1.7555389776992798,
+ 1.755943459587097,
+ 1.752056611404419,
+ 1.752125501060486,
+ 1.7542531232452392,
+ 1.7525837285614014,
+ 1.7537434762954711,
+ 1.7566586553573609,
+ 1.754645963783264,
+ 1.7561360279083251,
+ 1.7577947814178467,
+ 1.7517323531723021,
+ 1.7506846601104735,
+ 1.7523996893310547,
+ 1.7564484720611573,
+ 1.7542920526885986,
+ 1.7536059958648682,
+ 1.753201146583557,
+ 1.7531446646118165,
+ 1.7524780932617188,
+ 1.7523272793197633,
+ 1.752608459777832,
+ 1.7483984720611572,
+ 1.7505473443984985,
+ 1.750156759109497,
+ 1.7495093181991577,
+ 1.7508859223175048,
+ 1.7515791293716432,
+ 1.7466206330108642,
+ 1.751723793373108,
+ 1.750410927658081,
+ 1.7431821329116821,
+ 1.7460082646942139,
+ 1.7443738849639892,
+ 1.7485774746704101,
+ 1.747268639907837,
+ 1.7440908068847656,
+ 1.7475049467468262,
+ 1.7451262094497682,
+ 1.747353721961975,
+ 1.7474739736557008,
+ 1.7444730795669556,
+ 1.748691442642212,
+ 1.743288662033081,
+ 1.7470912045669555
+ ],
+ "train_acc": [
+ 0.25462,
+ 0.29498,
+ 0.31256,
+ 0.32432,
+ 0.33206,
+ 0.33724,
+ 0.33776,
+ 0.34132,
+ 0.34392,
+ 0.34576,
+ 0.35074,
+ 0.34868,
+ 0.35426,
+ 0.35624,
+ 0.35478,
+ 0.35702,
+ 0.35892,
+ 0.3572,
+ 0.35788,
+ 0.35796,
+ 0.3596,
+ 0.36274,
+ 0.3592,
+ 0.36092,
+ 0.36282,
+ 0.36558,
+ 0.36466,
+ 0.36602,
+ 0.36356,
+ 0.36714,
+ 0.36908,
+ 0.36888,
+ 0.36582,
+ 0.368,
+ 0.365,
+ 0.3677,
+ 0.3674,
+ 0.3658,
+ 0.36706,
+ 0.368,
+ 0.3688,
+ 0.3678,
+ 0.36976,
+ 0.36634,
+ 0.36654,
+ 0.3687,
+ 0.36986,
+ 0.36986,
+ 0.3703,
+ 0.37068,
+ 0.36806,
+ 0.37002,
+ 0.37306,
+ 0.3722,
+ 0.36826,
+ 0.37146,
+ 0.3704,
+ 0.37428,
+ 0.37186,
+ 0.37382,
+ 0.37398,
+ 0.3711,
+ 0.3723,
+ 0.37532,
+ 0.37158,
+ 0.37096,
+ 0.37172,
+ 0.37316,
+ 0.37314,
+ 0.37438,
+ 0.37196,
+ 0.3737,
+ 0.37458,
+ 0.37306,
+ 0.37588,
+ 0.37444,
+ 0.37408,
+ 0.37832,
+ 0.37416,
+ 0.37576,
+ 0.3746,
+ 0.375,
+ 0.37462,
+ 0.37456,
+ 0.37364,
+ 0.37744,
+ 0.37852,
+ 0.37832,
+ 0.3778,
+ 0.37706,
+ 0.37604,
+ 0.37654,
+ 0.37828,
+ 0.37762,
+ 0.37686,
+ 0.377,
+ 0.37886,
+ 0.37662,
+ 0.37522,
+ 0.37652
+ ],
+ "test_acc": [
+ 0.2978,
+ 0.3334,
+ 0.3399,
+ 0.3342,
+ 0.3634,
+ 0.3618,
+ 0.3505,
+ 0.3521,
+ 0.3696,
+ 0.3722,
+ 0.3679,
+ 0.3787,
+ 0.3663,
+ 0.3811,
+ 0.3611,
+ 0.365,
+ 0.3543,
+ 0.3666,
+ 0.3501,
+ 0.36,
+ 0.3572,
+ 0.3504,
+ 0.3467,
+ 0.3598,
+ 0.3353,
+ 0.3474,
+ 0.3382,
+ 0.3432,
+ 0.3617,
+ 0.3397,
+ 0.353,
+ 0.3288,
+ 0.3385,
+ 0.3414,
+ 0.3467,
+ 0.3389,
+ 0.3341,
+ 0.3434,
+ 0.3537,
+ 0.3496,
+ 0.3526,
+ 0.346,
+ 0.3603,
+ 0.3526,
+ 0.3342,
+ 0.346,
+ 0.3392,
+ 0.3277,
+ 0.3535,
+ 0.3419,
+ 0.3396,
+ 0.3404,
+ 0.3433,
+ 0.3468,
+ 0.339,
+ 0.3361,
+ 0.3421,
+ 0.3363,
+ 0.3544,
+ 0.3465,
+ 0.3454,
+ 0.3472,
+ 0.3401,
+ 0.3454,
+ 0.3511,
+ 0.343,
+ 0.3445,
+ 0.3368,
+ 0.3424,
+ 0.3425,
+ 0.3381,
+ 0.3435,
+ 0.3496,
+ 0.346,
+ 0.3411,
+ 0.3408,
+ 0.3512,
+ 0.3469,
+ 0.3473,
+ 0.3419,
+ 0.3554,
+ 0.3449,
+ 0.345,
+ 0.3431,
+ 0.3442,
+ 0.3501,
+ 0.3534,
+ 0.3469,
+ 0.3496,
+ 0.3436,
+ 0.3478,
+ 0.3501,
+ 0.3492,
+ 0.3481,
+ 0.3474,
+ 0.3466,
+ 0.3476,
+ 0.3468,
+ 0.3473,
+ 0.3471
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.007958251982927322,
+ 0.9600946307182312
+ ],
+ "perturbation_rho": [
+ 0.029625363647937775,
+ 0.18801619112491608
+ ],
+ "nudging": {
+ "0.001": [
+ 4.2957253754138947e-07,
+ -8.616363629698753e-06
+ ],
+ "0.003": [
+ 1.2052478268742561e-06,
+ -2.6152702048420906e-05
+ ],
+ "0.01": [
+ 4.0422892197966576e-06,
+ -8.745735976845026e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 6253.97314453125,
+ 339687.71875,
+ 217173.15625
+ ],
+ "bp_grad_norms_per_layer": [
+ 1.8587075828691013e-05,
+ 8.973949547907978e-07,
+ 7.725411705905572e-07
+ ]
+ },
+ "drift": {
+ "embed.weight": 35.41278218973057,
+ "embed.bias": 29.83841191850244,
+ "blocks.0.ln.weight": 1.4875314025636917,
+ "blocks.0.w1.weight": 25.996758962578763,
+ "blocks.0.w1.bias": 15.439034204651744,
+ "blocks.0.w2.weight": 58.48910743468254,
+ "blocks.1.ln.weight": 1.2261067193625912,
+ "blocks.1.w1.weight": 24.34549540914942,
+ "blocks.1.w1.bias": 12.006957572444392,
+ "blocks.1.w2.weight": 29.62795958064609,
+ "out_ln.weight": 0.4822583681094011,
+ "out_head.weight": 3.604309031698496,
+ "out_head.bias": 10.930487632919764
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 2,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 1
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_dfa_d512_L2_seed1",
+ "methods": [
+ "fa",
+ "dfa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file