summaryrefslogtreecommitdiff
path: root/results/fa_depth_scan_d512_L6/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_depth_scan_d512_L6/results_cifar10.json')
-rw-r--r--results/fa_depth_scan_d512_L6/results_cifar10.json433
1 files changed, 433 insertions, 0 deletions
diff --git a/results/fa_depth_scan_d512_L6/results_cifar10.json b/results/fa_depth_scan_d512_L6/results_cifar10.json
new file mode 100644
index 0000000..f92f310
--- /dev/null
+++ b/results/fa_depth_scan_d512_L6/results_cifar10.json
@@ -0,0 +1,433 @@
+{
+ "42": {
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.0374581846618653,
+ 1.9505271494293213,
+ 1.9189605682373048,
+ 1.8992357767105104,
+ 1.8916226636123656,
+ 1.8799470928955078,
+ 1.8715093560409546,
+ 1.8660212090301513,
+ 1.8614284765625,
+ 1.8615510483169555,
+ 1.858706633758545,
+ 1.8505436419296264,
+ 1.8469465209197997,
+ 1.84686426486969,
+ 1.8409993788909913,
+ 1.8422894380950927,
+ 1.8362944522094726,
+ 1.838251561012268,
+ 1.8342618326568603,
+ 1.8288902439117432,
+ 1.8288569342803955,
+ 1.8237011749649048,
+ 1.8190487328338623,
+ 1.8216550624847412,
+ 1.818442062072754,
+ 1.8108094896697997,
+ 1.8102704141998291,
+ 1.8097241515350342,
+ 1.8078967553710938,
+ 1.799188058128357,
+ 1.8009985346221924,
+ 1.8004494039535524,
+ 1.79110828830719,
+ 1.7962453186035157,
+ 1.7955271081924438,
+ 1.7904337732696534,
+ 1.788247091140747,
+ 1.7867638687133789,
+ 1.787053722076416,
+ 1.7837253421020507,
+ 1.7821894748687743,
+ 1.7816637888336182,
+ 1.7749454086685181,
+ 1.7757588800811768,
+ 1.7753548749542236,
+ 1.7709813816070556,
+ 1.7743957537078858,
+ 1.7711823197174072,
+ 1.7686557120132447,
+ 1.7698634561157227,
+ 1.76816160987854,
+ 1.7640094296646118,
+ 1.7590285652923583,
+ 1.759483937072754,
+ 1.7608595893096923,
+ 1.759725392189026,
+ 1.7576867937850953,
+ 1.7575671384429932,
+ 1.7513107781600952,
+ 1.7550161592102052,
+ 1.752431219062805,
+ 1.7487841637802124,
+ 1.7479721618652344,
+ 1.7504890463638305,
+ 1.7505805645751953,
+ 1.7466501081085206,
+ 1.7456124398422241,
+ 1.7472877283096313,
+ 1.740817502784729,
+ 1.7439257540893556,
+ 1.7465672635650635,
+ 1.744754091758728,
+ 1.7406636810684204,
+ 1.741213535194397,
+ 1.7423687073516845,
+ 1.742182956199646,
+ 1.742147672958374,
+ 1.7392435836029052,
+ 1.7430149713516236,
+ 1.7413112850952148,
+ 1.7365029236602783,
+ 1.739822388305664,
+ 1.7374979788208007,
+ 1.7375597472763062,
+ 1.7379079512786866,
+ 1.735270802078247,
+ 1.7385935315322876,
+ 1.7365304137420654,
+ 1.7351179248428346,
+ 1.7382376040649414,
+ 1.734423624343872,
+ 1.7308770125579833,
+ 1.7355197325897216,
+ 1.7343845403671265,
+ 1.734937107887268,
+ 1.7350866909408569,
+ 1.735432066116333,
+ 1.734759259376526,
+ 1.733669355697632,
+ 1.73626565574646
+ ],
+ "train_acc": [
+ 0.24744,
+ 0.28938,
+ 0.3027,
+ 0.31002,
+ 0.31422,
+ 0.32022,
+ 0.32548,
+ 0.32622,
+ 0.33078,
+ 0.32936,
+ 0.33574,
+ 0.33636,
+ 0.33724,
+ 0.33784,
+ 0.34,
+ 0.3413,
+ 0.34206,
+ 0.33976,
+ 0.3412,
+ 0.34588,
+ 0.34544,
+ 0.34566,
+ 0.34976,
+ 0.34872,
+ 0.35166,
+ 0.35328,
+ 0.3528,
+ 0.35174,
+ 0.35398,
+ 0.35788,
+ 0.35598,
+ 0.35664,
+ 0.35946,
+ 0.3579,
+ 0.35866,
+ 0.35922,
+ 0.36176,
+ 0.36192,
+ 0.36018,
+ 0.36312,
+ 0.36604,
+ 0.36232,
+ 0.36722,
+ 0.36558,
+ 0.36774,
+ 0.36944,
+ 0.367,
+ 0.3692,
+ 0.36964,
+ 0.37104,
+ 0.37188,
+ 0.37134,
+ 0.37254,
+ 0.37084,
+ 0.37208,
+ 0.3718,
+ 0.37112,
+ 0.3728,
+ 0.37378,
+ 0.37414,
+ 0.373,
+ 0.3766,
+ 0.37534,
+ 0.37602,
+ 0.37528,
+ 0.37748,
+ 0.37684,
+ 0.37644,
+ 0.3761,
+ 0.37702,
+ 0.37658,
+ 0.3781,
+ 0.37686,
+ 0.38036,
+ 0.3784,
+ 0.37902,
+ 0.3791,
+ 0.37944,
+ 0.37872,
+ 0.37962,
+ 0.3794,
+ 0.37758,
+ 0.37992,
+ 0.37976,
+ 0.38084,
+ 0.37792,
+ 0.37966,
+ 0.3806,
+ 0.38122,
+ 0.37914,
+ 0.38144,
+ 0.3834,
+ 0.38042,
+ 0.3804,
+ 0.38228,
+ 0.38292,
+ 0.38086,
+ 0.38258,
+ 0.38086,
+ 0.37848
+ ],
+ "test_acc": [
+ 0.2938,
+ 0.3207,
+ 0.3406,
+ 0.3392,
+ 0.3402,
+ 0.349,
+ 0.3619,
+ 0.3561,
+ 0.3742,
+ 0.3541,
+ 0.3632,
+ 0.3742,
+ 0.3679,
+ 0.3696,
+ 0.3734,
+ 0.3754,
+ 0.3854,
+ 0.3709,
+ 0.3747,
+ 0.3711,
+ 0.3773,
+ 0.3787,
+ 0.384,
+ 0.3688,
+ 0.386,
+ 0.3897,
+ 0.383,
+ 0.3852,
+ 0.3876,
+ 0.3857,
+ 0.3878,
+ 0.3886,
+ 0.3873,
+ 0.3929,
+ 0.3862,
+ 0.3864,
+ 0.3871,
+ 0.3947,
+ 0.3901,
+ 0.3942,
+ 0.3854,
+ 0.3841,
+ 0.3892,
+ 0.3876,
+ 0.3965,
+ 0.3924,
+ 0.382,
+ 0.3953,
+ 0.3896,
+ 0.3921,
+ 0.3975,
+ 0.3964,
+ 0.3916,
+ 0.3991,
+ 0.3928,
+ 0.4014,
+ 0.3993,
+ 0.4035,
+ 0.3844,
+ 0.3975,
+ 0.4034,
+ 0.4017,
+ 0.3952,
+ 0.3992,
+ 0.4025,
+ 0.4019,
+ 0.3993,
+ 0.3959,
+ 0.3993,
+ 0.4058,
+ 0.3945,
+ 0.4016,
+ 0.4055,
+ 0.4015,
+ 0.4036,
+ 0.4034,
+ 0.3976,
+ 0.4013,
+ 0.4024,
+ 0.4014,
+ 0.3967,
+ 0.398,
+ 0.3947,
+ 0.4056,
+ 0.4012,
+ 0.4001,
+ 0.402,
+ 0.4004,
+ 0.4031,
+ 0.4008,
+ 0.4025,
+ 0.402,
+ 0.4018,
+ 0.4026,
+ 0.4007,
+ 0.4012,
+ 0.4015,
+ 0.4021,
+ 0.4015,
+ 0.4014
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.018813904374837875,
+ 0.08222152292728424,
+ -0.07224605977535248,
+ -0.09462258964776993,
+ -0.09898842871189117,
+ 0.9958882927894592
+ ],
+ "perturbation_rho": [
+ -0.017015788704156876,
+ -0.0317268893122673,
+ -0.004754193127155304,
+ -0.006329755764454603,
+ 0.03243139386177063,
+ -0.012378348037600517
+ ],
+ "nudging": {
+ "0.001": [
+ -1.5720142982900143e-06,
+ -4.273606464266777e-07,
+ 7.217749953269958e-08,
+ 1.2828968465328217e-07,
+ 1.2386590242385864e-07,
+ -1.2737000361084938e-06
+ ],
+ "0.003": [
+ -4.96965367347002e-06,
+ -1.4296965673565865e-06,
+ 4.01865690946579e-07,
+ 4.814937710762024e-07,
+ 5.081528797745705e-07,
+ -4.469649866223335e-06
+ ],
+ "0.01": [
+ -1.6447564121335745e-05,
+ -4.997651558369398e-06,
+ 1.1826632544398308e-06,
+ 1.6157864592969418e-06,
+ 1.566135324537754e-06,
+ -1.586077269166708e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 7316.48291015625,
+ 78755.234375,
+ 576686.625,
+ 1329546.125,
+ 1568668.375,
+ 1854290.875,
+ 1069435.5
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.8450938771129586e-05,
+ 1.794567538127012e-06,
+ 6.647851478192024e-07,
+ 6.471778988270671e-07,
+ 6.503790359602135e-07,
+ 6.49630294446979e-07,
+ 6.414796303033654e-07
+ ]
+ },
+ "drift": {
+ "embed.weight": 48.85389529931473,
+ "embed.bias": 13.565561887190782,
+ "blocks.0.ln.weight": 1.0624637379045918,
+ "blocks.0.w1.weight": 16.554310656593483,
+ "blocks.0.w1.bias": 11.372855905617644,
+ "blocks.0.w2.weight": 53.87251555976206,
+ "blocks.1.ln.weight": 1.0837239573564923,
+ "blocks.1.w1.weight": 22.586400420670774,
+ "blocks.1.w1.bias": 15.377758862989662,
+ "blocks.1.w2.weight": 35.85773072344426,
+ "blocks.2.ln.weight": 0.9078778614654982,
+ "blocks.2.w1.weight": 23.522098095099405,
+ "blocks.2.w1.bias": 22.904554985601767,
+ "blocks.2.w2.weight": 42.07479881121452,
+ "blocks.3.ln.weight": 0.6724399561234441,
+ "blocks.3.w1.weight": 20.752863459155623,
+ "blocks.3.w1.bias": 20.37186903428861,
+ "blocks.3.w2.weight": 36.191664332701706,
+ "blocks.4.ln.weight": 0.6795979662627959,
+ "blocks.4.w1.weight": 20.607291873742884,
+ "blocks.4.w1.bias": 20.91900548314815,
+ "blocks.4.w2.weight": 42.61545291740059,
+ "blocks.5.ln.weight": 0.6835153473115325,
+ "blocks.5.w1.weight": 20.653168018914645,
+ "blocks.5.w1.bias": 21.158310771641304,
+ "blocks.5.w2.weight": 45.94200541763277,
+ "out_ln.weight": 0.34596348666722354,
+ "out_head.weight": 6.343616372534138,
+ "out_head.bias": 0.7709641239019656
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 6,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 42
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_depth_scan_d512_L6",
+ "methods": [
+ "fa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file