summaryrefslogtreecommitdiff
path: root/results/fa_depth_scan_d512_L12/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_depth_scan_d512_L12/results_cifar10.json')
-rw-r--r--results/fa_depth_scan_d512_L12/results_cifar10.json499
1 files changed, 499 insertions, 0 deletions
diff --git a/results/fa_depth_scan_d512_L12/results_cifar10.json b/results/fa_depth_scan_d512_L12/results_cifar10.json
new file mode 100644
index 0000000..15a5792
--- /dev/null
+++ b/results/fa_depth_scan_d512_L12/results_cifar10.json
@@ -0,0 +1,499 @@
+{
+ "42": {
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.0427230606079103,
+ 1.9547925742340089,
+ 1.9269662255096436,
+ 1.9024112060546876,
+ 1.88389292137146,
+ 1.874641305809021,
+ 1.8671076870727539,
+ 1.8585125997543335,
+ 1.8507517318725586,
+ 1.8509845052719116,
+ 1.8455515924835204,
+ 1.8402700800323486,
+ 1.8322524318695068,
+ 1.8287768964385986,
+ 1.824175419845581,
+ 1.8240570126342774,
+ 1.817736747970581,
+ 1.8165113877105712,
+ 1.8092418829345702,
+ 1.8068542711639404,
+ 1.8066692431640625,
+ 1.8037006209945678,
+ 1.7959260940551758,
+ 1.797553392868042,
+ 1.7958658642196654,
+ 1.7940396698379517,
+ 1.7932731056976319,
+ 1.7874454331207275,
+ 1.7880735418319702,
+ 1.7836660583496093,
+ 1.7832960818862915,
+ 1.7804118716812134,
+ 1.7788523398208618,
+ 1.772011728515625,
+ 1.7708375668716432,
+ 1.7682569339370728,
+ 1.7717147860336304,
+ 1.7703663568115235,
+ 1.7637487329864503,
+ 1.7676782482910156,
+ 1.7649735053253175,
+ 1.7634011583709717,
+ 1.7645813860702515,
+ 1.7605182119369507,
+ 1.7599670697021483,
+ 1.7621903922271729,
+ 1.756671106300354,
+ 1.7577124716949464,
+ 1.7564089126205444,
+ 1.7521357986450194,
+ 1.7525928847885133,
+ 1.7497260301971436,
+ 1.7528332720184325,
+ 1.7475884844207763,
+ 1.7469696446990968,
+ 1.7445055263519287,
+ 1.752090754776001,
+ 1.7456406805038451,
+ 1.747734097251892,
+ 1.7441029932403564,
+ 1.743490291824341,
+ 1.7414577841949463,
+ 1.742126556777954,
+ 1.7391094409942627,
+ 1.7401588076019288,
+ 1.7370625415420533,
+ 1.7388630017471314,
+ 1.7353392750930785,
+ 1.736816965751648,
+ 1.7355695288085937,
+ 1.73539924369812,
+ 1.7323005257797242,
+ 1.7321935805511475,
+ 1.7312652449798585,
+ 1.7298928540420533,
+ 1.73121183719635,
+ 1.7288608194351196,
+ 1.7294834777069092,
+ 1.726299252166748,
+ 1.73074989528656,
+ 1.7293904189682008,
+ 1.7276834594345092,
+ 1.7300372393035888,
+ 1.731684062461853,
+ 1.7275019702529908,
+ 1.729561651916504,
+ 1.7284230736923218,
+ 1.7257295697021484,
+ 1.7226565048217772,
+ 1.726801979408264,
+ 1.7250631372833252,
+ 1.7279036038970947,
+ 1.726708238143921,
+ 1.7242388882064819,
+ 1.7248469045257568,
+ 1.7260398196411133,
+ 1.721121542892456,
+ 1.7220706603240967,
+ 1.7268135174942016,
+ 1.729515742111206
+ ],
+ "train_acc": [
+ 0.24062,
+ 0.28346,
+ 0.2951,
+ 0.30692,
+ 0.31778,
+ 0.3211,
+ 0.32388,
+ 0.32854,
+ 0.33456,
+ 0.33332,
+ 0.33668,
+ 0.33984,
+ 0.34108,
+ 0.34376,
+ 0.346,
+ 0.34636,
+ 0.35004,
+ 0.34922,
+ 0.35104,
+ 0.35196,
+ 0.35292,
+ 0.35532,
+ 0.3572,
+ 0.35614,
+ 0.3578,
+ 0.35934,
+ 0.35694,
+ 0.35918,
+ 0.36018,
+ 0.35928,
+ 0.3622,
+ 0.362,
+ 0.36236,
+ 0.36548,
+ 0.36778,
+ 0.36536,
+ 0.36884,
+ 0.367,
+ 0.36852,
+ 0.36842,
+ 0.36944,
+ 0.36784,
+ 0.3697,
+ 0.37156,
+ 0.37064,
+ 0.3725,
+ 0.37072,
+ 0.37062,
+ 0.37082,
+ 0.37298,
+ 0.37268,
+ 0.37554,
+ 0.3732,
+ 0.3752,
+ 0.37724,
+ 0.37652,
+ 0.37506,
+ 0.37708,
+ 0.37712,
+ 0.37668,
+ 0.37814,
+ 0.37944,
+ 0.37878,
+ 0.37886,
+ 0.38042,
+ 0.3778,
+ 0.38022,
+ 0.37988,
+ 0.38096,
+ 0.3807,
+ 0.3811,
+ 0.38084,
+ 0.37994,
+ 0.37914,
+ 0.38104,
+ 0.38152,
+ 0.38376,
+ 0.38158,
+ 0.38472,
+ 0.38244,
+ 0.38066,
+ 0.38392,
+ 0.3839,
+ 0.38222,
+ 0.38382,
+ 0.38384,
+ 0.38472,
+ 0.385,
+ 0.38792,
+ 0.3839,
+ 0.38516,
+ 0.3858,
+ 0.38262,
+ 0.38758,
+ 0.38396,
+ 0.38268,
+ 0.38628,
+ 0.38618,
+ 0.3846,
+ 0.38336
+ ],
+ "test_acc": [
+ 0.2963,
+ 0.3132,
+ 0.3406,
+ 0.3377,
+ 0.3353,
+ 0.3407,
+ 0.3367,
+ 0.3657,
+ 0.3618,
+ 0.3712,
+ 0.3519,
+ 0.3722,
+ 0.371,
+ 0.379,
+ 0.3666,
+ 0.372,
+ 0.3674,
+ 0.3754,
+ 0.3733,
+ 0.3747,
+ 0.3712,
+ 0.3772,
+ 0.3792,
+ 0.3804,
+ 0.3742,
+ 0.3852,
+ 0.3864,
+ 0.3907,
+ 0.3861,
+ 0.3827,
+ 0.3852,
+ 0.3833,
+ 0.3885,
+ 0.3865,
+ 0.3933,
+ 0.391,
+ 0.3837,
+ 0.3915,
+ 0.4,
+ 0.4088,
+ 0.3956,
+ 0.3878,
+ 0.407,
+ 0.3928,
+ 0.3983,
+ 0.4042,
+ 0.4064,
+ 0.4019,
+ 0.3975,
+ 0.3905,
+ 0.399,
+ 0.3953,
+ 0.3981,
+ 0.3986,
+ 0.399,
+ 0.3963,
+ 0.4013,
+ 0.3988,
+ 0.401,
+ 0.4042,
+ 0.3978,
+ 0.399,
+ 0.4035,
+ 0.4022,
+ 0.4052,
+ 0.4033,
+ 0.4035,
+ 0.4041,
+ 0.4026,
+ 0.4046,
+ 0.4012,
+ 0.3996,
+ 0.4052,
+ 0.4034,
+ 0.3962,
+ 0.4036,
+ 0.3996,
+ 0.4008,
+ 0.4053,
+ 0.4037,
+ 0.4033,
+ 0.4058,
+ 0.408,
+ 0.4066,
+ 0.4017,
+ 0.4038,
+ 0.4015,
+ 0.4035,
+ 0.4052,
+ 0.4014,
+ 0.4046,
+ 0.4027,
+ 0.4046,
+ 0.4036,
+ 0.4035,
+ 0.4042,
+ 0.4039,
+ 0.4033,
+ 0.4034,
+ 0.4035
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.04570477455854416,
+ 0.10783404111862183,
+ -0.03488321602344513,
+ -0.0594203844666481,
+ -0.04577865079045296,
+ -0.024857502430677414,
+ -0.03406952694058418,
+ 0.030555542558431625,
+ -0.00125521095469594,
+ 0.010614164173603058,
+ 0.05838795006275177,
+ 0.9949829578399658
+ ],
+ "perturbation_rho": [
+ -0.010346438735723495,
+ 0.04423713684082031,
+ 0.01146540604531765,
+ 0.03663264587521553,
+ -0.011911284178495407,
+ 0.0016591008752584457,
+ -0.02494950033724308,
+ 0.02218942530453205,
+ 0.0039163315668702126,
+ 0.07129630446434021,
+ 0.00445366557687521,
+ -0.01873880997300148
+ ],
+ "nudging": {
+ "0.001": [
+ -2.829881850630045e-06,
+ -3.539607860147953e-07,
+ 7.35744833946228e-08,
+ 8.218921720981598e-08,
+ 4.21423465013504e-08,
+ 2.7241185307502747e-08,
+ 7.008202373981476e-08,
+ -3.632158041000366e-08,
+ -3.958120942115784e-09,
+ -3.073364496231079e-08,
+ -9.918585419654846e-08,
+ -1.0794028639793396e-06
+ ],
+ "0.003": [
+ -8.66112532094121e-06,
+ -9.669456630945206e-07,
+ 1.387670636177063e-07,
+ 2.7869828045368195e-07,
+ 1.7974525690078735e-07,
+ 1.0058283805847168e-07,
+ 1.448206603527069e-07,
+ -2.1746382117271423e-07,
+ -1.0011717677116394e-08,
+ -1.1711381375789642e-07,
+ -2.377200871706009e-07,
+ -3.898283466696739e-06
+ ],
+ "0.01": [
+ -2.8825539629906416e-05,
+ -3.2445532269775867e-06,
+ 4.411558620631695e-07,
+ 9.136274456977844e-07,
+ 6.3673360273242e-07,
+ 3.696768544614315e-07,
+ 4.895846359431744e-07,
+ -5.699694156646729e-07,
+ -7.869675755500793e-08,
+ -1.8370337784290314e-07,
+ -8.582137525081635e-07,
+ -1.4071993064135313e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 7405.54296875,
+ 126799.640625,
+ 722124.125,
+ 1197351.125,
+ 1311770.625,
+ 1445317.875,
+ 1575290.0,
+ 1646774.0,
+ 1672649.625,
+ 1692752.625,
+ 1726090.75,
+ 1747446.5,
+ 1108917.0
+ ],
+ "bp_grad_norms_per_layer": [
+ 2.2136026018415578e-05,
+ 1.0887044936680468e-06,
+ 6.514224537568225e-07,
+ 6.450830483117898e-07,
+ 6.397550009751285e-07,
+ 6.399715175575693e-07,
+ 6.393033231688605e-07,
+ 6.382227297763166e-07,
+ 6.320739203147241e-07,
+ 6.241282335395226e-07,
+ 6.161063197396288e-07,
+ 6.117401767369302e-07,
+ 5.839314667355211e-07
+ ]
+ },
+ "drift": {
+ "embed.weight": 52.2471866434948,
+ "embed.bias": 18.97250327390356,
+ "blocks.0.ln.weight": 1.2566883045780834,
+ "blocks.0.w1.weight": 17.12006786604635,
+ "blocks.0.w1.bias": 14.342858083073688,
+ "blocks.0.w2.weight": 63.004850525998116,
+ "blocks.1.ln.weight": 1.0284467630081824,
+ "blocks.1.w1.weight": 21.225831949490352,
+ "blocks.1.w1.bias": 18.554260026881323,
+ "blocks.1.w2.weight": 42.67940842745791,
+ "blocks.2.ln.weight": 0.5431388174757359,
+ "blocks.2.w1.weight": 20.036899880398536,
+ "blocks.2.w1.bias": 21.66446091790098,
+ "blocks.2.w2.weight": 26.571695423395656,
+ "blocks.3.ln.weight": 0.4791053623183397,
+ "blocks.3.w1.weight": 17.857825652507895,
+ "blocks.3.w1.bias": 19.196407269205075,
+ "blocks.3.w2.weight": 24.453272281036483,
+ "blocks.4.ln.weight": 0.40179147711472446,
+ "blocks.4.w1.weight": 16.142007729189494,
+ "blocks.4.w1.bias": 18.38189338630125,
+ "blocks.4.w2.weight": 22.251118320035413,
+ "blocks.5.ln.weight": 0.3999388280630244,
+ "blocks.5.w1.weight": 16.08867610628456,
+ "blocks.5.w1.bias": 18.228301269113516,
+ "blocks.5.w2.weight": 22.282579138688718,
+ "blocks.6.ln.weight": 0.5139340433841122,
+ "blocks.6.w1.weight": 16.498928955337856,
+ "blocks.6.w1.bias": 17.341930385247757,
+ "blocks.6.w2.weight": 44.47264444577482,
+ "blocks.7.ln.weight": 0.5190564871460961,
+ "blocks.7.w1.weight": 15.921519106035,
+ "blocks.7.w1.bias": 13.554678640598476,
+ "blocks.7.w2.weight": 55.375944465972985,
+ "blocks.8.ln.weight": 0.5783217006624557,
+ "blocks.8.w1.weight": 15.308415657722076,
+ "blocks.8.w1.bias": 12.359797369765815,
+ "blocks.8.w2.weight": 60.55354023990087,
+ "blocks.9.ln.weight": 0.5265177438656736,
+ "blocks.9.w1.weight": 14.699539264919315,
+ "blocks.9.w1.bias": 12.199485985244364,
+ "blocks.9.w2.weight": 53.496852348666465,
+ "blocks.10.ln.weight": 0.5541756864436261,
+ "blocks.10.w1.weight": 14.732920668123558,
+ "blocks.10.w1.bias": 10.868519121164393,
+ "blocks.10.w2.weight": 61.24451839129346,
+ "blocks.11.ln.weight": 0.6274670342096703,
+ "blocks.11.w1.weight": 18.31665424290367,
+ "blocks.11.w1.bias": 18.6607903814988,
+ "blocks.11.w2.weight": 57.15975509546593,
+ "out_ln.weight": 0.317930900746446,
+ "out_head.weight": 6.3670164706750825,
+ "out_head.bias": 0.940628348025828
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 12,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 42
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_depth_scan_d512",
+ "methods": [
+ "fa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file