summaryrefslogtreecommitdiff
path: root/results/fa_depth_scan_d512_L2/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/fa_depth_scan_d512_L2/results_cifar10.json')
-rw-r--r--results/fa_depth_scan_d512_L2/results_cifar10.json389
1 files changed, 389 insertions, 0 deletions
diff --git a/results/fa_depth_scan_d512_L2/results_cifar10.json b/results/fa_depth_scan_d512_L2/results_cifar10.json
new file mode 100644
index 0000000..0c41380
--- /dev/null
+++ b/results/fa_depth_scan_d512_L2/results_cifar10.json
@@ -0,0 +1,389 @@
+{
+ "42": {
+ "fa": {
+ "log": {
+ "train_loss": [
+ 2.061217526626587,
+ 1.9565438193130493,
+ 1.9224825448608398,
+ 1.9001438703155518,
+ 1.8821109796524047,
+ 1.8704035317230225,
+ 1.857736103477478,
+ 1.844048505897522,
+ 1.8342980657958985,
+ 1.8290129190063475,
+ 1.8224646506118773,
+ 1.8214716808319091,
+ 1.8136491051483155,
+ 1.8157705508041382,
+ 1.8199064575195312,
+ 1.816836177368164,
+ 1.8065774325180053,
+ 1.8125089934921266,
+ 1.8090396573638916,
+ 1.81023629032135,
+ 1.8082425650787353,
+ 1.8127569119644165,
+ 1.808132509727478,
+ 1.8062178915405274,
+ 1.8039376613998412,
+ 1.8006342431259155,
+ 1.797272424888611,
+ 1.795366856956482,
+ 1.795199264755249,
+ 1.796318228149414,
+ 1.7931722381973267,
+ 1.790380922317505,
+ 1.787453678970337,
+ 1.7863555522918702,
+ 1.7848892670059204,
+ 1.782602568359375,
+ 1.7844260739135742,
+ 1.7822325122833251,
+ 1.7821675496673584,
+ 1.7775094485092162,
+ 1.775276083984375,
+ 1.772415744934082,
+ 1.771381389389038,
+ 1.7729799353790283,
+ 1.7665789907073974,
+ 1.7650687371063232,
+ 1.7673343083953856,
+ 1.7628559505844117,
+ 1.7635160286712646,
+ 1.7610479801177978,
+ 1.757714970741272,
+ 1.7587621269989013,
+ 1.75955526802063,
+ 1.7605536008453369,
+ 1.7632213006973267,
+ 1.7597938927459718,
+ 1.764720836868286,
+ 1.7602048022460937,
+ 1.7601288507843018,
+ 1.7592250678253174,
+ 1.763182290611267,
+ 1.7588830117034913,
+ 1.7620349166107179,
+ 1.762400091934204,
+ 1.7608643816375733,
+ 1.7610327990341186,
+ 1.7634911743164063,
+ 1.761160830154419,
+ 1.7584447234344482,
+ 1.758816735496521,
+ 1.7580244549560546,
+ 1.758498070678711,
+ 1.757904008178711,
+ 1.7605663097381592,
+ 1.7611833373260497,
+ 1.7573552610778809,
+ 1.7571686492538452,
+ 1.7577348608016967,
+ 1.7563239881134034,
+ 1.7563734949493408,
+ 1.757859500465393,
+ 1.7567143533325196,
+ 1.7577434346771241,
+ 1.75511939453125,
+ 1.7555543961334228,
+ 1.756235351524353,
+ 1.7555060604095458,
+ 1.7561510982894897,
+ 1.7538081964874268,
+ 1.7542751317977905,
+ 1.7549605862426758,
+ 1.7509819832611084,
+ 1.755103257446289,
+ 1.7511512590789795,
+ 1.7497140390396118,
+ 1.755158496170044,
+ 1.7556276675033569,
+ 1.7520254708862304,
+ 1.7512920989227294,
+ 1.7526899521255492
+ ],
+ "train_acc": [
+ 0.24758,
+ 0.29054,
+ 0.30476,
+ 0.31646,
+ 0.3238,
+ 0.33244,
+ 0.334,
+ 0.33794,
+ 0.34238,
+ 0.34354,
+ 0.3469,
+ 0.34778,
+ 0.34922,
+ 0.34738,
+ 0.34754,
+ 0.3477,
+ 0.3522,
+ 0.35128,
+ 0.3501,
+ 0.34894,
+ 0.3502,
+ 0.34714,
+ 0.35396,
+ 0.35312,
+ 0.35266,
+ 0.35432,
+ 0.35642,
+ 0.35256,
+ 0.35418,
+ 0.35464,
+ 0.35604,
+ 0.35646,
+ 0.35824,
+ 0.35708,
+ 0.35856,
+ 0.35934,
+ 0.35824,
+ 0.35668,
+ 0.36006,
+ 0.36048,
+ 0.36242,
+ 0.3658,
+ 0.36572,
+ 0.36512,
+ 0.36582,
+ 0.36634,
+ 0.36442,
+ 0.36774,
+ 0.3675,
+ 0.36846,
+ 0.36932,
+ 0.36868,
+ 0.3692,
+ 0.36584,
+ 0.36652,
+ 0.3708,
+ 0.36522,
+ 0.36784,
+ 0.36796,
+ 0.37036,
+ 0.36874,
+ 0.37152,
+ 0.37144,
+ 0.37078,
+ 0.36992,
+ 0.37114,
+ 0.3711,
+ 0.37028,
+ 0.37068,
+ 0.37472,
+ 0.3726,
+ 0.372,
+ 0.37436,
+ 0.37286,
+ 0.37184,
+ 0.37572,
+ 0.37322,
+ 0.37538,
+ 0.37558,
+ 0.37514,
+ 0.37416,
+ 0.37244,
+ 0.37488,
+ 0.3776,
+ 0.37426,
+ 0.37688,
+ 0.37648,
+ 0.3746,
+ 0.37672,
+ 0.37686,
+ 0.3762,
+ 0.37536,
+ 0.3752,
+ 0.37636,
+ 0.37886,
+ 0.37486,
+ 0.3733,
+ 0.37878,
+ 0.3779,
+ 0.37676
+ ],
+ "test_acc": [
+ 0.3028,
+ 0.3196,
+ 0.3402,
+ 0.3524,
+ 0.3584,
+ 0.3591,
+ 0.3566,
+ 0.3543,
+ 0.3712,
+ 0.3705,
+ 0.3579,
+ 0.3373,
+ 0.3627,
+ 0.3557,
+ 0.3414,
+ 0.3688,
+ 0.3572,
+ 0.3632,
+ 0.354,
+ 0.3634,
+ 0.362,
+ 0.3549,
+ 0.363,
+ 0.3531,
+ 0.345,
+ 0.3459,
+ 0.3517,
+ 0.3421,
+ 0.3294,
+ 0.3398,
+ 0.3294,
+ 0.3409,
+ 0.3476,
+ 0.3318,
+ 0.3477,
+ 0.3302,
+ 0.3283,
+ 0.3309,
+ 0.3337,
+ 0.3497,
+ 0.3314,
+ 0.3292,
+ 0.3374,
+ 0.3361,
+ 0.3335,
+ 0.3461,
+ 0.3254,
+ 0.3366,
+ 0.3353,
+ 0.3288,
+ 0.3467,
+ 0.3374,
+ 0.3445,
+ 0.3415,
+ 0.3358,
+ 0.3474,
+ 0.3382,
+ 0.333,
+ 0.3356,
+ 0.3376,
+ 0.3356,
+ 0.3418,
+ 0.3358,
+ 0.3446,
+ 0.35,
+ 0.3412,
+ 0.3452,
+ 0.3429,
+ 0.3438,
+ 0.3421,
+ 0.3477,
+ 0.3497,
+ 0.3499,
+ 0.3473,
+ 0.3451,
+ 0.3504,
+ 0.3474,
+ 0.3503,
+ 0.344,
+ 0.3497,
+ 0.3487,
+ 0.3488,
+ 0.3521,
+ 0.3509,
+ 0.3455,
+ 0.3511,
+ 0.3469,
+ 0.3474,
+ 0.353,
+ 0.3472,
+ 0.3472,
+ 0.3501,
+ 0.3493,
+ 0.3492,
+ 0.349,
+ 0.3496,
+ 0.3496,
+ 0.3494,
+ 0.3494,
+ 0.3495
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.03441809490323067,
+ 0.955886721611023
+ ],
+ "perturbation_rho": [
+ 0.04754525423049927,
+ 0.05055658146739006
+ ],
+ "nudging": {
+ "0.001": [
+ -5.270587280392647e-06,
+ -7.06920400261879e-06
+ ],
+ "0.003": [
+ -1.57852191478014e-05,
+ -2.1289335563778877e-05
+ ],
+ "0.01": [
+ -5.261087790131569e-05,
+ -7.100868970155716e-05
+ ]
+ },
+ "hidden_norms_per_layer": [
+ 4686.95556640625,
+ 94784.5546875,
+ 138362.359375
+ ],
+ "bp_grad_norms_per_layer": [
+ 1.9998093193862587e-05,
+ 1.4634815670433454e-06,
+ 1.188113401440205e-06
+ ]
+ },
+ "drift": {
+ "embed.weight": 28.586715545463985,
+ "embed.bias": 19.716378864552336,
+ "blocks.0.ln.weight": 1.4738119287890208,
+ "blocks.0.w1.weight": 26.045392429453724,
+ "blocks.0.w1.bias": 15.939058582542359,
+ "blocks.0.w2.weight": 59.12906119267325,
+ "blocks.1.ln.weight": 1.2124303196678357,
+ "blocks.1.w1.weight": 16.696964117465345,
+ "blocks.1.w1.bias": 8.535990814749171,
+ "blocks.1.w2.weight": 37.85731940298285,
+ "out_ln.weight": 0.5125606883018807,
+ "out_head.weight": 3.721893823331011,
+ "out_head.bias": 11.592811594248388
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 2,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 42
+ ],
+ "gpu": 0,
+ "output_dir": "results/fa_depth_scan_d512_L2",
+ "methods": [
+ "fa"
+ ],
+ "random_targets": false,
+ "penalty_lam": 0.0,
+ "num_classes": 10
+ }
+} \ No newline at end of file