summaryrefslogtreecommitdiff
path: root/results/smoke_test/results_fashionmnist.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/smoke_test/results_fashionmnist.json')
-rw-r--r--results/smoke_test/results_fashionmnist.json511
1 files changed, 511 insertions, 0 deletions
diff --git a/results/smoke_test/results_fashionmnist.json b/results/smoke_test/results_fashionmnist.json
new file mode 100644
index 0000000..8fd82c0
--- /dev/null
+++ b/results/smoke_test/results_fashionmnist.json
@@ -0,0 +1,511 @@
+{
+ "42": {
+ "bp": {
+ "log": {
+ "train_loss": [
+ 0.7028828698158264,
+ 0.5331447437604269,
+ 0.4640675885995229,
+ 0.416527880080541,
+ 0.3784152720451355
+ ],
+ "train_acc": [
+ 0.73755,
+ 0.8002166666666667,
+ 0.8256666666666667,
+ 0.8436666666666667,
+ 0.8591833333333333
+ ],
+ "test_acc": [
+ 0.7939,
+ 0.8157,
+ 0.8379,
+ 0.8606,
+ 0.8658
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 1.0,
+ 1.0,
+ 1.0,
+ 1.0,
+ 1.0,
+ 1.0,
+ 1.0,
+ 1.0
+ ],
+ "perturbation_rho": [
+ 0.9998708367347717,
+ 0.9998407959938049,
+ 0.9997469186782837,
+ 0.9998122453689575,
+ 0.9997262358665466,
+ 0.9996491074562073,
+ 0.9996585845947266,
+ 0.9995328783988953
+ ],
+ "nudging": {
+ "0.001": [
+ -0.0019641336984932423,
+ -0.00174636859446764,
+ -0.00154352025128901,
+ -0.0013810225063934922,
+ -0.0012467722408473492,
+ -0.0011190228397026658,
+ -0.0010304137831553817,
+ -0.0009783159475773573
+ ],
+ "0.003": [
+ -0.005858615506440401,
+ -0.005213461350649595,
+ -0.004612031392753124,
+ -0.004128905013203621,
+ -0.0037290011532604694,
+ -0.003348270896822214,
+ -0.003083921270444989,
+ -0.002928499598056078
+ ],
+ "0.01": [
+ -0.019138235598802567,
+ -0.017080917954444885,
+ -0.015158241614699364,
+ -0.013598069548606873,
+ -0.01229821052402258,
+ -0.01105712354183197,
+ -0.010194781236350536,
+ -0.009686501696705818
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 1.1395236897587921,
+ "embed.bias": 0.6760135861021652,
+ "blocks.0.ln.weight": 0.0347786583006382,
+ "blocks.0.w1.weight": 0.8267150385727446,
+ "blocks.0.w1.bias": 0.7665003752239994,
+ "blocks.0.w2.weight": 2.522163826858937,
+ "blocks.1.ln.weight": 0.0373835414648056,
+ "blocks.1.w1.weight": 0.8094006579319112,
+ "blocks.1.w1.bias": 0.7074648417912711,
+ "blocks.1.w2.weight": 2.427488314293417,
+ "blocks.2.ln.weight": 0.0362338162958622,
+ "blocks.2.w1.weight": 0.7981608599321399,
+ "blocks.2.w1.bias": 0.6653993627306621,
+ "blocks.2.w2.weight": 2.3264717248101827,
+ "blocks.3.ln.weight": 0.03489774093031883,
+ "blocks.3.w1.weight": 0.8024856088475522,
+ "blocks.3.w1.bias": 0.6243261101573547,
+ "blocks.3.w2.weight": 2.2732641732905714,
+ "blocks.4.ln.weight": 0.036862026900053024,
+ "blocks.4.w1.weight": 0.7702369058900084,
+ "blocks.4.w1.bias": 0.671902653164234,
+ "blocks.4.w2.weight": 2.11229934068397,
+ "blocks.5.ln.weight": 0.04049132019281387,
+ "blocks.5.w1.weight": 0.74033776504041,
+ "blocks.5.w1.bias": 0.6447910547850285,
+ "blocks.5.w2.weight": 1.9146335569252138,
+ "blocks.6.ln.weight": 0.03797098994255066,
+ "blocks.6.w1.weight": 0.7241522377185389,
+ "blocks.6.w1.bias": 0.6486550903936706,
+ "blocks.6.w2.weight": 1.8210870137239685,
+ "blocks.7.ln.weight": 0.03962903097271919,
+ "blocks.7.w1.weight": 0.6992516513120532,
+ "blocks.7.w1.bias": 0.7021825186584477,
+ "blocks.7.w2.weight": 1.7902862835380957,
+ "out_ln.weight": 0.026629405096173286,
+ "out_head.weight": 0.5610428179907003,
+ "out_head.bias": 0.24151687322978704
+ }
+ },
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 1.4100907169977823,
+ 1.4334057479222615,
+ 1.4326289967854817,
+ 1.4254953683853149,
+ 1.4169784986495972
+ ],
+ "train_acc": [
+ 0.4805,
+ 0.49806666666666666,
+ 0.49725,
+ 0.5031166666666667,
+ 0.5098
+ ],
+ "test_acc": [
+ 0.5175,
+ 0.5282,
+ 0.5025,
+ 0.5027,
+ 0.5338
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.2141590267419815,
+ 0.0797841027379036,
+ 0.04707183688879013,
+ 0.0032249214127659798,
+ 0.024886084720492363,
+ -0.0050605954602360725,
+ 0.009758025407791138,
+ 0.020020857453346252
+ ],
+ "perturbation_rho": [
+ 0.07338915765285492,
+ -0.004745986312627792,
+ 0.018682830035686493,
+ 0.031185101717710495,
+ -0.02063235454261303,
+ 0.0006608979310840368,
+ 0.0,
+ 0.04759033024311066
+ ],
+ "nudging": {
+ "0.001": [
+ -3.5976991057395935e-06,
+ 2.3283064365386963e-09,
+ -9.313225746154785e-10,
+ -9.313225746154785e-09,
+ 4.656612873077393e-10,
+ -3.725290298461914e-09,
+ 1.3969838619232178e-09,
+ 9.313225746154785e-10
+ ],
+ "0.003": [
+ -1.0745832696557045e-05,
+ 2.3283064365386963e-09,
+ 1.6298145055770874e-09,
+ -2.3283064365386963e-09,
+ 6.752088665962219e-09,
+ 1.0244548320770264e-08,
+ -4.6566128730773926e-09,
+ 0.0
+ ],
+ "0.01": [
+ -3.5760458558797836e-05,
+ -9.313225746154785e-10,
+ 1.3271346688270569e-08,
+ -1.0244548320770264e-08,
+ -8.381903171539307e-09,
+ 4.1443854570388794e-08,
+ 8.847564458847046e-09,
+ 1.30385160446167e-08
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 34.15137184586086,
+ "embed.bias": 25.886722942466992,
+ "blocks.0.ln.weight": 2.2413852214813232,
+ "blocks.0.w1.weight": 42.91370684219911,
+ "blocks.0.w1.bias": 42.38937429728957,
+ "blocks.0.w2.weight": 115.11173260217275,
+ "blocks.1.ln.weight": 2.0233230590820312,
+ "blocks.1.w1.weight": 36.64772802731374,
+ "blocks.1.w1.bias": 34.57367344043412,
+ "blocks.1.w2.weight": 84.1198032305499,
+ "blocks.2.ln.weight": 1.9000216722488403,
+ "blocks.2.w1.weight": 33.172328512058,
+ "blocks.2.w1.bias": 31.908254113444393,
+ "blocks.2.w2.weight": 78.32752075434591,
+ "blocks.3.ln.weight": 1.9099335670471191,
+ "blocks.3.w1.weight": 36.73019631908303,
+ "blocks.3.w1.bias": 32.60666919280332,
+ "blocks.3.w2.weight": 83.75068434979308,
+ "blocks.4.ln.weight": 1.891120195388794,
+ "blocks.4.w1.weight": 35.27032832987592,
+ "blocks.4.w1.bias": 38.017692746712825,
+ "blocks.4.w2.weight": 80.26417466790754,
+ "blocks.5.ln.weight": 2.0106024742126465,
+ "blocks.5.w1.weight": 42.09808335703852,
+ "blocks.5.w1.bias": 43.15100280108635,
+ "blocks.5.w2.weight": 94.64753309078039,
+ "blocks.6.ln.weight": 1.8941009044647217,
+ "blocks.6.w1.weight": 38.94163125135345,
+ "blocks.6.w1.bias": 38.10426587138794,
+ "blocks.6.w2.weight": 84.40488806201412,
+ "blocks.7.ln.weight": 1.9035111665725708,
+ "blocks.7.w1.weight": 38.65051912560395,
+ "blocks.7.w1.bias": 40.760402959190415,
+ "blocks.7.w2.weight": 81.97372863530312,
+ "out_ln.weight": 0.39740806818008423,
+ "out_head.weight": 3.609484615833081,
+ "out_head.bias": 0.8344298895862311
+ }
+ },
+ "state_bridge": {
+ "log": {
+ "train_loss": [
+ 1.7336509002049765,
+ 1.5851847206751506,
+ 1.8742321704864502,
+ 1.8100628153483074,
+ 1.5580067304611207
+ ],
+ "train_acc": [
+ 0.32705,
+ 0.3616333333333333,
+ 0.2679166666666667,
+ 0.31853333333333333,
+ 0.4080166666666667
+ ],
+ "test_acc": [
+ 0.4036,
+ 0.4047,
+ 0.3046,
+ 0.4005,
+ 0.4651
+ ],
+ "state_pred_error": [
+ 5076234.573784879,
+ 343992182.36586666,
+ 517900685.38026667,
+ 557639895.7226666,
+ 383439664.5205333
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.35149621963500977,
+ 0.27368226647377014,
+ 0.045176729559898376,
+ 0.04587914049625397,
+ 0.06403794139623642,
+ 0.06599076837301254,
+ 0.10026843845844269,
+ 0.11267217993736267
+ ],
+ "perturbation_rho": [
+ 0.37996596097946167,
+ 0.0075237625278532505,
+ -0.017497196793556213,
+ 0.001783197745680809,
+ 0.026772135868668556,
+ 0.011043311096727848,
+ 0.0037202914245426655,
+ 0.008577261120080948
+ ],
+ "nudging": {
+ "0.001": [
+ -7.0138368755579e-05,
+ -1.0319054126739502e-06,
+ -6.495974957942963e-08,
+ -4.190951585769653e-09,
+ -3.3993273973464966e-08,
+ -2.2584572434425354e-08,
+ -6.123445928096771e-08,
+ -4.1443854570388794e-08
+ ],
+ "0.003": [
+ -0.00021021789871156216,
+ -3.0745286494493484e-06,
+ -1.0547228157520294e-07,
+ -4.866160452365875e-08,
+ -8.591450750827789e-08,
+ -6.938353180885315e-08,
+ -1.1292286217212677e-07,
+ -9.825453162193298e-08
+ ],
+ "0.01": [
+ -0.0006983885541558266,
+ -1.027202233672142e-05,
+ -3.688037395477295e-07,
+ -1.073349267244339e-07,
+ -2.153683453798294e-07,
+ -2.0815059542655945e-07,
+ -2.6938505470752716e-07,
+ -3.08966264128685e-07
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 4.244627827603776,
+ "embed.bias": 2.284214237417933,
+ "blocks.0.ln.weight": 0.7376585006713867,
+ "blocks.0.w1.weight": 10.052587254542228,
+ "blocks.0.w1.bias": 12.863219234970343,
+ "blocks.0.w2.weight": 32.7856072339516,
+ "blocks.1.ln.weight": 0.8459606170654297,
+ "blocks.1.w1.weight": 17.10440998330836,
+ "blocks.1.w1.bias": 22.587196662115986,
+ "blocks.1.w2.weight": 48.94107595877311,
+ "blocks.2.ln.weight": 0.5776991248130798,
+ "blocks.2.w1.weight": 12.17296546064332,
+ "blocks.2.w1.bias": 14.464613959802604,
+ "blocks.2.w2.weight": 33.58238884289355,
+ "blocks.3.ln.weight": 0.6916943788528442,
+ "blocks.3.w1.weight": 11.021146543598332,
+ "blocks.3.w1.bias": 11.779720628235973,
+ "blocks.3.w2.weight": 25.18170826322489,
+ "blocks.4.ln.weight": 0.5363020300865173,
+ "blocks.4.w1.weight": 8.488676390390957,
+ "blocks.4.w1.bias": 11.968348972417077,
+ "blocks.4.w2.weight": 23.562556821259157,
+ "blocks.5.ln.weight": 0.749293863773346,
+ "blocks.5.w1.weight": 13.199470836216618,
+ "blocks.5.w1.bias": 17.384581140704626,
+ "blocks.5.w2.weight": 36.38642209120496,
+ "blocks.6.ln.weight": 0.45835214853286743,
+ "blocks.6.w1.weight": 10.662863447362852,
+ "blocks.6.w1.bias": 15.855775302559838,
+ "blocks.6.w2.weight": 28.70293410646866,
+ "blocks.7.ln.weight": 0.4122738838195801,
+ "blocks.7.w1.weight": 7.193545064718527,
+ "blocks.7.w1.bias": 7.340520731384394,
+ "blocks.7.w2.weight": 22.53669113456487,
+ "out_ln.weight": 0.06885236501693726,
+ "out_head.weight": 1.473306835980063,
+ "out_head.bias": 1.5084479134035678
+ }
+ },
+ "credit_bridge": {
+ "log": {
+ "train_loss": [
+ 2.0466531958262126,
+ 2.2737758037567137,
+ 2.280587441889445,
+ 2.25820095837911,
+ 2.270971960576375
+ ],
+ "train_acc": [
+ 0.22976666666666667,
+ 0.13306666666666667,
+ 0.13921666666666666,
+ 0.15853333333333333,
+ 0.15521666666666667
+ ],
+ "test_acc": [
+ 0.1866,
+ 0.101,
+ 0.1455,
+ 0.1616,
+ 0.0958
+ ],
+ "value_loss": [
+ 1.105676996310552,
+ 0.06329173700014751,
+ 0.02014747195293506,
+ 0.01469622576336066,
+ 0.0050645585257560015
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ -0.04117349535226822,
+ 0.006370606832206249,
+ 0.03125208616256714,
+ -0.015287259593605995,
+ -0.04197325184941292,
+ -0.021368175745010376,
+ 0.009605868719518185,
+ 0.029422588646411896
+ ],
+ "perturbation_rho": [
+ -0.09283949434757233,
+ -0.030718784779310226,
+ 0.00206748116761446,
+ 0.0,
+ -0.0060626850463449955,
+ -0.015737878158688545,
+ 0.02677903138101101,
+ -0.040315717458724976
+ ],
+ "nudging": {
+ "0.001": [
+ 3.939494490623474e-06,
+ -1.4901161193847656e-08,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.003": [
+ 1.1788681149482727e-05,
+ -3.725290298461914e-09,
+ 1.862645149230957e-09,
+ 0.0,
+ 0.0,
+ -1.862645149230957e-09,
+ 1.862645149230957e-09,
+ 0.0
+ ],
+ "0.01": [
+ 3.923662006855011e-05,
+ 2.60770320892334e-08,
+ 7.450580596923828e-09,
+ -1.862645149230957e-09,
+ 1.862645149230957e-09,
+ 1.862645149230957e-09,
+ 1.862645149230957e-09,
+ 5.587935447692871e-09
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 5.5176286267072285,
+ "embed.bias": 5.84115130180781,
+ "blocks.0.ln.weight": 0.7516779899597168,
+ "blocks.0.w1.weight": 13.130250396475844,
+ "blocks.0.w1.bias": 16.418874968953887,
+ "blocks.0.w2.weight": 35.524006089100524,
+ "blocks.1.ln.weight": 1.0247337818145752,
+ "blocks.1.w1.weight": 24.629494668532566,
+ "blocks.1.w1.bias": 31.389502706524333,
+ "blocks.1.w2.weight": 66.32116257377548,
+ "blocks.2.ln.weight": 1.0405563116073608,
+ "blocks.2.w1.weight": 19.820545045709153,
+ "blocks.2.w1.bias": 21.04420170821489,
+ "blocks.2.w2.weight": 47.599865577930004,
+ "blocks.3.ln.weight": 0.698647677898407,
+ "blocks.3.w1.weight": 11.782448138509505,
+ "blocks.3.w1.bias": 11.300932589985935,
+ "blocks.3.w2.weight": 29.52897326429494,
+ "blocks.4.ln.weight": 0.7269545197486877,
+ "blocks.4.w1.weight": 12.151248949786332,
+ "blocks.4.w1.bias": 11.545512427875654,
+ "blocks.4.w2.weight": 31.11028303079019,
+ "blocks.5.ln.weight": 0.7007301449775696,
+ "blocks.5.w1.weight": 10.093534441471926,
+ "blocks.5.w1.bias": 8.779689334059729,
+ "blocks.5.w2.weight": 24.2612493038314,
+ "blocks.6.ln.weight": 0.7457646727561951,
+ "blocks.6.w1.weight": 9.34015610077582,
+ "blocks.6.w1.bias": 7.819986138941612,
+ "blocks.6.w2.weight": 24.326245888357803,
+ "blocks.7.ln.weight": 0.7317199110984802,
+ "blocks.7.w1.weight": 10.73492434511088,
+ "blocks.7.w1.bias": 9.150645079981764,
+ "blocks.7.w2.weight": 27.11222424242763,
+ "out_ln.weight": 0.07713422179222107,
+ "out_head.weight": 1.4131541672079744,
+ "out_head.bias": 0.7976411656775528
+ }
+ }
+ },
+ "config": {
+ "dataset": "fashionmnist",
+ "d_hidden": 256,
+ "num_blocks": 8,
+ "batch_size": 128,
+ "epochs": 5,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 42
+ ],
+ "gpu": 0,
+ "output_dir": "results/smoke_test",
+ "num_classes": 10
+ }
+} \ No newline at end of file