summaryrefslogtreecommitdiff
path: root/results/synth_ladder_v2_hi/summary.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/synth_ladder_v2_hi/summary.json')
-rw-r--r--results/synth_ladder_v2_hi/summary.json3590
1 files changed, 3590 insertions, 0 deletions
diff --git a/results/synth_ladder_v2_hi/summary.json b/results/synth_ladder_v2_hi/summary.json
new file mode 100644
index 0000000..b7ad268
--- /dev/null
+++ b/results/synth_ladder_v2_hi/summary.json
@@ -0,0 +1,3590 @@
+{
+ "a0.5_L2_s42": {
+ "bp": {
+ "test_acc": 0.8845,
+ "mean_bp_cosine": 0.9139105975627899,
+ "mean_rho": 0.9999974966049194,
+ "mean_nudge_001": -0.021973546594381332,
+ "mean_nudge_003": -0.061596330255270004,
+ "mean_nudge_01": -0.16279328987002373,
+ "bp_cosine_per_layer": [
+ 0.9165740013122559,
+ 0.911247193813324
+ ],
+ "rho_per_layer": [
+ 0.9999988079071045,
+ 0.9999961853027344
+ ],
+ "nudge_per_layer": [
+ -0.21485117077827454,
+ -0.11073540896177292
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.8185,
+ "mean_bp_cosine": 0.013388294260948896,
+ "mean_rho": -0.010654313489794731,
+ "mean_nudge_001": 0.00010355231643188745,
+ "mean_nudge_003": 0.00034307173336856067,
+ "mean_nudge_01": 0.0015135867288336158,
+ "bp_cosine_per_layer": [
+ -0.008949288167059422,
+ 0.035725876688957214
+ ],
+ "rho_per_layer": [
+ -0.042064815759658813,
+ 0.02075618878006935
+ ],
+ "nudge_per_layer": [
+ 0.004335631616413593,
+ -0.0013084581587463617
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.8125,
+ "mean_bp_cosine": 0.6582441031932831,
+ "mean_rho": 0.6169608980417252,
+ "mean_nudge_001": -0.013940556207671762,
+ "mean_nudge_003": -0.040253227576613426,
+ "mean_nudge_01": -0.11712449323385954,
+ "bp_cosine_per_layer": [
+ 0.8927175402641296,
+ 0.4237706661224365
+ ],
+ "rho_per_layer": [
+ 0.8139950037002563,
+ 0.41992679238319397
+ ],
+ "nudge_per_layer": [
+ -0.20875152945518494,
+ -0.02549745701253414
+ ],
+ "state_pred_error_per_layer": [
+ 1690.90478515625,
+ 278.7707214355469
+ ],
+ "mean_state_pred_error": 984.8377532958984
+ },
+ "credit_bridge": {
+ "test_acc": 0.6365,
+ "mean_bp_cosine": 0.23397326469421387,
+ "mean_rho": 0.31064942479133606,
+ "mean_nudge_001": -0.004609669325873256,
+ "mean_nudge_003": -0.013776597566902637,
+ "mean_nudge_01": -0.04530538059771061,
+ "bp_cosine_per_layer": [
+ 0.12511783838272095,
+ 0.3428286910057068
+ ],
+ "rho_per_layer": [
+ 0.21235734224319458,
+ 0.40894150733947754
+ ],
+ "nudge_per_layer": [
+ -0.061930932104587555,
+ -0.028679829090833664
+ ],
+ "final_value_loss": 0.48061015357971193,
+ "final_term_loss": 0.14492559936642646,
+ "final_bridge_loss": 0.020528473022580148,
+ "final_tgrad_loss": 0.31515607919692995
+ }
+ },
+ "a0.5_L2_s123": {
+ "bp": {
+ "test_acc": 0.895,
+ "mean_bp_cosine": 0.878325492143631,
+ "mean_rho": 0.9999979734420776,
+ "mean_nudge_001": -0.019721894524991512,
+ "mean_nudge_003": -0.055400675162672997,
+ "mean_nudge_01": -0.14613648504018784,
+ "bp_cosine_per_layer": [
+ 0.8870643973350525,
+ 0.8695865869522095
+ ],
+ "rho_per_layer": [
+ 0.9999991059303284,
+ 0.9999968409538269
+ ],
+ "nudge_per_layer": [
+ -0.1920192688703537,
+ -0.10025370121002197
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.8405,
+ "mean_bp_cosine": 0.08467924036085606,
+ "mean_rho": 0.07321365177631378,
+ "mean_nudge_001": -0.0010137155040865764,
+ "mean_nudge_003": -0.0030202887719497085,
+ "mean_nudge_01": -0.009814865421503782,
+ "bp_cosine_per_layer": [
+ 0.05535196140408516,
+ 0.11400651931762695
+ ],
+ "rho_per_layer": [
+ 0.07898944616317749,
+ 0.06743785738945007
+ ],
+ "nudge_per_layer": [
+ -0.015302825719118118,
+ -0.004326905123889446
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.8305,
+ "mean_bp_cosine": 0.659128725528717,
+ "mean_rho": 0.5701804161071777,
+ "mean_nudge_001": -0.012253106338903308,
+ "mean_nudge_003": -0.035399872343987226,
+ "mean_nudge_01": -0.10352936759591103,
+ "bp_cosine_per_layer": [
+ 0.8879689574241638,
+ 0.43028849363327026
+ ],
+ "rho_per_layer": [
+ 0.7560213804244995,
+ 0.38433945178985596
+ ],
+ "nudge_per_layer": [
+ -0.18288554251194,
+ -0.02417319267988205
+ ],
+ "state_pred_error_per_layer": [
+ 1696.6031494140625,
+ 278.31060791015625
+ ],
+ "mean_state_pred_error": 987.4568786621094
+ },
+ "credit_bridge": {
+ "test_acc": 0.634,
+ "mean_bp_cosine": 0.21542657166719437,
+ "mean_rho": 0.3815983682870865,
+ "mean_nudge_001": -0.004454661626368761,
+ "mean_nudge_003": -0.0132976695895195,
+ "mean_nudge_01": -0.04354145657271147,
+ "bp_cosine_per_layer": [
+ 0.11650891602039337,
+ 0.31434422731399536
+ ],
+ "rho_per_layer": [
+ 0.23759987950325012,
+ 0.5255968570709229
+ ],
+ "nudge_per_layer": [
+ -0.05865050479769707,
+ -0.028432408347725868
+ ],
+ "final_value_loss": 0.5198581983566284,
+ "final_term_loss": 0.1660363396883011,
+ "final_bridge_loss": 0.026915473002195357,
+ "final_tgrad_loss": 0.32690638537406924
+ }
+ },
+ "a0.5_L2_s456": {
+ "bp": {
+ "test_acc": 0.875,
+ "mean_bp_cosine": 0.8901284635066986,
+ "mean_rho": 0.9999979138374329,
+ "mean_nudge_001": -0.024593621492385864,
+ "mean_nudge_003": -0.06968314573168755,
+ "mean_nudge_01": -0.18856997787952423,
+ "bp_cosine_per_layer": [
+ 0.8992727398872375,
+ 0.8809841871261597
+ ],
+ "rho_per_layer": [
+ 0.999998927116394,
+ 0.9999969005584717
+ ],
+ "nudge_per_layer": [
+ -0.2502431571483612,
+ -0.12689679861068726
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.816,
+ "mean_bp_cosine": 0.04272198863327503,
+ "mean_rho": 0.0372689850628376,
+ "mean_nudge_001": -0.0004823530907742679,
+ "mean_nudge_003": -0.0014278392773121595,
+ "mean_nudge_01": -0.004543605959042907,
+ "bp_cosine_per_layer": [
+ 0.017043430358171463,
+ 0.0684005469083786
+ ],
+ "rho_per_layer": [
+ -0.039058439433574677,
+ 0.11359640955924988
+ ],
+ "nudge_per_layer": [
+ -0.005804130807518959,
+ -0.0032830811105668545
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.807,
+ "mean_bp_cosine": 0.6757712662220001,
+ "mean_rho": 0.6000171899795532,
+ "mean_nudge_001": -0.01571581745520234,
+ "mean_nudge_003": -0.04562427382916212,
+ "mean_nudge_01": -0.13532716780900955,
+ "bp_cosine_per_layer": [
+ 0.8896123766899109,
+ 0.46193015575408936
+ ],
+ "rho_per_layer": [
+ 0.8089620471000671,
+ 0.3910723328590393
+ ],
+ "nudge_per_layer": [
+ -0.23563425242900848,
+ -0.03502008318901062
+ ],
+ "state_pred_error_per_layer": [
+ 1470.6129150390625,
+ 266.84222412109375
+ ],
+ "mean_state_pred_error": 868.7275695800781
+ },
+ "credit_bridge": {
+ "test_acc": 0.6605,
+ "mean_bp_cosine": 0.23513908684253693,
+ "mean_rho": 0.3664921522140503,
+ "mean_nudge_001": -0.005338509101420641,
+ "mean_nudge_003": -0.015948554500937462,
+ "mean_nudge_01": -0.052367652766406536,
+ "bp_cosine_per_layer": [
+ 0.15452352166175842,
+ 0.31575465202331543
+ ],
+ "rho_per_layer": [
+ 0.26963475346565247,
+ 0.4633495509624481
+ ],
+ "nudge_per_layer": [
+ -0.07802344858646393,
+ -0.026711856946349144
+ ],
+ "final_value_loss": 0.3851433990240097,
+ "final_term_loss": 0.10070284021273256,
+ "final_bridge_loss": 0.01744421122968197,
+ "final_tgrad_loss": 0.26699634662866595
+ }
+ },
+ "a0.5_L4_s42": {
+ "bp": {
+ "test_acc": 0.883,
+ "mean_bp_cosine": 0.8371244817972183,
+ "mean_rho": 0.9999875724315643,
+ "mean_nudge_001": -0.0205106531502679,
+ "mean_nudge_003": -0.05829396191984415,
+ "mean_nudge_01": -0.15927099250257015,
+ "bp_cosine_per_layer": [
+ 0.8572149276733398,
+ 0.8503379821777344,
+ 0.8309497833251953,
+ 0.8099952340126038
+ ],
+ "rho_per_layer": [
+ 0.9999990463256836,
+ 0.9999980330467224,
+ 0.999992311000824,
+ 0.9999608993530273
+ ],
+ "nudge_per_layer": [
+ -0.29344552755355835,
+ -0.19200363755226135,
+ -0.10158533602952957,
+ -0.050049468874931335
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.825,
+ "mean_bp_cosine": 0.08056101959664375,
+ "mean_rho": 0.07036433229222894,
+ "mean_nudge_001": -0.0004525305703282356,
+ "mean_nudge_003": -0.0013484152732416987,
+ "mean_nudge_01": -0.004391533322632313,
+ "bp_cosine_per_layer": [
+ 0.0060789515264332294,
+ 0.09873200953006744,
+ 0.10723873972892761,
+ 0.1101943776011467
+ ],
+ "rho_per_layer": [
+ -0.012974856421351433,
+ 0.14552229642868042,
+ 0.08513970673084259,
+ 0.06377018243074417
+ ],
+ "nudge_per_layer": [
+ -0.0025177751667797565,
+ -0.006775799673050642,
+ -0.004219442140311003,
+ -0.00405311631038785
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.7175,
+ "mean_bp_cosine": 0.389427974820137,
+ "mean_rho": 0.3547045961022377,
+ "mean_nudge_001": -0.006397623001248576,
+ "mean_nudge_003": -0.018759612808935344,
+ "mean_nudge_01": -0.05771041696425527,
+ "bp_cosine_per_layer": [
+ 0.81822270154953,
+ 0.44441917538642883,
+ 0.15419423580169678,
+ 0.14087578654289246
+ ],
+ "rho_per_layer": [
+ 0.7556701302528381,
+ 0.42722654342651367,
+ 0.13306331634521484,
+ 0.10285839438438416
+ ],
+ "nudge_per_layer": [
+ -0.2031538337469101,
+ -0.01867133006453514,
+ -0.004740326199680567,
+ -0.00427617784589529
+ ],
+ "state_pred_error_per_layer": [
+ 6433.45703125,
+ 2426.59619140625,
+ 1950.234130859375,
+ 1929.63232421875
+ ],
+ "mean_state_pred_error": 3184.9799194335938
+ },
+ "credit_bridge": {
+ "test_acc": 0.662,
+ "mean_bp_cosine": 0.2142251469194889,
+ "mean_rho": 0.3778097555041313,
+ "mean_nudge_001": -0.002453161054290831,
+ "mean_nudge_003": -0.007344013080000877,
+ "mean_nudge_01": -0.024294552858918905,
+ "bp_cosine_per_layer": [
+ 0.08037468791007996,
+ 0.24492917954921722,
+ 0.2708122730255127,
+ 0.26078444719314575
+ ],
+ "rho_per_layer": [
+ 0.14874565601348877,
+ 0.4311285614967346,
+ 0.48388832807540894,
+ 0.44747647643089294
+ ],
+ "nudge_per_layer": [
+ -0.03933826461434364,
+ -0.020281529054045677,
+ -0.01922188699245453,
+ -0.018336530774831772
+ ],
+ "final_value_loss": 0.4397273305892944,
+ "final_term_loss": 0.15641304728984834,
+ "final_bridge_loss": 0.03557699205875397,
+ "final_tgrad_loss": 0.24773729231357575
+ }
+ },
+ "a0.5_L4_s123": {
+ "bp": {
+ "test_acc": 0.882,
+ "mean_bp_cosine": 0.7865977436304092,
+ "mean_rho": 0.9999855011701584,
+ "mean_nudge_001": -0.019216455286368728,
+ "mean_nudge_003": -0.05414565000683069,
+ "mean_nudge_01": -0.14401183556765318,
+ "bp_cosine_per_layer": [
+ 0.817541241645813,
+ 0.7992762923240662,
+ 0.7803024053573608,
+ 0.749271035194397
+ ],
+ "rho_per_layer": [
+ 0.9999992847442627,
+ 0.9999971389770508,
+ 0.9999915361404419,
+ 0.9999540448188782
+ ],
+ "nudge_per_layer": [
+ -0.25995129346847534,
+ -0.17589232325553894,
+ -0.09449617564678192,
+ -0.04570754989981651
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.8045,
+ "mean_bp_cosine": 0.13894247123971581,
+ "mean_rho": 0.15608793403953314,
+ "mean_nudge_001": -0.0003833890805253759,
+ "mean_nudge_003": -0.0011389600113034248,
+ "mean_nudge_01": -0.0036781042581424117,
+ "bp_cosine_per_layer": [
+ -0.027901431545615196,
+ 0.2837410271167755,
+ 0.17885790765285492,
+ 0.12107238173484802
+ ],
+ "rho_per_layer": [
+ -0.007988158613443375,
+ 0.25683730840682983,
+ 0.21096175909042358,
+ 0.1645408272743225
+ ],
+ "nudge_per_layer": [
+ 0.005267709027975798,
+ -0.009674372151494026,
+ -0.005893784575164318,
+ -0.0044119693338871
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.7345,
+ "mean_bp_cosine": 0.3779419884085655,
+ "mean_rho": 0.3288300409913063,
+ "mean_nudge_001": -0.006349694755044766,
+ "mean_nudge_003": -0.018683148198761046,
+ "mean_nudge_01": -0.05818818649277091,
+ "bp_cosine_per_layer": [
+ 0.8108769655227661,
+ 0.3922353684902191,
+ 0.15907782316207886,
+ 0.149577796459198
+ ],
+ "rho_per_layer": [
+ 0.6536975502967834,
+ 0.33696871995925903,
+ 0.15431806445121765,
+ 0.1703358292579651
+ ],
+ "nudge_per_layer": [
+ -0.2048409879207611,
+ -0.01618226245045662,
+ -0.006159749813377857,
+ -0.005569745786488056
+ ],
+ "state_pred_error_per_layer": [
+ 3474.9130859375,
+ 1348.3646240234375,
+ 1462.0654296875,
+ 924.672607421875
+ ],
+ "mean_state_pred_error": 1802.5039367675781
+ },
+ "credit_bridge": {
+ "test_acc": 0.668,
+ "mean_bp_cosine": 0.16247223876416683,
+ "mean_rho": 0.2929591853171587,
+ "mean_nudge_001": -0.001968744763871655,
+ "mean_nudge_003": -0.005892619024962187,
+ "mean_nudge_01": -0.019490228034555912,
+ "bp_cosine_per_layer": [
+ 0.05806349962949753,
+ 0.19388319551944733,
+ 0.1997416615486145,
+ 0.19820059835910797
+ ],
+ "rho_per_layer": [
+ 0.05481833964586258,
+ 0.3572811782360077,
+ 0.4186326265335083,
+ 0.3411045968532562
+ ],
+ "nudge_per_layer": [
+ -0.0286177359521389,
+ -0.01660466194152832,
+ -0.01654389500617981,
+ -0.016194619238376617
+ ],
+ "final_value_loss": 0.4729928963661194,
+ "final_term_loss": 0.15622255086898804,
+ "final_bridge_loss": 0.034451057982444765,
+ "final_tgrad_loss": 0.28231928570270537
+ }
+ },
+ "a0.5_L4_s456": {
+ "bp": {
+ "test_acc": 0.8855,
+ "mean_bp_cosine": 0.7703797668218613,
+ "mean_rho": 0.999986544251442,
+ "mean_nudge_001": -0.017331300303339958,
+ "mean_nudge_003": -0.04883333737961948,
+ "mean_nudge_01": -0.13096668012440205,
+ "bp_cosine_per_layer": [
+ 0.792909562587738,
+ 0.7804109454154968,
+ 0.7618845105171204,
+ 0.7463140487670898
+ ],
+ "rho_per_layer": [
+ 0.9999990463256836,
+ 0.9999976754188538,
+ 0.9999912977218628,
+ 0.9999581575393677
+ ],
+ "nudge_per_layer": [
+ -0.2336917370557785,
+ -0.1588592678308487,
+ -0.0874030739068985,
+ -0.04391264170408249
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.817,
+ "mean_bp_cosine": 0.07182160578668118,
+ "mean_rho": 0.09282832965254784,
+ "mean_nudge_001": -0.0003612322652770672,
+ "mean_nudge_003": -0.0010782249155454338,
+ "mean_nudge_01": -0.0035168152826372534,
+ "bp_cosine_per_layer": [
+ -0.010789386928081512,
+ 0.08449429273605347,
+ 0.10027095675468445,
+ 0.1133105605840683
+ ],
+ "rho_per_layer": [
+ -0.022197294980287552,
+ 0.02167895808815956,
+ 0.18905602395534515,
+ 0.18277563154697418
+ ],
+ "nudge_per_layer": [
+ -0.0005262043559923768,
+ -0.005684657022356987,
+ -0.003974507562816143,
+ -0.0038818921893835068
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.7675,
+ "mean_bp_cosine": 0.4189938008785248,
+ "mean_rho": 0.348801476880908,
+ "mean_nudge_001": -0.006437422598537523,
+ "mean_nudge_003": -0.018775500764604658,
+ "mean_nudge_01": -0.056744852219708264,
+ "bp_cosine_per_layer": [
+ 0.8223247528076172,
+ 0.5256583094596863,
+ 0.17289233207702637,
+ 0.1550998091697693
+ ],
+ "rho_per_layer": [
+ 0.7023045420646667,
+ 0.4341009259223938,
+ 0.10907860845327377,
+ 0.14972183108329773
+ ],
+ "nudge_per_layer": [
+ -0.19577056169509888,
+ -0.022263746708631516,
+ -0.004863455425947905,
+ -0.0040816450491547585
+ ],
+ "state_pred_error_per_layer": [
+ 6500.04248046875,
+ 2179.638671875,
+ 1695.392333984375,
+ 1466.414306640625
+ ],
+ "mean_state_pred_error": 2960.3719482421875
+ },
+ "credit_bridge": {
+ "test_acc": 0.617,
+ "mean_bp_cosine": 0.19905064720660448,
+ "mean_rho": 0.27845675125718117,
+ "mean_nudge_001": -0.0017877554928418249,
+ "mean_nudge_003": -0.005349543411284685,
+ "mean_nudge_01": -0.017666283063590527,
+ "bp_cosine_per_layer": [
+ 0.0613640733063221,
+ 0.23986753821372986,
+ 0.24101567268371582,
+ 0.25395530462265015
+ ],
+ "rho_per_layer": [
+ 0.07897584140300751,
+ 0.3258228003978729,
+ 0.35056060552597046,
+ 0.3584677577018738
+ ],
+ "nudge_per_layer": [
+ -0.019116222858428955,
+ -0.01759088784456253,
+ -0.016751645132899284,
+ -0.017206376418471336
+ ],
+ "final_value_loss": 0.4424677228450775,
+ "final_term_loss": 0.12383701201379299,
+ "final_bridge_loss": 0.02319883658438921,
+ "final_tgrad_loss": 0.29543187527656556
+ }
+ },
+ "a0.5_L8_s42": {
+ "bp": {
+ "test_acc": 0.8715,
+ "mean_bp_cosine": 0.808967724442482,
+ "mean_rho": 0.999945156276226,
+ "mean_nudge_001": -0.011501751199830323,
+ "mean_nudge_003": -0.03289153927471489,
+ "mean_nudge_01": -0.09379934845492244,
+ "bp_cosine_per_layer": [
+ 0.8294941186904907,
+ 0.823101282119751,
+ 0.815970778465271,
+ 0.8095235824584961,
+ 0.8066394329071045,
+ 0.8012610673904419,
+ 0.7956615686416626,
+ 0.7900899648666382
+ ],
+ "rho_per_layer": [
+ 0.999998927116394,
+ 0.999997615814209,
+ 0.9999938011169434,
+ 0.9999845027923584,
+ 0.9999604225158691,
+ 0.9999330043792725,
+ 0.999873697757721,
+ 0.999819278717041
+ ],
+ "nudge_per_layer": [
+ -0.2528620958328247,
+ -0.17482446134090424,
+ -0.11384513974189758,
+ -0.07313278317451477,
+ -0.04917728155851364,
+ -0.03563641011714935,
+ -0.02781001478433609,
+ -0.02310660108923912
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.804,
+ "mean_bp_cosine": 0.06822564313188195,
+ "mean_rho": 0.08298261812888086,
+ "mean_nudge_001": -5.095545566291548e-05,
+ "mean_nudge_003": -0.0001400069668306969,
+ "mean_nudge_01": -0.0003324677818454802,
+ "bp_cosine_per_layer": [
+ -0.029147807508707047,
+ 0.09590217471122742,
+ 0.0916377604007721,
+ 0.10714393854141235,
+ 0.10661958158016205,
+ 0.05731643736362457,
+ 0.06447312980890274,
+ 0.05185993015766144
+ ],
+ "rho_per_layer": [
+ -0.08288859575986862,
+ 0.14039787650108337,
+ 0.1433517336845398,
+ 0.1548803746700287,
+ 0.09298646450042725,
+ 0.08800182491540909,
+ 0.09949750453233719,
+ 0.02763376198709011
+ ],
+ "nudge_per_layer": [
+ 0.019184602424502373,
+ -0.0062692309729754925,
+ -0.0031640869565308094,
+ -0.0033698435872793198,
+ -0.003262510057538748,
+ -0.0018756084609776735,
+ -0.0022803605534136295,
+ -0.0016227040905505419
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.7265,
+ "mean_bp_cosine": 0.2766533959656954,
+ "mean_rho": 0.24636799190193415,
+ "mean_nudge_001": -0.003215807260858128,
+ "mean_nudge_003": -0.00946771033341065,
+ "mean_nudge_01": -0.029514338413719088,
+ "bp_cosine_per_layer": [
+ 0.8188973069190979,
+ 0.4508240222930908,
+ 0.20906424522399902,
+ 0.16529136896133423,
+ 0.1612900048494339,
+ 0.1292058229446411,
+ 0.14780420064926147,
+ 0.1308501958847046
+ ],
+ "rho_per_layer": [
+ 0.7345798015594482,
+ 0.40806666016578674,
+ 0.18922817707061768,
+ 0.1360217034816742,
+ 0.11187596619129181,
+ 0.1472519189119339,
+ 0.12442155927419662,
+ 0.11949814856052399
+ ],
+ "nudge_per_layer": [
+ -0.19829359650611877,
+ -0.01426965557038784,
+ -0.005409521050751209,
+ -0.004344802349805832,
+ -0.0038992268964648247,
+ -0.0032464847899973392,
+ -0.003532196395099163,
+ -0.00311922375112772
+ ],
+ "state_pred_error_per_layer": [
+ 5640.76416015625,
+ 3768.9912109375,
+ 2209.80126953125,
+ 1863.6328125,
+ 1833.0330810546875,
+ 2052.747802734375,
+ 1687.1876220703125,
+ 1871.18310546875
+ ],
+ "mean_state_pred_error": 2615.9176330566406
+ },
+ "credit_bridge": {
+ "test_acc": 0.5935,
+ "mean_bp_cosine": 0.12945402902550995,
+ "mean_rho": 0.20130334049463272,
+ "mean_nudge_001": -0.0008943625434767455,
+ "mean_nudge_003": -0.0026800249179359525,
+ "mean_nudge_01": -0.00888864736771211,
+ "bp_cosine_per_layer": [
+ 0.014968650415539742,
+ 0.08219218999147415,
+ 0.12315872311592102,
+ 0.1350458562374115,
+ 0.16176681220531464,
+ 0.1692444086074829,
+ 0.17282617092132568,
+ 0.17642942070960999
+ ],
+ "rho_per_layer": [
+ 0.09865723550319672,
+ 0.1636437624692917,
+ 0.19447889924049377,
+ 0.2091381549835205,
+ 0.2243458330631256,
+ 0.23168572783470154,
+ 0.2512606978416443,
+ 0.23721641302108765
+ ],
+ "nudge_per_layer": [
+ -0.006006492767482996,
+ -0.006066862493753433,
+ -0.008294559083878994,
+ -0.008802486583590508,
+ -0.009770728647708893,
+ -0.010544568300247192,
+ -0.010718668811023235,
+ -0.010904812254011631
+ ],
+ "final_value_loss": 0.3977136660575867,
+ "final_term_loss": 0.13710964921712876,
+ "final_bridge_loss": 0.018799800185859205,
+ "final_tgrad_loss": 0.24180421624183654
+ }
+ },
+ "a0.5_L8_s123": {
+ "bp": {
+ "test_acc": 0.868,
+ "mean_bp_cosine": 0.8070773705840111,
+ "mean_rho": 0.9999594464898109,
+ "mean_nudge_001": -0.01314116342109628,
+ "mean_nudge_003": -0.037657674751244485,
+ "mean_nudge_01": -0.10643287934362888,
+ "bp_cosine_per_layer": [
+ 0.8442516326904297,
+ 0.8351782560348511,
+ 0.8238041400909424,
+ 0.811212420463562,
+ 0.800036609172821,
+ 0.789252519607544,
+ 0.7798817157745361,
+ 0.7730016708374023
+ ],
+ "rho_per_layer": [
+ 0.9999992251396179,
+ 0.9999983906745911,
+ 0.9999960660934448,
+ 0.99998939037323,
+ 0.9999715685844421,
+ 0.9999511241912842,
+ 0.9999076128005981,
+ 0.9998621940612793
+ ],
+ "nudge_per_layer": [
+ -0.281266987323761,
+ -0.2009655237197876,
+ -0.1321270614862442,
+ -0.08429376780986786,
+ -0.05586903542280197,
+ -0.039932381361722946,
+ -0.031076554208993912,
+ -0.025931723415851593
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.8,
+ "mean_bp_cosine": 0.07366255111992359,
+ "mean_rho": 0.07397386711090803,
+ "mean_nudge_001": -8.963746586232446e-05,
+ "mean_nudge_003": -0.0002625839406391606,
+ "mean_nudge_01": -0.0007999172084964812,
+ "bp_cosine_per_layer": [
+ -0.02832707017660141,
+ 0.13987571001052856,
+ 0.07857642322778702,
+ 0.061437755823135376,
+ 0.0877213403582573,
+ 0.09552451223134995,
+ 0.07042402029037476,
+ 0.08406771719455719
+ ],
+ "rho_per_layer": [
+ 0.034647777676582336,
+ 0.1467832326889038,
+ 0.036387018859386444,
+ 0.061308689415454865,
+ 0.1038040965795517,
+ 0.09023141860961914,
+ 0.03672575205564499,
+ 0.08190295100212097
+ ],
+ "nudge_per_layer": [
+ 0.012113340198993683,
+ -0.00537356361746788,
+ -0.0023620566353201866,
+ -0.001645779935643077,
+ -0.002037967788055539,
+ -0.0027765799313783646,
+ -0.001988787204027176,
+ -0.002327942755073309
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.718,
+ "mean_bp_cosine": 0.2835564874112606,
+ "mean_rho": 0.2681517219170928,
+ "mean_nudge_001": -0.0027127867688250262,
+ "mean_nudge_003": -0.007993465682375245,
+ "mean_nudge_01": -0.025023294263519347,
+ "bp_cosine_per_layer": [
+ 0.8429861068725586,
+ 0.3551006317138672,
+ 0.246289923787117,
+ 0.21019335091114044,
+ 0.17309927940368652,
+ 0.14295682311058044,
+ 0.15966862440109253,
+ 0.13815715909004211
+ ],
+ "rho_per_layer": [
+ 0.7732758522033691,
+ 0.2933464050292969,
+ 0.24295836687088013,
+ 0.22880345582962036,
+ 0.1602117419242859,
+ 0.11042392998933792,
+ 0.18763291835784912,
+ 0.14856110513210297
+ ],
+ "nudge_per_layer": [
+ -0.15847395360469818,
+ -0.010836342349648476,
+ -0.007060050964355469,
+ -0.005947217810899019,
+ -0.004753550048917532,
+ -0.004264200571924448,
+ -0.004713424481451511,
+ -0.0041376142762601376
+ ],
+ "state_pred_error_per_layer": [
+ 3389.93017578125,
+ 4477.634765625,
+ 1038.2586669921875,
+ 911.949951171875,
+ 702.6972045898438,
+ 659.9431762695312,
+ 824.164794921875,
+ 821.9293212890625
+ ],
+ "mean_state_pred_error": 1603.3135070800781
+ },
+ "credit_bridge": {
+ "test_acc": 0.6185,
+ "mean_bp_cosine": 0.1525184395723045,
+ "mean_rho": 0.23177338391542435,
+ "mean_nudge_001": -0.0011540915293153375,
+ "mean_nudge_003": -0.0034589636488817632,
+ "mean_nudge_01": -0.01147624314762652,
+ "bp_cosine_per_layer": [
+ 0.024487923830747604,
+ 0.1551763117313385,
+ 0.17440856993198395,
+ 0.18776318430900574,
+ 0.163284569978714,
+ 0.17855775356292725,
+ 0.162883460521698,
+ 0.17358574271202087
+ ],
+ "rho_per_layer": [
+ 0.024775028228759766,
+ 0.25605684518814087,
+ 0.2314496785402298,
+ 0.2697882056236267,
+ 0.24329833686351776,
+ 0.3152206242084503,
+ 0.23843368887901306,
+ 0.2751646637916565
+ ],
+ "nudge_per_layer": [
+ -0.010280786082148552,
+ -0.011451397091150284,
+ -0.01173271145671606,
+ -0.012431012466549873,
+ -0.01105603575706482,
+ -0.011893808841705322,
+ -0.011241357773542404,
+ -0.011722835712134838
+ ],
+ "final_value_loss": 0.3728706964492798,
+ "final_term_loss": 0.12118487646579743,
+ "final_bridge_loss": 0.015310661105066539,
+ "final_tgrad_loss": 0.23637515988349914
+ }
+ },
+ "a0.5_L8_s456": {
+ "bp": {
+ "test_acc": 0.8555,
+ "mean_bp_cosine": 0.8527287542819977,
+ "mean_rho": 0.9999570250511169,
+ "mean_nudge_001": -0.01194569593644701,
+ "mean_nudge_003": -0.033871308725792915,
+ "mean_nudge_01": -0.09340489702299237,
+ "bp_cosine_per_layer": [
+ 0.8810831904411316,
+ 0.8730225563049316,
+ 0.8656145334243774,
+ 0.8578245639801025,
+ 0.8490546345710754,
+ 0.8397257328033447,
+ 0.8311692476272583,
+ 0.8243355751037598
+ ],
+ "rho_per_layer": [
+ 0.9999987483024597,
+ 0.9999980330467224,
+ 0.9999955892562866,
+ 0.9999854564666748,
+ 0.9999719858169556,
+ 0.999948263168335,
+ 0.9998974204063416,
+ 0.9998607039451599
+ ],
+ "nudge_per_layer": [
+ -0.23731596767902374,
+ -0.17453062534332275,
+ -0.11795195937156677,
+ -0.07674264907836914,
+ -0.05135927349328995,
+ -0.036901768296957016,
+ -0.028667811304330826,
+ -0.02376912161707878
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.7985,
+ "mean_bp_cosine": 0.09374871966429055,
+ "mean_rho": 0.12165694544091821,
+ "mean_nudge_001": -0.0004589786858559819,
+ "mean_nudge_003": -0.0013758796121692285,
+ "mean_nudge_01": -0.004529613710474223,
+ "bp_cosine_per_layer": [
+ 0.027731137350201607,
+ 0.10604047030210495,
+ 0.13601002097129822,
+ 0.07596071809530258,
+ 0.0985877588391304,
+ 0.08992618322372437,
+ 0.1115533858537674,
+ 0.10418008267879486
+ ],
+ "rho_per_layer": [
+ -0.01300876960158348,
+ 0.12486347556114197,
+ 0.1899794042110443,
+ 0.08801613748073578,
+ 0.11934874951839447,
+ 0.15905101597309113,
+ 0.1374979466199875,
+ 0.167507603764534
+ ],
+ "nudge_per_layer": [
+ -0.011210349388420582,
+ -0.00580610241740942,
+ -0.004417200107127428,
+ -0.002277099061757326,
+ -0.003015844151377678,
+ -0.0030763214454054832,
+ -0.003333096392452717,
+ -0.003100896719843149
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.7505,
+ "mean_bp_cosine": 0.25108483247458935,
+ "mean_rho": 0.22314902767539024,
+ "mean_nudge_001": -0.0032180442212847993,
+ "mean_nudge_003": -0.009445599382161163,
+ "mean_nudge_01": -0.029192803369369358,
+ "bp_cosine_per_layer": [
+ 0.8145060539245605,
+ 0.39495280385017395,
+ 0.15602949261665344,
+ 0.14954066276550293,
+ 0.1189848780632019,
+ 0.14297258853912354,
+ 0.11834269762039185,
+ 0.11334948241710663
+ ],
+ "rho_per_layer": [
+ 0.7131592035293579,
+ 0.31938445568084717,
+ 0.13574811816215515,
+ 0.13510501384735107,
+ 0.12680554389953613,
+ 0.13444143533706665,
+ 0.1260460913181305,
+ 0.09450235962867737
+ ],
+ "nudge_per_layer": [
+ -0.20040717720985413,
+ -0.012472910806536674,
+ -0.003969438374042511,
+ -0.003768536727875471,
+ -0.0031205681152641773,
+ -0.00363306887447834,
+ -0.0031901695765554905,
+ -0.002980557270348072
+ ],
+ "state_pred_error_per_layer": [
+ 7208.7744140625,
+ 4043.077392578125,
+ 2431.6259765625,
+ 2036.907958984375,
+ 1977.547119140625,
+ 1708.2327880859375,
+ 1901.497314453125,
+ 1821.6331787109375
+ ],
+ "mean_state_pred_error": 2891.1620178222656
+ },
+ "credit_bridge": {
+ "test_acc": 0.555,
+ "mean_bp_cosine": 0.12328627426177263,
+ "mean_rho": 0.16509935073554516,
+ "mean_nudge_001": -0.000985160811978858,
+ "mean_nudge_003": -0.002952177223050967,
+ "mean_nudge_01": -0.009791445219889283,
+ "bp_cosine_per_layer": [
+ 0.03383665531873703,
+ 0.10378465056419373,
+ 0.1522345095872879,
+ 0.12050338089466095,
+ 0.12787620723247528,
+ 0.13963481783866882,
+ 0.14998120069503784,
+ 0.1584387719631195
+ ],
+ "rho_per_layer": [
+ 0.02018044888973236,
+ 0.14589767158031464,
+ 0.20607107877731323,
+ 0.18045580387115479,
+ 0.1894514560699463,
+ 0.16447019577026367,
+ 0.1924649477005005,
+ 0.2218032032251358
+ ],
+ "nudge_per_layer": [
+ -0.00981426052749157,
+ -0.00849075522273779,
+ -0.010712197050452232,
+ -0.009203735738992691,
+ -0.009092864580452442,
+ -0.00978156179189682,
+ -0.010470103472471237,
+ -0.010766083374619484
+ ],
+ "final_value_loss": 0.5412774887084961,
+ "final_term_loss": 0.23150972747802734,
+ "final_bridge_loss": 0.02621319934129715,
+ "final_tgrad_loss": 0.28355456256866457
+ }
+ },
+ "a0.5_L12_s42": {
+ "bp": {
+ "test_acc": 0.8585,
+ "mean_bp_cosine": 0.8183901458978653,
+ "mean_rho": 0.9998798171679179,
+ "mean_nudge_001": -0.011188714299350977,
+ "mean_nudge_003": -0.03214278844340394,
+ "mean_nudge_01": -0.09301998885348439,
+ "bp_cosine_per_layer": [
+ 0.8657882213592529,
+ 0.8541754484176636,
+ 0.8436384201049805,
+ 0.832263708114624,
+ 0.8208613991737366,
+ 0.8122134208679199,
+ 0.8057717084884644,
+ 0.8017721176147461,
+ 0.7986597418785095,
+ 0.7967146635055542,
+ 0.7952107787132263,
+ 0.7936121225357056
+ ],
+ "rho_per_layer": [
+ 0.9999991655349731,
+ 0.9999977350234985,
+ 0.9999939203262329,
+ 0.9999861121177673,
+ 0.9999700784683228,
+ 0.9999415874481201,
+ 0.9999051094055176,
+ 0.9998413324356079,
+ 0.9998086094856262,
+ 0.9997647404670715,
+ 0.9996839165687561,
+ 0.9996654987335205
+ ],
+ "nudge_per_layer": [
+ -0.3461707830429077,
+ -0.23528623580932617,
+ -0.151905819773674,
+ -0.0986800491809845,
+ -0.06758347898721695,
+ -0.04991145431995392,
+ -0.039162103086709976,
+ -0.032274406403303146,
+ -0.02771918475627899,
+ -0.024551689624786377,
+ -0.02231007255613804,
+ -0.020684588700532913
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.791,
+ "mean_bp_cosine": 0.07122930279001594,
+ "mean_rho": 0.10592638049274683,
+ "mean_nudge_001": -0.00047647209915642935,
+ "mean_nudge_003": -0.0014203774189809337,
+ "mean_nudge_01": -0.004644906090106815,
+ "bp_cosine_per_layer": [
+ 0.023988625034689903,
+ 0.0961650088429451,
+ 0.10208466649055481,
+ 0.07022920250892639,
+ 0.09604307264089584,
+ 0.07800711691379547,
+ 0.08064866811037064,
+ 0.015484225004911423,
+ 0.04617477208375931,
+ 0.10530653595924377,
+ 0.06217034161090851,
+ 0.07844939827919006
+ ],
+ "rho_per_layer": [
+ -0.021668296307325363,
+ 0.13302525877952576,
+ 0.14676621556282043,
+ 0.11482817679643631,
+ 0.09230026602745056,
+ 0.15572097897529602,
+ 0.084853395819664,
+ 0.06741442531347275,
+ 0.09585727006196976,
+ 0.17402535676956177,
+ 0.1249062716960907,
+ 0.10308724641799927
+ ],
+ "nudge_per_layer": [
+ -0.013704460114240646,
+ -0.009605048224329948,
+ -0.004514003172516823,
+ -0.00345102627761662,
+ -0.003412249032407999,
+ -0.0038682736922055483,
+ -0.0031317053362727165,
+ -0.0012646813411265612,
+ -0.002444072160869837,
+ -0.004538315813988447,
+ -0.0027466074097901583,
+ -0.0030584305059164762
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.684,
+ "mean_bp_cosine": 0.17019233045478663,
+ "mean_rho": 0.14254611171782017,
+ "mean_nudge_001": -0.0020112845547070415,
+ "mean_nudge_003": -0.005932022473037553,
+ "mean_nudge_01": -0.01860854132488991,
+ "bp_cosine_per_layer": [
+ 0.7669721841812134,
+ 0.3159201741218567,
+ 0.12931227684020996,
+ 0.11285121738910675,
+ 0.11607236415147781,
+ 0.09898597002029419,
+ 0.08882047981023788,
+ 0.08661012351512909,
+ 0.08416090905666351,
+ 0.07891363650560379,
+ 0.08571723103523254,
+ 0.07797139883041382
+ ],
+ "rho_per_layer": [
+ 0.6671731472015381,
+ 0.26826971769332886,
+ 0.10340800136327744,
+ 0.06843797862529755,
+ 0.0669264942407608,
+ 0.08176875114440918,
+ 0.10683348774909973,
+ 0.06641782820224762,
+ 0.09755225479602814,
+ 0.04477599635720253,
+ 0.0847611278295517,
+ 0.05422855541110039
+ ],
+ "nudge_per_layer": [
+ -0.18878120183944702,
+ -0.009807860478758812,
+ -0.003219514386728406,
+ -0.0027990485541522503,
+ -0.0029557342641055584,
+ -0.002479594200849533,
+ -0.0022394107654690742,
+ -0.0022681057453155518,
+ -0.0022236446384340525,
+ -0.0021239176858216524,
+ -0.002271223347634077,
+ -0.0021332399919629097
+ ],
+ "state_pred_error_per_layer": [
+ 11168.2578125,
+ 8443.55078125,
+ 4301.74609375,
+ 3486.31884765625,
+ 3134.353515625,
+ 2733.8369140625,
+ 2666.431640625,
+ 2571.673095703125,
+ 2489.172119140625,
+ 2732.81298828125,
+ 3179.04296875,
+ 3116.75927734375
+ ],
+ "mean_state_pred_error": 4168.663004557292
+ },
+ "credit_bridge": {
+ "test_acc": 0.571,
+ "mean_bp_cosine": 0.08207109943032265,
+ "mean_rho": 0.14231220919949314,
+ "mean_nudge_001": -0.0008072109461257545,
+ "mean_nudge_003": -0.0024178701957377293,
+ "mean_nudge_01": -0.008001433801837265,
+ "bp_cosine_per_layer": [
+ 0.009321734309196472,
+ 0.04962325841188431,
+ 0.06880976259708405,
+ 0.07808464020490646,
+ 0.08887439966201782,
+ 0.0946938544511795,
+ 0.09941184520721436,
+ 0.09979166835546494,
+ 0.10197117179632187,
+ 0.10147081315517426,
+ 0.09914548695087433,
+ 0.0936545580625534
+ ],
+ "rho_per_layer": [
+ -0.0036096302792429924,
+ 0.0626683160662651,
+ 0.10237888991832733,
+ 0.12722331285476685,
+ 0.138666570186615,
+ 0.14094725251197815,
+ 0.1720128357410431,
+ 0.18820315599441528,
+ 0.1971924901008606,
+ 0.19901405274868011,
+ 0.18742212653160095,
+ 0.1956271380186081
+ ],
+ "nudge_per_layer": [
+ -0.00799381174147129,
+ -0.0042757005430758,
+ -0.005744780879467726,
+ -0.006799482740461826,
+ -0.0076793828047811985,
+ -0.008442584425210953,
+ -0.008797119371592999,
+ -0.009013657458126545,
+ -0.009450232610106468,
+ -0.009471941739320755,
+ -0.009278533980250359,
+ -0.009069977328181267
+ ],
+ "final_value_loss": 0.95497522315979,
+ "final_term_loss": 0.6288936994552612,
+ "final_bridge_loss": 0.0344168305516243,
+ "final_tgrad_loss": 0.2916646807193756
+ }
+ },
+ "a0.5_L12_s123": {
+ "bp": {
+ "test_acc": 0.873,
+ "mean_bp_cosine": 0.7415736317634583,
+ "mean_rho": 0.9999099324146906,
+ "mean_nudge_001": -0.010182377610666057,
+ "mean_nudge_003": -0.029109801825446386,
+ "mean_nudge_01": -0.08149818579355876,
+ "bp_cosine_per_layer": [
+ 0.8060421943664551,
+ 0.7944625616073608,
+ 0.776944637298584,
+ 0.7588614821434021,
+ 0.7418972849845886,
+ 0.7322722673416138,
+ 0.724165678024292,
+ 0.7197043299674988,
+ 0.7152823209762573,
+ 0.7119243144989014,
+ 0.709496021270752,
+ 0.7078304886817932
+ ],
+ "rho_per_layer": [
+ 0.9999996423721313,
+ 0.9999984502792358,
+ 0.9999962449073792,
+ 0.999989926815033,
+ 0.9999754428863525,
+ 0.9999579191207886,
+ 0.999927818775177,
+ 0.999887228012085,
+ 0.9998751878738403,
+ 0.9997915029525757,
+ 0.9997637867927551,
+ 0.9997560381889343
+ ],
+ "nudge_per_layer": [
+ -0.2872876822948456,
+ -0.20931334793567657,
+ -0.13937950134277344,
+ -0.09144100546836853,
+ -0.06199805811047554,
+ -0.04483566805720329,
+ -0.03463221341371536,
+ -0.02817366272211075,
+ -0.023888790979981422,
+ -0.02094285935163498,
+ -0.01881779544055462,
+ -0.01726764440536499
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.7975,
+ "mean_bp_cosine": 0.06331516286203016,
+ "mean_rho": 0.04216622615543505,
+ "mean_nudge_001": -0.00018036465129019538,
+ "mean_nudge_003": -0.0005390862012670065,
+ "mean_nudge_01": -0.0017679805799465005,
+ "bp_cosine_per_layer": [
+ 0.004078918602317572,
+ 0.1059243381023407,
+ 0.07574640959501266,
+ 0.07308551669120789,
+ 0.066571444272995,
+ 0.056897446513175964,
+ 0.12165610492229462,
+ 0.06462406367063522,
+ 0.04925639182329178,
+ 0.04602370783686638,
+ 0.035759277641773224,
+ 0.06015833467245102
+ ],
+ "rho_per_layer": [
+ -0.011486321687698364,
+ 0.04376016557216644,
+ 0.037421341985464096,
+ 0.05220063030719757,
+ 0.09364941716194153,
+ -0.03169674053788185,
+ 0.15961039066314697,
+ 0.10634914040565491,
+ 0.03384825587272644,
+ 0.02390148863196373,
+ -0.010392685420811176,
+ 0.00882963091135025
+ ],
+ "nudge_per_layer": [
+ -0.0026711553800851107,
+ -0.003443576628342271,
+ -0.001918894238770008,
+ -0.0020233127288520336,
+ -0.0016027885721996427,
+ -0.0010300527792423964,
+ -0.002917288802564144,
+ -0.001525502186268568,
+ -0.0009703689720481634,
+ -0.0010098961647599936,
+ -0.0008095581433735788,
+ -0.0012933723628520966
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.69,
+ "mean_bp_cosine": 0.17323703753451505,
+ "mean_rho": 0.15179013274610043,
+ "mean_nudge_001": -0.0019852635256635645,
+ "mean_nudge_003": -0.005834519392616737,
+ "mean_nudge_01": -0.018113662886510912,
+ "bp_cosine_per_layer": [
+ 0.7613614797592163,
+ 0.3896995782852173,
+ 0.1309610903263092,
+ 0.10979019105434418,
+ 0.09164053201675415,
+ 0.07316795736551285,
+ 0.09407100081443787,
+ 0.08964815735816956,
+ 0.08292470127344131,
+ 0.08648289740085602,
+ 0.0870373547077179,
+ 0.08205951005220413
+ ],
+ "rho_per_layer": [
+ 0.6734859943389893,
+ 0.37621644139289856,
+ 0.08932416141033173,
+ 0.11710754036903381,
+ 0.07942430675029755,
+ 0.058268360793590546,
+ 0.05698401480913162,
+ 0.12727776169776917,
+ 0.03869014233350754,
+ 0.06775026768445969,
+ 0.0798446387052536,
+ 0.05710796266794205
+ ],
+ "nudge_per_layer": [
+ -0.1828688532114029,
+ -0.012644743546843529,
+ -0.003011793363839388,
+ -0.0024378912057727575,
+ -0.0020753229036927223,
+ -0.0017659795703366399,
+ -0.0021767604630440474,
+ -0.0021774054039269686,
+ -0.0019914493896067142,
+ -0.0021301559172570705,
+ -0.0020812181755900383,
+ -0.0020023814868181944
+ ],
+ "state_pred_error_per_layer": [
+ 12496.853515625,
+ 8106.66162109375,
+ 5059.9169921875,
+ 4050.405517578125,
+ 3454.0888671875,
+ 2936.005859375,
+ 2830.2294921875,
+ 2863.870361328125,
+ 3118.476806640625,
+ 3786.361083984375,
+ 3251.337890625,
+ 3255.708740234375
+ ],
+ "mean_state_pred_error": 4600.826395670573
+ },
+ "credit_bridge": {
+ "test_acc": 0.6545,
+ "mean_bp_cosine": -0.010937775252386928,
+ "mean_rho": 0.02020453056320548,
+ "mean_nudge_001": 7.376461204936884e-05,
+ "mean_nudge_003": 0.00022662243100057822,
+ "mean_nudge_01": 0.0008031492385877451,
+ "bp_cosine_per_layer": [
+ -0.022733785212039948,
+ -0.008966443128883839,
+ -0.020323125645518303,
+ -0.018136776983737946,
+ -0.01592089980840683,
+ -0.019174236804246902,
+ -0.014491843990981579,
+ -0.016727179288864136,
+ -0.008660020306706429,
+ -0.007111798040568829,
+ 0.0011803526431322098,
+ 0.019812453538179398
+ ],
+ "rho_per_layer": [
+ -0.05155084282159805,
+ 0.03821132332086563,
+ 0.07940525561571121,
+ 0.014752240851521492,
+ 0.016678672283887863,
+ 0.04385560005903244,
+ 0.03276895359158516,
+ -0.0006132312119007111,
+ -0.024450641125440598,
+ -0.029637619853019714,
+ 0.058109357953071594,
+ 0.06492529809474945
+ ],
+ "nudge_per_layer": [
+ 0.00777015183120966,
+ 0.00029987754533067346,
+ 0.00037500812322832644,
+ 0.00043640032527036965,
+ 0.0005594875547103584,
+ 0.0007026067469269037,
+ 0.00045700964983552694,
+ 0.000550219090655446,
+ 0.00020889028382953256,
+ 0.00013992507592774928,
+ -0.0004261335707269609,
+ -0.0014356517931446433
+ ],
+ "final_value_loss": 1.470289986038208,
+ "final_term_loss": 0.35005189373493195,
+ "final_bridge_loss": 0.9054676934719086,
+ "final_tgrad_loss": 0.2147704033613205
+ }
+ },
+ "a0.5_L12_s456": {
+ "bp": {
+ "test_acc": 0.869,
+ "mean_bp_cosine": 0.74041115740935,
+ "mean_rho": 0.9998869399229685,
+ "mean_nudge_001": -0.007502871051353092,
+ "mean_nudge_003": -0.02132872895648082,
+ "mean_nudge_01": -0.05926296177009741,
+ "bp_cosine_per_layer": [
+ 0.802544355392456,
+ 0.7848162055015564,
+ 0.7700465321540833,
+ 0.7570744752883911,
+ 0.7440193891525269,
+ 0.733696699142456,
+ 0.7256457805633545,
+ 0.7199540734291077,
+ 0.7157886028289795,
+ 0.7124584913253784,
+ 0.7102035284042358,
+ 0.7086857557296753
+ ],
+ "rho_per_layer": [
+ 0.9999985694885254,
+ 0.9999974966049194,
+ 0.9999951720237732,
+ 0.9999867677688599,
+ 0.9999691843986511,
+ 0.9999383687973022,
+ 0.9999032020568848,
+ 0.9998719692230225,
+ 0.9998380541801453,
+ 0.9998047351837158,
+ 0.9996931552886963,
+ 0.9996466040611267
+ ],
+ "nudge_per_layer": [
+ -0.20057430863380432,
+ -0.1480334997177124,
+ -0.10051561146974564,
+ -0.0672251284122467,
+ -0.04664912819862366,
+ -0.03438428044319153,
+ -0.026901239529252052,
+ -0.02211749367415905,
+ -0.018912356346845627,
+ -0.01670587807893753,
+ -0.015132123604416847,
+ -0.01400449313223362
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.8,
+ "mean_bp_cosine": 0.11594532305995624,
+ "mean_rho": 0.11397512660672267,
+ "mean_nudge_001": -0.00042300097387245234,
+ "mean_nudge_003": -0.0012634664356786136,
+ "mean_nudge_01": -0.0041745746857486665,
+ "bp_cosine_per_layer": [
+ 0.04262668639421463,
+ 0.2711353898048401,
+ 0.1898173838853836,
+ 0.1387583613395691,
+ 0.09531620889902115,
+ 0.1376194804906845,
+ 0.07653278112411499,
+ 0.08707999438047409,
+ 0.09030534327030182,
+ 0.10221391171216965,
+ 0.06503984332084656,
+ 0.09489849209785461
+ ],
+ "rho_per_layer": [
+ 0.0572824701666832,
+ 0.20349135994911194,
+ 0.20036441087722778,
+ 0.17148703336715698,
+ 0.0623050183057785,
+ 0.14095279574394226,
+ 0.05262026563286781,
+ 0.12087561190128326,
+ 0.10731191188097,
+ 0.061124786734580994,
+ 0.07995927333831787,
+ 0.10992658138275146
+ ],
+ "nudge_per_layer": [
+ -0.009360449388623238,
+ -0.00823313370347023,
+ -0.005617598537355661,
+ -0.004333253484219313,
+ -0.0029935596976429224,
+ -0.0036506117321550846,
+ -0.002341690007597208,
+ -0.002613792195916176,
+ -0.0027945097535848618,
+ -0.003059752518311143,
+ -0.002222315641120076,
+ -0.002874229568988085
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.702,
+ "mean_bp_cosine": 0.18659504254659018,
+ "mean_rho": 0.1786113940179348,
+ "mean_nudge_001": -0.002035917636627952,
+ "mean_nudge_003": -0.0060201529073917,
+ "mean_nudge_01": -0.019059499570478994,
+ "bp_cosine_per_layer": [
+ 0.7615377902984619,
+ 0.3628881573677063,
+ 0.1397334486246109,
+ 0.13061293959617615,
+ 0.11024273186922073,
+ 0.09393852204084396,
+ 0.10003305226564407,
+ 0.10794281214475632,
+ 0.10362739115953445,
+ 0.10100233554840088,
+ 0.1030983105301857,
+ 0.12448301911354065
+ ],
+ "rho_per_layer": [
+ 0.7019654512405396,
+ 0.3051794767379761,
+ 0.12004730850458145,
+ 0.11974964290857315,
+ 0.1315283179283142,
+ 0.11543487757444382,
+ 0.08415813744068146,
+ 0.14185138046741486,
+ 0.12905646860599518,
+ 0.0691840872168541,
+ 0.12997986376285553,
+ 0.09520171582698822
+ ],
+ "nudge_per_layer": [
+ -0.1852446049451828,
+ -0.011355580762028694,
+ -0.003981029614806175,
+ -0.0038526845164597034,
+ -0.0031567115802317858,
+ -0.0028176922351121902,
+ -0.0029711187817156315,
+ -0.0031051787082105875,
+ -0.0029434349853545427,
+ -0.002931142458692193,
+ -0.002905802335590124,
+ -0.0034490139223635197
+ ],
+ "state_pred_error_per_layer": [
+ 8110.80078125,
+ 4497.13623046875,
+ 2448.651123046875,
+ 2213.206298828125,
+ 2038.592041015625,
+ 2361.478515625,
+ 2122.5341796875,
+ 2178.11474609375,
+ 2310.2265625,
+ 2081.50390625,
+ 2114.170654296875,
+ 2407.947998046875
+ ],
+ "mean_state_pred_error": 2907.0302530924478
+ },
+ "credit_bridge": {
+ "test_acc": 0.6375,
+ "mean_bp_cosine": 0.09317115658389714,
+ "mean_rho": 0.17472073963532844,
+ "mean_nudge_001": -0.000727248170733219,
+ "mean_nudge_003": -0.0021776299763587303,
+ "mean_nudge_01": -0.007225943821443555,
+ "bp_cosine_per_layer": [
+ -0.0012992812553420663,
+ 0.028360359370708466,
+ 0.07222752273082733,
+ 0.06384990364313126,
+ 0.0745362713932991,
+ 0.10235601663589478,
+ 0.11958298832178116,
+ 0.12767711281776428,
+ 0.12978672981262207,
+ 0.13033980131149292,
+ 0.131376713514328,
+ 0.13925974071025848
+ ],
+ "rho_per_layer": [
+ -0.036700520664453506,
+ 0.08258875459432602,
+ 0.18529893457889557,
+ 0.1350553333759308,
+ 0.14971259236335754,
+ 0.23370781540870667,
+ 0.15428856015205383,
+ 0.2475280910730362,
+ 0.20684200525283813,
+ 0.26022571325302124,
+ 0.23770767450332642,
+ 0.24039392173290253
+ ],
+ "nudge_per_layer": [
+ 0.0004691533395089209,
+ -0.002260619541630149,
+ -0.007056917063891888,
+ -0.005040735937654972,
+ -0.005857650190591812,
+ -0.007526098750531673,
+ -0.008702869527041912,
+ -0.009377602487802505,
+ -0.009931675158441067,
+ -0.01026402972638607,
+ -0.010433407500386238,
+ -0.010728873312473297
+ ],
+ "final_value_loss": 0.6376882638454437,
+ "final_term_loss": 0.3444120800256729,
+ "final_bridge_loss": 0.029638116455078124,
+ "final_tgrad_loss": 0.2636380691766739
+ }
+ },
+ "a1.0_L2_s42": {
+ "bp": {
+ "test_acc": 0.7915,
+ "mean_bp_cosine": 0.9376864433288574,
+ "mean_rho": 0.9999988675117493,
+ "mean_nudge_001": -0.040167851373553276,
+ "mean_nudge_003": -0.11654911190271378,
+ "mean_nudge_01": -0.34635232388973236,
+ "bp_cosine_per_layer": [
+ 0.937772274017334,
+ 0.9376006126403809
+ ],
+ "rho_per_layer": [
+ 0.9999990463256836,
+ 0.9999986886978149
+ ],
+ "nudge_per_layer": [
+ -0.4167234003543854,
+ -0.27598124742507935
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.7025,
+ "mean_bp_cosine": 0.007199164479970932,
+ "mean_rho": 0.005297745577991009,
+ "mean_nudge_001": -7.51367933844449e-05,
+ "mean_nudge_003": -0.00021808056044392288,
+ "mean_nudge_01": -0.000639150632196106,
+ "bp_cosine_per_layer": [
+ -0.005922339856624603,
+ 0.020320668816566467
+ ],
+ "rho_per_layer": [
+ -0.003393532708287239,
+ 0.013989023864269257
+ ],
+ "nudge_per_layer": [
+ 5.659737507812679e-05,
+ -0.0013348986394703388
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6735,
+ "mean_bp_cosine": 0.5210442394018173,
+ "mean_rho": 0.48512911796569824,
+ "mean_nudge_001": -0.011768221855163574,
+ "mean_nudge_003": -0.034833950689062476,
+ "mean_nudge_01": -0.11062158830463886,
+ "bp_cosine_per_layer": [
+ 0.6727198958396912,
+ 0.3693685829639435
+ ],
+ "rho_per_layer": [
+ 0.6028042435646057,
+ 0.36745399236679077
+ ],
+ "nudge_per_layer": [
+ -0.19608698785305023,
+ -0.025156188756227493
+ ],
+ "state_pred_error_per_layer": [
+ 4083.197509765625,
+ 262.47991943359375
+ ],
+ "mean_state_pred_error": 2172.8387145996094
+ },
+ "credit_bridge": {
+ "test_acc": 0.5125,
+ "mean_bp_cosine": 0.5678956210613251,
+ "mean_rho": 0.5935650169849396,
+ "mean_nudge_001": -0.00795893557369709,
+ "mean_nudge_003": -0.023799872025847435,
+ "mean_nudge_01": -0.07842501997947693,
+ "bp_cosine_per_layer": [
+ 0.39126425981521606,
+ 0.7445269823074341
+ ],
+ "rho_per_layer": [
+ 0.44417524337768555,
+ 0.7429547905921936
+ ],
+ "nudge_per_layer": [
+ -0.08887787163257599,
+ -0.06797216832637787
+ ],
+ "final_value_loss": 0.6212269179344178,
+ "final_term_loss": 0.05304660900235176,
+ "final_bridge_loss": 0.010462266248464584,
+ "final_tgrad_loss": 0.5577180406570434
+ }
+ },
+ "a1.0_L2_s123": {
+ "bp": {
+ "test_acc": 0.809,
+ "mean_bp_cosine": 0.9559402465820312,
+ "mean_rho": 0.9999986886978149,
+ "mean_nudge_001": -0.03185446374118328,
+ "mean_nudge_003": -0.09129266440868378,
+ "mean_nudge_01": -0.258349284529686,
+ "bp_cosine_per_layer": [
+ 0.9615377187728882,
+ 0.9503427743911743
+ ],
+ "rho_per_layer": [
+ 0.9999992847442627,
+ 0.9999980926513672
+ ],
+ "nudge_per_layer": [
+ -0.3078651428222656,
+ -0.20883342623710632
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.7455,
+ "mean_bp_cosine": 0.05108090303838253,
+ "mean_rho": 0.05254313163459301,
+ "mean_nudge_001": -0.0008275873260572553,
+ "mean_nudge_003": -0.0024727254058234394,
+ "mean_nudge_01": -0.008127598091959953,
+ "bp_cosine_per_layer": [
+ 0.057878345251083374,
+ 0.044283460825681686
+ ],
+ "rho_per_layer": [
+ 0.047237616032361984,
+ 0.057848647236824036
+ ],
+ "nudge_per_layer": [
+ -0.013432648032903671,
+ -0.0028225481510162354
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.704,
+ "mean_bp_cosine": 0.5101080536842346,
+ "mean_rho": 0.45375654101371765,
+ "mean_nudge_001": -0.00980611308477819,
+ "mean_nudge_003": -0.02897635381668806,
+ "mean_nudge_01": -0.09152827039361,
+ "bp_cosine_per_layer": [
+ 0.6596157550811768,
+ 0.3606003522872925
+ ],
+ "rho_per_layer": [
+ 0.5883278250694275,
+ 0.3191852569580078
+ ],
+ "nudge_per_layer": [
+ -0.16100725531578064,
+ -0.02204928547143936
+ ],
+ "state_pred_error_per_layer": [
+ 4266.72509765625,
+ 268.82733154296875
+ ],
+ "mean_state_pred_error": 2267.7762145996094
+ },
+ "credit_bridge": {
+ "test_acc": 0.536,
+ "mean_bp_cosine": 0.5000061094760895,
+ "mean_rho": 0.5169470459222794,
+ "mean_nudge_001": -0.007283595856279135,
+ "mean_nudge_003": -0.0217662351205945,
+ "mean_nudge_01": -0.07154248096048832,
+ "bp_cosine_per_layer": [
+ 0.3330497741699219,
+ 0.6669624447822571
+ ],
+ "rho_per_layer": [
+ 0.38148215413093567,
+ 0.652411937713623
+ ],
+ "nudge_per_layer": [
+ -0.08540114760398865,
+ -0.05768381431698799
+ ],
+ "final_value_loss": 0.6294826040267945,
+ "final_term_loss": 0.06573917962312699,
+ "final_bridge_loss": 0.01474373927861452,
+ "final_tgrad_loss": 0.5489996829986572
+ }
+ },
+ "a1.0_L2_s456": {
+ "bp": {
+ "test_acc": 0.7905,
+ "mean_bp_cosine": 0.9266799688339233,
+ "mean_rho": 0.9999988377094269,
+ "mean_nudge_001": -0.03671902138739824,
+ "mean_nudge_003": -0.10590140148997307,
+ "mean_nudge_01": -0.30589545518159866,
+ "bp_cosine_per_layer": [
+ 0.9291538000106812,
+ 0.9242061376571655
+ ],
+ "rho_per_layer": [
+ 0.9999991059303284,
+ 0.9999985694885254
+ ],
+ "nudge_per_layer": [
+ -0.36666756868362427,
+ -0.24512334167957306
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.73,
+ "mean_bp_cosine": 0.03006170690059662,
+ "mean_rho": 0.039368635043501854,
+ "mean_nudge_001": -0.0004903670051135123,
+ "mean_nudge_003": -0.0014640121953561902,
+ "mean_nudge_01": -0.004785260884091258,
+ "bp_cosine_per_layer": [
+ 0.02131858840584755,
+ 0.03880482539534569
+ ],
+ "rho_per_layer": [
+ 0.006325956434011459,
+ 0.07241131365299225
+ ],
+ "nudge_per_layer": [
+ -0.006775922141969204,
+ -0.002794599626213312
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6755,
+ "mean_bp_cosine": 0.5186701416969299,
+ "mean_rho": 0.48068559169769287,
+ "mean_nudge_001": -0.011591368587687612,
+ "mean_nudge_003": -0.03431171411648393,
+ "mean_nudge_01": -0.10901244357228279,
+ "bp_cosine_per_layer": [
+ 0.669547975063324,
+ 0.3677923083305359
+ ],
+ "rho_per_layer": [
+ 0.6219363808631897,
+ 0.33943480253219604
+ ],
+ "nudge_per_layer": [
+ -0.19162335991859436,
+ -0.026401527225971222
+ ],
+ "state_pred_error_per_layer": [
+ 3936.27783203125,
+ 288.300537109375
+ ],
+ "mean_state_pred_error": 2112.2891845703125
+ },
+ "credit_bridge": {
+ "test_acc": 0.544,
+ "mean_bp_cosine": 0.5161235481500626,
+ "mean_rho": 0.5938436686992645,
+ "mean_nudge_001": -0.0068406532518565655,
+ "mean_nudge_003": -0.020453338511288166,
+ "mean_nudge_01": -0.0673653893172741,
+ "bp_cosine_per_layer": [
+ 0.35489675402641296,
+ 0.6773503422737122
+ ],
+ "rho_per_layer": [
+ 0.4646533727645874,
+ 0.7230339646339417
+ ],
+ "nudge_per_layer": [
+ -0.07572861015796661,
+ -0.059002168476581573
+ ],
+ "final_value_loss": 0.6262330022811889,
+ "final_term_loss": 0.049621654653549195,
+ "final_bridge_loss": 0.011661755262315273,
+ "final_tgrad_loss": 0.5649495909690857
+ }
+ },
+ "a1.0_L4_s42": {
+ "bp": {
+ "test_acc": 0.7875,
+ "mean_bp_cosine": 0.882385790348053,
+ "mean_rho": 0.999995619058609,
+ "mean_nudge_001": -0.03646231605671346,
+ "mean_nudge_003": -0.10610398091375828,
+ "mean_nudge_01": -0.31568005308508873,
+ "bp_cosine_per_layer": [
+ 0.8902335166931152,
+ 0.8886877298355103,
+ 0.8827626705169678,
+ 0.8678592443466187
+ ],
+ "rho_per_layer": [
+ 0.9999993443489075,
+ 0.9999990463256836,
+ 0.9999973773956299,
+ 0.9999867081642151
+ ],
+ "nudge_per_layer": [
+ -0.49256381392478943,
+ -0.4056996703147888,
+ -0.2497977763414383,
+ -0.11465895175933838
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.7075,
+ "mean_bp_cosine": 0.060902527533471584,
+ "mean_rho": 0.052925301948562264,
+ "mean_nudge_001": -0.00048208528460236266,
+ "mean_nudge_003": -0.0014429198927246034,
+ "mean_nudge_01": -0.004763618926517665,
+ "bp_cosine_per_layer": [
+ 0.026215966790914536,
+ 0.05776425451040268,
+ 0.07666948437690735,
+ 0.08296040445566177
+ ],
+ "rho_per_layer": [
+ 0.04998716711997986,
+ 0.09949691593647003,
+ 0.049676910042762756,
+ 0.012540214695036411
+ ],
+ "nudge_per_layer": [
+ -0.008544353768229485,
+ -0.0038241599686443806,
+ -0.0033461027778685093,
+ -0.003339859191328287
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6625,
+ "mean_bp_cosine": 0.3484594225883484,
+ "mean_rho": 0.3289090357720852,
+ "mean_nudge_001": -0.005907032289542258,
+ "mean_nudge_003": -0.01748002166277729,
+ "mean_nudge_01": -0.05545389896724373,
+ "bp_cosine_per_layer": [
+ 0.6404350996017456,
+ 0.4214136302471161,
+ 0.18068093061447144,
+ 0.15130802989006042
+ ],
+ "rho_per_layer": [
+ 0.5499319434165955,
+ 0.368219256401062,
+ 0.21391229331493378,
+ 0.1835726499557495
+ ],
+ "nudge_per_layer": [
+ -0.18587297201156616,
+ -0.0235043503344059,
+ -0.00688221026211977,
+ -0.005556063260883093
+ ],
+ "state_pred_error_per_layer": [
+ 10066.107421875,
+ 1273.9140625,
+ 696.594482421875,
+ 612.3014526367188
+ ],
+ "mean_state_pred_error": 3162.2293548583984
+ },
+ "credit_bridge": {
+ "test_acc": 0.558,
+ "mean_bp_cosine": 0.45794273912906647,
+ "mean_rho": 0.5322257168591022,
+ "mean_nudge_001": -0.003842960635665804,
+ "mean_nudge_003": -0.011505396338179708,
+ "mean_nudge_01": -0.038075629621744156,
+ "bp_cosine_per_layer": [
+ 0.17809242010116577,
+ 0.5349531173706055,
+ 0.5522423982620239,
+ 0.5664830207824707
+ ],
+ "rho_per_layer": [
+ 0.22843755781650543,
+ 0.5910820364952087,
+ 0.6707864999771118,
+ 0.638596773147583
+ ],
+ "nudge_per_layer": [
+ -0.044362872838974,
+ -0.03722546622157097,
+ -0.03515344485640526,
+ -0.0355607345700264
+ ],
+ "final_value_loss": 0.38718592133522034,
+ "final_term_loss": 0.06566130868196488,
+ "final_bridge_loss": 0.01777836950570345,
+ "final_tgrad_loss": 0.30374624242782594
+ }
+ },
+ "a1.0_L4_s123": {
+ "bp": {
+ "test_acc": 0.786,
+ "mean_bp_cosine": 0.8366721421480179,
+ "mean_rho": 0.9999945610761642,
+ "mean_nudge_001": -0.03740503964945674,
+ "mean_nudge_003": -0.1080933827906847,
+ "mean_nudge_01": -0.3170367181301117,
+ "bp_cosine_per_layer": [
+ 0.8610074520111084,
+ 0.8541143536567688,
+ 0.8321727514266968,
+ 0.7993940114974976
+ ],
+ "rho_per_layer": [
+ 0.9999990463256836,
+ 0.9999986886978149,
+ 0.9999971389770508,
+ 0.9999833703041077
+ ],
+ "nudge_per_layer": [
+ -0.492245614528656,
+ -0.40577083826065063,
+ -0.25304561853408813,
+ -0.117084801197052
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.682,
+ "mean_bp_cosine": 0.049554066732525826,
+ "mean_rho": 0.06381266703829169,
+ "mean_nudge_001": -0.00014734033902641386,
+ "mean_nudge_003": -0.0004330205119913444,
+ "mean_nudge_01": -0.001343857147730887,
+ "bp_cosine_per_layer": [
+ -0.008613362908363342,
+ 0.039367884397506714,
+ 0.07619941979646683,
+ 0.0912623256444931
+ ],
+ "rho_per_layer": [
+ -0.007624803110957146,
+ 0.008791688829660416,
+ 0.13103844225406647,
+ 0.12304534018039703
+ ],
+ "nudge_per_layer": [
+ 0.005509334150701761,
+ -0.003195145633071661,
+ -0.0036095697432756424,
+ -0.004080047365278006
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6305,
+ "mean_bp_cosine": 0.3143155351281166,
+ "mean_rho": 0.30846646428108215,
+ "mean_nudge_001": -0.005087231853394769,
+ "mean_nudge_003": -0.015093521040398628,
+ "mean_nudge_01": -0.04834054387174547,
+ "bp_cosine_per_layer": [
+ 0.5847928524017334,
+ 0.3501134514808655,
+ 0.17105570435523987,
+ 0.15130013227462769
+ ],
+ "rho_per_layer": [
+ 0.5387442708015442,
+ 0.3080189526081085,
+ 0.17941737174987793,
+ 0.20768526196479797
+ ],
+ "nudge_per_layer": [
+ -0.16164088249206543,
+ -0.01902196928858757,
+ -0.006823995150625706,
+ -0.005875328555703163
+ ],
+ "state_pred_error_per_layer": [
+ 10103.57421875,
+ 1132.8861083984375,
+ 636.5859375,
+ 537.355224609375
+ ],
+ "mean_state_pred_error": 3102.600372314453
+ },
+ "credit_bridge": {
+ "test_acc": 0.502,
+ "mean_bp_cosine": 0.39079025387763977,
+ "mean_rho": 0.4630395397543907,
+ "mean_nudge_001": -0.0038928183494135737,
+ "mean_nudge_003": -0.011659935116767883,
+ "mean_nudge_01": -0.03865493927150965,
+ "bp_cosine_per_layer": [
+ 0.1632033884525299,
+ 0.4602273404598236,
+ 0.4661305546760559,
+ 0.47359973192214966
+ ],
+ "rho_per_layer": [
+ 0.20324298739433289,
+ 0.5429707169532776,
+ 0.5653814077377319,
+ 0.5405630469322205
+ ],
+ "nudge_per_layer": [
+ -0.04415123537182808,
+ -0.037312425673007965,
+ -0.03657253086566925,
+ -0.036583565175533295
+ ],
+ "final_value_loss": 0.5799021621704101,
+ "final_term_loss": 0.1424343505382538,
+ "final_bridge_loss": 0.03182844363451004,
+ "final_tgrad_loss": 0.4056393639087677
+ }
+ },
+ "a1.0_L4_s456": {
+ "bp": {
+ "test_acc": 0.792,
+ "mean_bp_cosine": 0.8552748262882233,
+ "mean_rho": 0.9999953359365463,
+ "mean_nudge_001": -0.03656455362215638,
+ "mean_nudge_003": -0.10595990065485239,
+ "mean_nudge_01": -0.31139715015888214,
+ "bp_cosine_per_layer": [
+ 0.8668075799942017,
+ 0.8621845245361328,
+ 0.8550785779953003,
+ 0.8370286226272583
+ ],
+ "rho_per_layer": [
+ 0.9999995827674866,
+ 0.9999990463256836,
+ 0.999997615814209,
+ 0.9999850988388062
+ ],
+ "nudge_per_layer": [
+ -0.4802546799182892,
+ -0.3984469175338745,
+ -0.2503964900970459,
+ -0.11649051308631897
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.68,
+ "mean_bp_cosine": 0.052356213971506804,
+ "mean_rho": 0.05650564655661583,
+ "mean_nudge_001": -0.0003577733878046274,
+ "mean_nudge_003": -0.0010662981367204338,
+ "mean_nudge_01": -0.0034739490947686136,
+ "bp_cosine_per_layer": [
+ -0.001797341974452138,
+ 0.06668862700462341,
+ 0.05448886379599571,
+ 0.09004470705986023
+ ],
+ "rho_per_layer": [
+ -0.01287321001291275,
+ 0.007983170449733734,
+ 0.10568365454673767,
+ 0.12522897124290466
+ ],
+ "nudge_per_layer": [
+ -0.0016110537108033895,
+ -0.004868227988481522,
+ -0.0030549662187695503,
+ -0.004361548461019993
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.651,
+ "mean_bp_cosine": 0.35348402336239815,
+ "mean_rho": 0.3312904089689255,
+ "mean_nudge_001": -0.005755784470238723,
+ "mean_nudge_003": -0.017025350069161505,
+ "mean_nudge_01": -0.05395022651646286,
+ "bp_cosine_per_layer": [
+ 0.6501579284667969,
+ 0.4189426302909851,
+ 0.1800653487443924,
+ 0.1647701859474182
+ ],
+ "rho_per_layer": [
+ 0.5907484292984009,
+ 0.36159276962280273,
+ 0.19337056577205658,
+ 0.1794498711824417
+ ],
+ "nudge_per_layer": [
+ -0.1790994107723236,
+ -0.023556631058454514,
+ -0.006848426535725594,
+ -0.0062964376993477345
+ ],
+ "state_pred_error_per_layer": [
+ 7107.7138671875,
+ 890.22314453125,
+ 493.5357360839844,
+ 407.69677734375
+ ],
+ "mean_state_pred_error": 2224.792381286621
+ },
+ "credit_bridge": {
+ "test_acc": 0.487,
+ "mean_bp_cosine": 0.5049829035997391,
+ "mean_rho": 0.5321159400045872,
+ "mean_nudge_001": -0.004336995130870491,
+ "mean_nudge_003": -0.012986946385353804,
+ "mean_nudge_01": -0.04301031678915024,
+ "bp_cosine_per_layer": [
+ 0.20670706033706665,
+ 0.594096302986145,
+ 0.6002212762832642,
+ 0.6189069747924805
+ ],
+ "rho_per_layer": [
+ 0.24109239876270294,
+ 0.6317664384841919,
+ 0.6270265579223633,
+ 0.6285783648490906
+ ],
+ "nudge_per_layer": [
+ -0.03731346130371094,
+ -0.04525235667824745,
+ -0.044518306851387024,
+ -0.04495714232325554
+ ],
+ "final_value_loss": 0.46226135368347165,
+ "final_term_loss": 0.049428026616573334,
+ "final_bridge_loss": 0.022721626716852187,
+ "final_tgrad_loss": 0.39011170201301576
+ }
+ },
+ "a1.0_L8_s42": {
+ "bp": {
+ "test_acc": 0.763,
+ "mean_bp_cosine": 0.8278333768248558,
+ "mean_rho": 0.9999853745102882,
+ "mean_nudge_001": -0.029990217997692525,
+ "mean_nudge_003": -0.08752790885046124,
+ "mean_nudge_01": -0.2652519349940121,
+ "bp_cosine_per_layer": [
+ 0.85625159740448,
+ 0.8527897596359253,
+ 0.847720742225647,
+ 0.8408411145210266,
+ 0.831807017326355,
+ 0.8158122301101685,
+ 0.7960221171379089,
+ 0.7814224362373352
+ ],
+ "rho_per_layer": [
+ 0.999999463558197,
+ 0.9999992847442627,
+ 0.9999988079071045,
+ 0.9999978542327881,
+ 0.999994695186615,
+ 0.9999883770942688,
+ 0.9999692440032959,
+ 0.9999352693557739
+ ],
+ "nudge_per_layer": [
+ -0.5478029251098633,
+ -0.4737934172153473,
+ -0.3800549805164337,
+ -0.2769272029399872,
+ -0.18745023012161255,
+ -0.12213317304849625,
+ -0.07957549393177032,
+ -0.05427805706858635
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.657,
+ "mean_bp_cosine": 0.046988741494715214,
+ "mean_rho": 0.0527694383636117,
+ "mean_nudge_001": -0.00015309322225220967,
+ "mean_nudge_003": -0.00045631649845745414,
+ "mean_nudge_01": -0.0014890892343828455,
+ "bp_cosine_per_layer": [
+ -0.01574046164751053,
+ 0.07191511988639832,
+ 0.043905604630708694,
+ 0.07308061420917511,
+ 0.07518148422241211,
+ 0.026394926011562347,
+ 0.06854978203773499,
+ 0.03262286260724068
+ ],
+ "rho_per_layer": [
+ -0.02709903195500374,
+ 0.1010747104883194,
+ 0.06438975036144257,
+ 0.07812117040157318,
+ 0.0766223892569542,
+ 0.026489075273275375,
+ 0.09218208491802216,
+ 0.010375358164310455
+ ],
+ "nudge_per_layer": [
+ 0.007441862486302853,
+ -0.0052239359356462955,
+ -0.0022090799175202847,
+ -0.003076428547501564,
+ -0.0031523762736469507,
+ -0.0013899998739361763,
+ -0.0030318819917738438,
+ -0.0012708738213405013
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.65,
+ "mean_bp_cosine": 0.2592074144631624,
+ "mean_rho": 0.23237370885908604,
+ "mean_nudge_001": -0.0031611585363862105,
+ "mean_nudge_003": -0.009385082448716275,
+ "mean_nudge_01": -0.030122902884613723,
+ "bp_cosine_per_layer": [
+ 0.6320836544036865,
+ 0.4503885507583618,
+ 0.22882479429244995,
+ 0.17507168650627136,
+ 0.15456035733222961,
+ 0.15327030420303345,
+ 0.14079461991786957,
+ 0.1386653482913971
+ ],
+ "rho_per_layer": [
+ 0.5491607189178467,
+ 0.3870346248149872,
+ 0.23711450397968292,
+ 0.15141981840133667,
+ 0.12508505582809448,
+ 0.15914584696292877,
+ 0.13365353643894196,
+ 0.11637556552886963
+ ],
+ "nudge_per_layer": [
+ -0.18924641609191895,
+ -0.02186501771211624,
+ -0.007085676770657301,
+ -0.0053551034070551395,
+ -0.00462403055280447,
+ -0.004574076272547245,
+ -0.004170445259660482,
+ -0.004062457010149956
+ ],
+ "state_pred_error_per_layer": [
+ 9406.7255859375,
+ 1991.255126953125,
+ 1233.173095703125,
+ 996.4456787109375,
+ 824.75537109375,
+ 800.2864990234375,
+ 821.3734130859375,
+ 840.202392578125
+ ],
+ "mean_state_pred_error": 2114.277145385742
+ },
+ "credit_bridge": {
+ "test_acc": 0.5165,
+ "mean_bp_cosine": 0.41811549477279186,
+ "mean_rho": 0.45575808361172676,
+ "mean_nudge_001": -0.002801764407195151,
+ "mean_nudge_003": -0.00839249708224088,
+ "mean_nudge_01": -0.02782702073454857,
+ "bp_cosine_per_layer": [
+ 0.159218892455101,
+ 0.41163527965545654,
+ 0.4353415369987488,
+ 0.4608742594718933,
+ 0.46223077178001404,
+ 0.4579800069332123,
+ 0.4774817228317261,
+ 0.48016148805618286
+ ],
+ "rho_per_layer": [
+ 0.16694357991218567,
+ 0.4445253610610962,
+ 0.4925374388694763,
+ 0.48059922456741333,
+ 0.4989780783653259,
+ 0.5061379075050354,
+ 0.5181043148040771,
+ 0.5382387638092041
+ ],
+ "nudge_per_layer": [
+ -0.030580628663301468,
+ -0.027534715831279755,
+ -0.027298064902424812,
+ -0.027803048491477966,
+ -0.027431834489107132,
+ -0.02679138071835041,
+ -0.027646536007523537,
+ -0.02752995677292347
+ ],
+ "final_value_loss": 0.35056146993637083,
+ "final_term_loss": 0.0784306697010994,
+ "final_bridge_loss": 0.0149920065253973,
+ "final_tgrad_loss": 0.25713879618644714
+ }
+ },
+ "a1.0_L8_s123": {
+ "bp": {
+ "test_acc": 0.7715,
+ "mean_bp_cosine": 0.8317327573895454,
+ "mean_rho": 0.9999875128269196,
+ "mean_nudge_001": -0.028257266676519066,
+ "mean_nudge_003": -0.08214446459896863,
+ "mean_nudge_01": -0.24747182056307793,
+ "bp_cosine_per_layer": [
+ 0.8705248832702637,
+ 0.8637571334838867,
+ 0.8509291410446167,
+ 0.8393645286560059,
+ 0.8308560848236084,
+ 0.8178726434707642,
+ 0.800449013710022,
+ 0.780108630657196
+ ],
+ "rho_per_layer": [
+ 0.9999995231628418,
+ 0.9999995827674866,
+ 0.9999989867210388,
+ 0.9999984502792358,
+ 0.9999953508377075,
+ 0.9999901056289673,
+ 0.9999750852584839,
+ 0.9999430179595947
+ ],
+ "nudge_per_layer": [
+ -0.5067576169967651,
+ -0.4360688626766205,
+ -0.3518902063369751,
+ -0.26053690910339355,
+ -0.1787266880273819,
+ -0.1170111671090126,
+ -0.07650406658649445,
+ -0.052279047667980194
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.67,
+ "mean_bp_cosine": 0.06255943619180471,
+ "mean_rho": 0.0582913524704054,
+ "mean_nudge_001": -0.00016377134670619853,
+ "mean_nudge_003": -0.00048249874453176744,
+ "mean_nudge_01": -0.0015042584564071149,
+ "bp_cosine_per_layer": [
+ -0.006531993858516216,
+ 0.06646430492401123,
+ 0.03470785170793533,
+ 0.06075863167643547,
+ 0.08359120786190033,
+ 0.10361115634441376,
+ 0.07729409635066986,
+ 0.08058023452758789
+ ],
+ "rho_per_layer": [
+ -0.009454472921788692,
+ 0.027615420520305634,
+ 0.016344428062438965,
+ 0.07737872004508972,
+ 0.07998150587081909,
+ 0.10012705624103546,
+ 0.06766189634799957,
+ 0.10667626559734344
+ ],
+ "nudge_per_layer": [
+ 0.008429424837231636,
+ -0.004321999382227659,
+ -0.0012797827366739511,
+ -0.0022665630094707012,
+ -0.003274995367974043,
+ -0.0036867314483970404,
+ -0.0025471593253314495,
+ -0.0030862612184137106
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.63,
+ "mean_bp_cosine": 0.2676183916628361,
+ "mean_rho": 0.249815184623003,
+ "mean_nudge_001": -0.0025806196208577603,
+ "mean_nudge_003": -0.007662267831619829,
+ "mean_nudge_01": -0.024620095442514867,
+ "bp_cosine_per_layer": [
+ 0.6138853430747986,
+ 0.41074037551879883,
+ 0.25203365087509155,
+ 0.20834164321422577,
+ 0.16624599695205688,
+ 0.15929004549980164,
+ 0.15449269115924835,
+ 0.175917387008667
+ ],
+ "rho_per_layer": [
+ 0.5534218549728394,
+ 0.3554393947124481,
+ 0.28831934928894043,
+ 0.1869889795780182,
+ 0.14766299724578857,
+ 0.176305890083313,
+ 0.1294843554496765,
+ 0.16089865565299988
+ ],
+ "nudge_per_layer": [
+ -0.14630448818206787,
+ -0.017482426017522812,
+ -0.00796731747686863,
+ -0.006267632823437452,
+ -0.00492177763953805,
+ -0.00457757618278265,
+ -0.004429594613611698,
+ -0.00500995060428977
+ ],
+ "state_pred_error_per_layer": [
+ 7478.478515625,
+ 1555.7657470703125,
+ 846.884521484375,
+ 607.9534301757812,
+ 659.867919921875,
+ 614.796630859375,
+ 546.969482421875,
+ 518.796142578125
+ ],
+ "mean_state_pred_error": 1603.6890487670898
+ },
+ "credit_bridge": {
+ "test_acc": 0.5695,
+ "mean_bp_cosine": 0.33955336920917034,
+ "mean_rho": 0.4137213062494993,
+ "mean_nudge_001": -0.002328026050236076,
+ "mean_nudge_003": -0.006974202115088701,
+ "mean_nudge_01": -0.023127662017941475,
+ "bp_cosine_per_layer": [
+ 0.08390675485134125,
+ 0.2993828356266022,
+ 0.37482553720474243,
+ 0.3876585066318512,
+ 0.3966418504714966,
+ 0.3863479495048523,
+ 0.3938036561012268,
+ 0.39385986328125
+ ],
+ "rho_per_layer": [
+ 0.09506039321422577,
+ 0.3888479173183441,
+ 0.42724472284317017,
+ 0.5000925064086914,
+ 0.4708487391471863,
+ 0.47097086906433105,
+ 0.48436442017555237,
+ 0.4723408818244934
+ ],
+ "nudge_per_layer": [
+ -0.027181372046470642,
+ -0.02298363298177719,
+ -0.02282092720270157,
+ -0.022664468735456467,
+ -0.02277727797627449,
+ -0.02207607962191105,
+ -0.022199643775820732,
+ -0.02231789380311966
+ ],
+ "final_value_loss": 0.32433377566337585,
+ "final_term_loss": 0.09466714213788509,
+ "final_bridge_loss": 0.018076158130913973,
+ "final_tgrad_loss": 0.21159047515392304
+ }
+ },
+ "a1.0_L8_s456": {
+ "bp": {
+ "test_acc": 0.753,
+ "mean_bp_cosine": 0.8595180436968803,
+ "mean_rho": 0.9999836012721062,
+ "mean_nudge_001": -0.029901663539931178,
+ "mean_nudge_003": -0.08636575657874346,
+ "mean_nudge_01": -0.25306460773572326,
+ "bp_cosine_per_layer": [
+ 0.8814424872398376,
+ 0.8780966401100159,
+ 0.8716025352478027,
+ 0.8659577369689941,
+ 0.8611791133880615,
+ 0.8505971431732178,
+ 0.840730607509613,
+ 0.8265380859375
+ ],
+ "rho_per_layer": [
+ 0.9999989867210388,
+ 0.9999986886978149,
+ 0.9999985694885254,
+ 0.9999977350234985,
+ 0.9999950528144836,
+ 0.9999887943267822,
+ 0.9999659657478333,
+ 0.9999250173568726
+ ],
+ "nudge_per_layer": [
+ -0.4892617166042328,
+ -0.43737056851387024,
+ -0.36532458662986755,
+ -0.27772778272628784,
+ -0.1931857019662857,
+ -0.12626537680625916,
+ -0.08131371438503265,
+ -0.05406741425395012
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.6545,
+ "mean_bp_cosine": 0.07594231329858303,
+ "mean_rho": 0.08383850008249283,
+ "mean_nudge_001": -0.00040534641811973415,
+ "mean_nudge_003": -0.0011938292009290308,
+ "mean_nudge_01": -0.0038653643568977714,
+ "bp_cosine_per_layer": [
+ 0.025392260402441025,
+ 0.05978121981024742,
+ 0.09360896795988083,
+ 0.06215091794729233,
+ 0.08870920538902283,
+ 0.07948237657546997,
+ 0.10833052545785904,
+ 0.0900830328464508
+ ],
+ "rho_per_layer": [
+ -0.015408031642436981,
+ 0.08876338601112366,
+ 0.15722069144248962,
+ 0.07516318559646606,
+ 0.12132002413272858,
+ 0.08764688670635223,
+ 0.0905974954366684,
+ 0.06540436297655106
+ ],
+ "nudge_per_layer": [
+ -0.002068763133138418,
+ -0.004839141853153706,
+ -0.004507332108914852,
+ -0.002498403424397111,
+ -0.004324691370129585,
+ -0.004049480427056551,
+ -0.004787375684827566,
+ -0.0038477268535643816
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6315,
+ "mean_bp_cosine": 0.22162932250648737,
+ "mean_rho": 0.200162704102695,
+ "mean_nudge_001": -0.002804466668749228,
+ "mean_nudge_003": -0.008329451040481217,
+ "mean_nudge_01": -0.026790971111040562,
+ "bp_cosine_per_layer": [
+ 0.6046093106269836,
+ 0.3773959279060364,
+ 0.1675240397453308,
+ 0.13364183902740479,
+ 0.12548640370368958,
+ 0.11966440826654434,
+ 0.11708953976631165,
+ 0.12762311100959778
+ ],
+ "rho_per_layer": [
+ 0.5598001480102539,
+ 0.35775649547576904,
+ 0.14680343866348267,
+ 0.103827565908432,
+ 0.12472978234291077,
+ 0.08794894069433212,
+ 0.12868158519268036,
+ 0.09175367653369904
+ ],
+ "nudge_per_layer": [
+ -0.17137765884399414,
+ -0.018192056566476822,
+ -0.005168645642697811,
+ -0.004143164958804846,
+ -0.0039602769538760185,
+ -0.0037884372286498547,
+ -0.003734107594937086,
+ -0.00396342109888792
+ ],
+ "state_pred_error_per_layer": [
+ 11751.603515625,
+ 2306.73095703125,
+ 1321.091796875,
+ 1033.674560546875,
+ 973.6993408203125,
+ 865.9056396484375,
+ 869.378173828125,
+ 839.1387329101562
+ ],
+ "mean_state_pred_error": 2495.1528396606445
+ },
+ "credit_bridge": {
+ "test_acc": 0.5275,
+ "mean_bp_cosine": 0.33450845070183277,
+ "mean_rho": 0.39851769525557756,
+ "mean_nudge_001": -0.0025428086810279638,
+ "mean_nudge_003": -0.007617499912157655,
+ "mean_nudge_01": -0.025270385667681694,
+ "bp_cosine_per_layer": [
+ 0.1268395036458969,
+ 0.30569249391555786,
+ 0.34143707156181335,
+ 0.3805205225944519,
+ 0.3833070397377014,
+ 0.38344305753707886,
+ 0.3742453455924988,
+ 0.3805825710296631
+ ],
+ "rho_per_layer": [
+ 0.10492167621850967,
+ 0.4008791148662567,
+ 0.42003583908081055,
+ 0.4331238567829132,
+ 0.4291571080684662,
+ 0.4853004217147827,
+ 0.4488537311553955,
+ 0.46586981415748596
+ ],
+ "nudge_per_layer": [
+ -0.02585173025727272,
+ -0.023091215640306473,
+ -0.0244273878633976,
+ -0.026221776381134987,
+ -0.026039035990834236,
+ -0.025849176570773125,
+ -0.025189466774463654,
+ -0.02549329586327076
+ ],
+ "final_value_loss": 0.41436073665618894,
+ "final_term_loss": 0.08663651337623596,
+ "final_bridge_loss": 0.013127461233735085,
+ "final_tgrad_loss": 0.3145967625617981
+ }
+ },
+ "a1.0_L12_s42": {
+ "bp": {
+ "test_acc": 0.761,
+ "mean_bp_cosine": 0.8604618857304255,
+ "mean_rho": 0.9999715387821198,
+ "mean_nudge_001": -0.027060116563613217,
+ "mean_nudge_003": -0.07916912420963247,
+ "mean_nudge_01": -0.2410698818663756,
+ "bp_cosine_per_layer": [
+ 0.9098777174949646,
+ 0.9046642780303955,
+ 0.8960509300231934,
+ 0.8827707171440125,
+ 0.8719829320907593,
+ 0.8605888485908508,
+ 0.8495617508888245,
+ 0.8414114117622375,
+ 0.8343594074249268,
+ 0.8291183114051819,
+ 0.8250235915184021,
+ 0.8201327323913574
+ ],
+ "rho_per_layer": [
+ 0.9999990463256836,
+ 0.9999990463256836,
+ 0.9999988675117493,
+ 0.9999977946281433,
+ 0.9999968409538269,
+ 0.9999942779541016,
+ 0.9999903440475464,
+ 0.9999786615371704,
+ 0.9999630451202393,
+ 0.9999446272850037,
+ 0.9999108910560608,
+ 0.9998850226402283
+ ],
+ "nudge_per_layer": [
+ -0.6227189302444458,
+ -0.5321269631385803,
+ -0.43762683868408203,
+ -0.34503036737442017,
+ -0.26150017976760864,
+ -0.1957385241985321,
+ -0.14543747901916504,
+ -0.10888919234275818,
+ -0.08308196067810059,
+ -0.06497863680124283,
+ -0.05229911208152771,
+ -0.043410398066043854
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.6555,
+ "mean_bp_cosine": 0.07142843399196863,
+ "mean_rho": 0.08962296570340793,
+ "mean_nudge_001": -0.00027090053966579336,
+ "mean_nudge_003": -0.0007314661440129081,
+ "mean_nudge_01": -0.0026503523016193262,
+ "bp_cosine_per_layer": [
+ 0.019931811839342117,
+ 0.08357247710227966,
+ 0.07596792280673981,
+ 0.07454836368560791,
+ 0.08405900746583939,
+ 0.09273561835289001,
+ 0.08532143384218216,
+ 0.014841631054878235,
+ 0.05702097713947296,
+ 0.11365848034620285,
+ 0.0635562390089035,
+ 0.09192724525928497
+ ],
+ "rho_per_layer": [
+ -0.021908380091190338,
+ 0.08644437789916992,
+ 0.133758544921875,
+ 0.11560394614934921,
+ 0.09019643068313599,
+ 0.10901004821062088,
+ 0.05401141196489334,
+ 0.06626297533512115,
+ 0.10668720304965973,
+ 0.11482831090688705,
+ 0.07995637506246567,
+ 0.14062434434890747
+ ],
+ "nudge_per_layer": [
+ 0.012093277648091316,
+ -0.00814887322485447,
+ -0.0036774289328604937,
+ -0.0036643892526626587,
+ -0.0034756590612232685,
+ -0.0045063551515340805,
+ -0.003735880134627223,
+ -0.00101565255317837,
+ -0.0033070247154682875,
+ -0.005390047561377287,
+ -0.0029281126335263252,
+ -0.004048082046210766
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.612,
+ "mean_bp_cosine": 0.2312017778555552,
+ "mean_rho": 0.2218381396184365,
+ "mean_nudge_001": -0.0020883519706937173,
+ "mean_nudge_003": -0.0062129807386857765,
+ "mean_nudge_01": -0.02010280774751057,
+ "bp_cosine_per_layer": [
+ 0.6137553453445435,
+ 0.458263099193573,
+ 0.30694735050201416,
+ 0.21984770894050598,
+ 0.18884725868701935,
+ 0.1519574671983719,
+ 0.14165323972702026,
+ 0.13691727817058563,
+ 0.1416233777999878,
+ 0.126474529504776,
+ 0.13544593751430511,
+ 0.15268874168395996
+ ],
+ "rho_per_layer": [
+ 0.5528259873390198,
+ 0.43722641468048096,
+ 0.3177984952926636,
+ 0.20145072042942047,
+ 0.17441785335540771,
+ 0.10548915714025497,
+ 0.16265320777893066,
+ 0.1351865828037262,
+ 0.16532285511493683,
+ 0.1285737156867981,
+ 0.14820542931556702,
+ 0.13290725648403168
+ ],
+ "nudge_per_layer": [
+ -0.16301177442073822,
+ -0.02157333306968212,
+ -0.011153988540172577,
+ -0.00765608623623848,
+ -0.006283854134380817,
+ -0.005166183691471815,
+ -0.0045799510553479195,
+ -0.004474613815546036,
+ -0.004547867923974991,
+ -0.003950329497456551,
+ -0.004098072648048401,
+ -0.004737637937068939
+ ],
+ "state_pred_error_per_layer": [
+ 9663.3720703125,
+ 2355.42919921875,
+ 1189.673095703125,
+ 946.2671508789062,
+ 890.0131225585938,
+ 836.83837890625,
+ 765.7700805664062,
+ 776.2135009765625,
+ 909.9769287109375,
+ 744.7386474609375,
+ 809.6233520507812,
+ 764.1907958984375
+ ],
+ "mean_state_pred_error": 1721.0088602701824
+ },
+ "credit_bridge": {
+ "test_acc": 0.551,
+ "mean_bp_cosine": 0.24796992043654123,
+ "mean_rho": 0.34521655660743517,
+ "mean_nudge_001": -0.0019821600387028107,
+ "mean_nudge_003": -0.005940369796007872,
+ "mean_nudge_01": -0.01972930335129301,
+ "bp_cosine_per_layer": [
+ 0.050826266407966614,
+ 0.1324397623538971,
+ 0.19395378232002258,
+ 0.22954219579696655,
+ 0.24835197627544403,
+ 0.26261672377586365,
+ 0.2866933345794678,
+ 0.3069983422756195,
+ 0.3148944675922394,
+ 0.31817084550857544,
+ 0.3155951499938965,
+ 0.31555619835853577
+ ],
+ "rho_per_layer": [
+ 0.024354537948966026,
+ 0.23902058601379395,
+ 0.29458120465278625,
+ 0.31519168615341187,
+ 0.3208061456680298,
+ 0.38384467363357544,
+ 0.38460177183151245,
+ 0.4478553831577301,
+ 0.41032421588897705,
+ 0.452781081199646,
+ 0.43433815240859985,
+ 0.434899240732193
+ ],
+ "nudge_per_layer": [
+ -0.018513288348913193,
+ -0.014132995158433914,
+ -0.016322217881679535,
+ -0.017585258930921555,
+ -0.018846090883016586,
+ -0.02027801051735878,
+ -0.021141095086932182,
+ -0.02164183184504509,
+ -0.02207053080201149,
+ -0.022233182564377785,
+ -0.02206714265048504,
+ -0.021919995546340942
+ ],
+ "final_value_loss": 0.40481987361907956,
+ "final_term_loss": 0.14867231681346893,
+ "final_bridge_loss": 0.015895452450215817,
+ "final_tgrad_loss": 0.24025210301876068
+ }
+ },
+ "a1.0_L12_s123": {
+ "bp": {
+ "test_acc": 0.7615,
+ "mean_bp_cosine": 0.8364224582910538,
+ "mean_rho": 0.9999674806992213,
+ "mean_nudge_001": -0.021432781708426774,
+ "mean_nudge_003": -0.061891427962109447,
+ "mean_nudge_01": -0.18090539829184613,
+ "bp_cosine_per_layer": [
+ 0.86488276720047,
+ 0.8622424006462097,
+ 0.8600971698760986,
+ 0.85722416639328,
+ 0.8523166179656982,
+ 0.8457985520362854,
+ 0.8359642028808594,
+ 0.828606367111206,
+ 0.8221874237060547,
+ 0.8125513792037964,
+ 0.80171799659729,
+ 0.7934804558753967
+ ],
+ "rho_per_layer": [
+ 0.9999992251396179,
+ 0.9999991655349731,
+ 0.9999990463256836,
+ 0.9999980330467224,
+ 0.9999971389770508,
+ 0.9999936819076538,
+ 0.9999881386756897,
+ 0.9999800324440002,
+ 0.9999632835388184,
+ 0.999937891960144,
+ 0.9999018311500549,
+ 0.9998522996902466
+ ],
+ "nudge_per_layer": [
+ -0.4491935074329376,
+ -0.38857996463775635,
+ -0.3270212411880493,
+ -0.26439201831817627,
+ -0.20410630106925964,
+ -0.15283547341823578,
+ -0.11351937055587769,
+ -0.08454076200723648,
+ -0.06403174996376038,
+ -0.04978282377123833,
+ -0.03986590355634689,
+ -0.032995663583278656
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.6485,
+ "mean_bp_cosine": 0.05831230893575897,
+ "mean_rho": 0.0407225100013117,
+ "mean_nudge_001": -0.00021713114256272092,
+ "mean_nudge_003": -0.0006509826756276501,
+ "mean_nudge_01": -0.002172412224657213,
+ "bp_cosine_per_layer": [
+ 0.003139778506010771,
+ 0.07545783370733261,
+ 0.07123857736587524,
+ 0.04737270250916481,
+ 0.07089244574308395,
+ 0.05843178555369377,
+ 0.10959646850824356,
+ 0.04730183631181717,
+ 0.05721074715256691,
+ 0.06935717165470123,
+ 0.04019004851579666,
+ 0.04955831170082092
+ ],
+ "rho_per_layer": [
+ -0.020620837807655334,
+ 0.0424807034432888,
+ 0.07906489074230194,
+ -0.014874707907438278,
+ 0.06078936904668808,
+ 0.006801994517445564,
+ 0.11016394942998886,
+ 0.07577681541442871,
+ 0.01940302737057209,
+ 0.0600065141916275,
+ 0.020656054839491844,
+ 0.04902234673500061
+ ],
+ "nudge_per_layer": [
+ 0.00014946935698390007,
+ -0.004455030895769596,
+ -0.0028790468350052834,
+ -0.0015581330517306924,
+ -0.0028997263871133327,
+ -0.0020245155319571495,
+ -0.003806713502854109,
+ -0.0014502943959087133,
+ -0.0017623959574848413,
+ -0.002352846320718527,
+ -0.001400630921125412,
+ -0.001629082253202796
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6055,
+ "mean_bp_cosine": 0.23132580270369849,
+ "mean_rho": 0.21027085681756338,
+ "mean_nudge_001": -0.002061755420678916,
+ "mean_nudge_003": -0.006128282761589314,
+ "mean_nudge_01": -0.019752548774704337,
+ "bp_cosine_per_layer": [
+ 0.5538393259048462,
+ 0.4287089705467224,
+ 0.25277969241142273,
+ 0.2402075231075287,
+ 0.180599182844162,
+ 0.15653815865516663,
+ 0.1736883521080017,
+ 0.18825414776802063,
+ 0.1335570216178894,
+ 0.13271775841712952,
+ 0.15632027387619019,
+ 0.17869922518730164
+ ],
+ "rho_per_layer": [
+ 0.4586557149887085,
+ 0.4002187252044678,
+ 0.23149724304676056,
+ 0.21227607131004333,
+ 0.1842716634273529,
+ 0.16792945563793182,
+ 0.21390791237354279,
+ 0.19318881630897522,
+ 0.08300350606441498,
+ 0.10752588510513306,
+ 0.12254554033279419,
+ 0.14822974801063538
+ ],
+ "nudge_per_layer": [
+ -0.16128812730312347,
+ -0.02071414887905121,
+ -0.008381091989576817,
+ -0.007560182362794876,
+ -0.005691731348633766,
+ -0.0046913521364331245,
+ -0.005232630763202906,
+ -0.0054755983874201775,
+ -0.0038832086138427258,
+ -0.004123975522816181,
+ -0.004747895523905754,
+ -0.005240642465651035
+ ],
+ "state_pred_error_per_layer": [
+ 8762.341796875,
+ 2348.0966796875,
+ 1278.38525390625,
+ 1081.769287109375,
+ 948.214599609375,
+ 985.5714111328125,
+ 775.6072387695312,
+ 713.37109375,
+ 927.2667846679688,
+ 1123.047119140625,
+ 1035.65966796875,
+ 864.7014770507812
+ ],
+ "mean_state_pred_error": 1737.002700805664
+ },
+ "credit_bridge": {
+ "test_acc": 0.4905,
+ "mean_bp_cosine": 0.14494075424348316,
+ "mean_rho": 0.18026241473853588,
+ "mean_nudge_001": -0.0010125784683623351,
+ "mean_nudge_003": -0.003034341447346378,
+ "mean_nudge_01": -0.010073745266709011,
+ "bp_cosine_per_layer": [
+ 0.0054779257625341415,
+ 0.004163481295108795,
+ -0.01823507994413376,
+ 0.06908583641052246,
+ 0.09582538902759552,
+ 0.15172168612480164,
+ 0.18814444541931152,
+ 0.21233659982681274,
+ 0.2397850900888443,
+ 0.26321661472320557,
+ 0.2640886902809143,
+ 0.2636783719062805
+ ],
+ "rho_per_layer": [
+ 0.05151631310582161,
+ 0.03990761935710907,
+ 0.02668120339512825,
+ 0.08933386206626892,
+ 0.12927217781543732,
+ 0.1893344521522522,
+ 0.20202970504760742,
+ 0.27141058444976807,
+ 0.2724490761756897,
+ 0.2844354808330536,
+ 0.2797800898551941,
+ 0.32699841260910034
+ ],
+ "nudge_per_layer": [
+ -0.0015225817915052176,
+ -0.0009501088643446565,
+ 0.00033305209944956005,
+ -0.005592360161244869,
+ -0.00755771528929472,
+ -0.010863769799470901,
+ -0.012987833470106125,
+ -0.014405487105250359,
+ -0.015937766060233116,
+ -0.017140284180641174,
+ -0.017137283459305763,
+ -0.01712280511856079
+ ],
+ "final_value_loss": 0.42473253202438355,
+ "final_term_loss": 0.10016471980810165,
+ "final_bridge_loss": 0.011516085395216941,
+ "final_tgrad_loss": 0.3130517265796661
+ }
+ },
+ "a1.0_L12_s456": {
+ "bp": {
+ "test_acc": 0.762,
+ "mean_bp_cosine": 0.8058839539686838,
+ "mean_rho": 0.999967540303866,
+ "mean_nudge_001": -0.023895990879585344,
+ "mean_nudge_003": -0.06970183023562034,
+ "mean_nudge_01": -0.21104640668878952,
+ "bp_cosine_per_layer": [
+ 0.8338037729263306,
+ 0.8328856229782104,
+ 0.8300410509109497,
+ 0.823561429977417,
+ 0.8153207302093506,
+ 0.8093391060829163,
+ 0.8022103309631348,
+ 0.797042727470398,
+ 0.7909072041511536,
+ 0.7847579121589661,
+ 0.7778322100639343,
+ 0.7729053497314453
+ ],
+ "rho_per_layer": [
+ 0.9999991059303284,
+ 0.999998927116394,
+ 0.9999983906745911,
+ 0.9999978542327881,
+ 0.999996542930603,
+ 0.9999936819076538,
+ 0.9999876022338867,
+ 0.9999791383743286,
+ 0.9999581575393677,
+ 0.9999358057975769,
+ 0.9998983144760132,
+ 0.9998669624328613
+ ],
+ "nudge_per_layer": [
+ -0.5344969034194946,
+ -0.45930254459381104,
+ -0.3820700943470001,
+ -0.30436116456985474,
+ -0.2331882268190384,
+ -0.17455099523067474,
+ -0.12991222739219666,
+ -0.09728521853685379,
+ -0.07412658631801605,
+ -0.05795694515109062,
+ -0.04662308096885681,
+ -0.03868289291858673
+ ]
+ },
+ "dfa": {
+ "test_acc": 0.6705,
+ "mean_bp_cosine": 0.07614415294180314,
+ "mean_rho": 0.07346192157516877,
+ "mean_nudge_001": -0.0004569464314651365,
+ "mean_nudge_003": -0.0013685211645982538,
+ "mean_nudge_01": -0.004532526101684198,
+ "bp_cosine_per_layer": [
+ 0.04563574492931366,
+ 0.07466404139995575,
+ 0.07062304764986038,
+ 0.07941032946109772,
+ 0.08478259295225143,
+ 0.1176375150680542,
+ 0.051365386694669724,
+ 0.07094398140907288,
+ 0.06898803263902664,
+ 0.07310269773006439,
+ 0.0635182335972786,
+ 0.11305823177099228
+ ],
+ "rho_per_layer": [
+ 0.026268895715475082,
+ 0.03733495995402336,
+ 0.07775422930717468,
+ 0.12396883964538574,
+ 0.05687103420495987,
+ 0.13703036308288574,
+ -0.0030320845544338226,
+ 0.08171480149030685,
+ 0.06336408108472824,
+ 0.09909991919994354,
+ 0.06059148907661438,
+ 0.12057653069496155
+ ],
+ "nudge_per_layer": [
+ -0.015672076493501663,
+ -0.0053095086477696896,
+ -0.0031822575256228447,
+ -0.003722358262166381,
+ -0.0036155935376882553,
+ -0.004913205746561289,
+ -0.0017889357404783368,
+ -0.002959918463602662,
+ -0.003063073381781578,
+ -0.003171245101839304,
+ -0.0024787387810647488,
+ -0.004513401538133621
+ ]
+ },
+ "state_bridge": {
+ "test_acc": 0.6015,
+ "mean_bp_cosine": 0.1852269663165013,
+ "mean_rho": 0.18596469921370348,
+ "mean_nudge_001": -0.001999816272776419,
+ "mean_nudge_003": -0.005956100358162075,
+ "mean_nudge_01": -0.01933680862809221,
+ "bp_cosine_per_layer": [
+ 0.5561584234237671,
+ 0.39794063568115234,
+ 0.20452159643173218,
+ 0.14641982316970825,
+ 0.11315252631902695,
+ 0.12314423173666,
+ 0.11100500077009201,
+ 0.11256138980388641,
+ 0.12550771236419678,
+ 0.11898934841156006,
+ 0.11000233888626099,
+ 0.10332056879997253
+ ],
+ "rho_per_layer": [
+ 0.4663659632205963,
+ 0.38622361421585083,
+ 0.20298895239830017,
+ 0.1521472930908203,
+ 0.10572830587625504,
+ 0.14532539248466492,
+ 0.1235864907503128,
+ 0.12295880913734436,
+ 0.1263602077960968,
+ 0.1123446375131607,
+ 0.14707674086093903,
+ 0.1404699832201004
+ ],
+ "nudge_per_layer": [
+ -0.16852372884750366,
+ -0.020911922678351402,
+ -0.007518916856497526,
+ -0.005010381806641817,
+ -0.0037449360825121403,
+ -0.004001074004918337,
+ -0.0037657374050468206,
+ -0.0037060989998281,
+ -0.00406123511493206,
+ -0.003861584234982729,
+ -0.0035726726055145264,
+ -0.0033634149003773928
+ ],
+ "state_pred_error_per_layer": [
+ 16351.89453125,
+ 3139.08837890625,
+ 1824.6005859375,
+ 1391.949462890625,
+ 1295.1900634765625,
+ 1149.4605712890625,
+ 981.4422607421875,
+ 921.3729248046875,
+ 954.6389770507812,
+ 1032.970703125,
+ 1065.58984375,
+ 1272.3818359375
+ ],
+ "mean_state_pred_error": 2615.048344930013
+ },
+ "credit_bridge": {
+ "test_acc": 0.5585,
+ "mean_bp_cosine": 0.3251700059821208,
+ "mean_rho": 0.4226210874815782,
+ "mean_nudge_001": -0.0023732566623948514,
+ "mean_nudge_003": -0.007109481530884902,
+ "mean_nudge_01": -0.02357900080581506,
+ "bp_cosine_per_layer": [
+ 0.05994441360235214,
+ 0.19127817451953888,
+ 0.25874069333076477,
+ 0.31905949115753174,
+ 0.31442493200302124,
+ 0.3214789927005768,
+ 0.368133008480072,
+ 0.38988351821899414,
+ 0.4050426781177521,
+ 0.416469931602478,
+ 0.4253390431404114,
+ 0.4322451949119568
+ ],
+ "rho_per_layer": [
+ 0.1191493421792984,
+ 0.31643322110176086,
+ 0.4170604646205902,
+ 0.42330044507980347,
+ 0.4319503903388977,
+ 0.42732322216033936,
+ 0.46659332513809204,
+ 0.487338662147522,
+ 0.496512234210968,
+ 0.4787842035293579,
+ 0.5010949969291687,
+ 0.5059125423431396
+ ],
+ "nudge_per_layer": [
+ -0.015865826979279518,
+ -0.018151750788092613,
+ -0.021288521587848663,
+ -0.02352731302380562,
+ -0.023306310176849365,
+ -0.02329857647418976,
+ -0.025182321667671204,
+ -0.025520823895931244,
+ -0.026067661121487617,
+ -0.026535863056778908,
+ -0.027021951973438263,
+ -0.02718108892440796
+ ],
+ "final_value_loss": 0.3557061047077179,
+ "final_term_loss": 0.06590610226392746,
+ "final_bridge_loss": 0.010093027733266353,
+ "final_tgrad_loss": 0.2797069767475128
+ }
+ }
+} \ No newline at end of file