diff options
| author | YurenHao0426 <Blackhao0426@gmail.com> | 2026-03-23 19:46:08 -0500 |
|---|---|---|
| committer | YurenHao0426 <Blackhao0426@gmail.com> | 2026-03-23 19:46:08 -0500 |
| commit | 32123cb36ae9521f60c9b6f67458b931b6540ef2 (patch) | |
| tree | 4731e1dc513f5b613f80c4d20fc4114044c266d3 /results/toy_lq_frozen | |
| parent | bbb1a36d67f2f0c83106c1e771ea2c2fcb7fd83a (diff) | |
Add final report, plots, experiment guide, and complete NOTE.md
All experiments complete:
- Toy LQ: credit bridge matches state bridge (~0.94 costate cosine)
- CIFAR-10: credit bridge (29.6%) comparable to DFA (30.0%), both beat state bridge (18.5%)
- State bridge confirms core hypothesis: perfect state prediction != useful credit
- Terminal gradient matching is essential for credit bridge
Diffstat (limited to 'results/toy_lq_frozen')
3 files changed, 798 insertions, 0 deletions
diff --git a/results/toy_lq_frozen/toy_lq_v2_seed123_lam0.1_sig0.1_tgw1.0_fm0.0.json b/results/toy_lq_frozen/toy_lq_v2_seed123_lam0.1_sig0.1_tgw1.0_fm0.0.json new file mode 100644 index 0000000..50eed4c --- /dev/null +++ b/results/toy_lq_frozen/toy_lq_v2_seed123_lam0.1_sig0.1_tgw1.0_fm0.0.json @@ -0,0 +1,266 @@ +{ + "config": { + "d_hidden": 64, + "output_dim": 10, + "num_layers": 12, + "sigma": 0.03, + "batch_size": 256, + "num_steps": 8000, + "lr_fb": 0.001, + "lam": 0.1, + "K": 8, + "ema_momentum": 0.995, + "sigma_bridge": 0.1, + "eval_every": 2000, + "seed": 123, + "gpu": 0, + "output_dir": "results/toy_lq_frozen", + "vnet_hidden": 256, + "vnet_layers": 3, + "term_grad_weight": 1.0, + "fm_weight": 0.0 + }, + "log": { + "steps": [ + 1, + 2000, + 4000, + 6000, + 8000 + ], + "dfa_costate_cos": [ + 0.0061469420325011015, + 0.005306758529817064, + 0.0032278880632172027, + 0.010428216774016619, + 0.005160536073769133 + ], + "state_costate_cos": [ + 0.04923563698927561, + 0.9359788099924723, + 0.93496473133564, + 0.9391002754370371, + 0.9422274927298228 + ], + "credit_costate_cos": [ + 0.005350367398932576, + 0.9094806561867396, + 0.933747818072637, + 0.939527784784635, + 0.9428367614746094 + ], + "dfa_rho": [ + 0.014851124413932363, + -0.0009741405956447124, + 0.010637809444839755, + 0.01579231140203774, + 0.0006830055887500445 + ], + "state_rho": [ + 0.05303209243963162, + 0.9233627518018087, + 0.9250594973564148, + 0.9248303671677908, + 0.9291473726431528 + ], + "credit_rho": [ + 8.900166722014546e-05, + 0.8767146865526835, + 0.9206246634324392, + 0.9250840544700623, + 0.9295186003049215 + ], + "dfa_nudge": [ + -0.0020856610499322414, + -0.0016959290175388257, + -0.0004252120852470398, + -0.00336669214690725, + -0.0014625868449608486 + ], + "state_nudge": [ + -0.017791483240822952, + -0.32088013738393784, + -0.3230740974346797, + -0.318187120060126, + -0.324822299182415 + ], + "credit_nudge": [ + -0.0004618208234508832, + -0.31195973853270215, + -0.3216395452618599, + -0.3171723609169324, + -0.3237730637192726 + ], + "bridge_residual": [], + "state_bridge_loss": [ + 1.0102367401123047, + 0.029022935777902603, + 0.031384147703647614, + 0.02959899604320526, + 0.031896352767944336 + ], + "credit_bridge_loss": [ + 129.2601776123047, + 8.807141304016113, + 8.771026611328125, + 7.9213643074035645, + 8.751266479492188 + ], + "term_loss": [ + 109.68403625488281, + 4.207324028015137, + 4.038488388061523, + 3.279881477355957, + 3.9708642959594727 + ], + "bridge_loss": [ + 5.943464884694549e-07, + 0.11741068214178085, + 0.08691056072711945, + 0.10882671922445297, + 0.12579748034477234 + ], + "term_grad_loss": [ + 19.57614517211914, + 4.4824066162109375, + 4.645627975463867, + 4.532656192779541, + 4.654605388641357 + ], + "fm_loss": [ + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "final_per_layer": { + "dfa_costate_cos": [ + 0.04813992977142334, + -0.042106956243515015, + 0.004819205962121487, + 0.06406223028898239, + 0.027982598170638084, + -0.024616792798042297, + 0.03184102475643158, + -0.03284747526049614, + -0.031094228848814964, + -0.04093015938997269, + 0.012475000694394112, + 0.0442020557820797 + ], + "state_costate_cos": [ + 0.9390542507171631, + 0.9402485489845276, + 0.9412673711776733, + 0.9416499137878418, + 0.9424928426742554, + 0.9428901672363281, + 0.9427830576896667, + 0.9428685903549194, + 0.9430990219116211, + 0.9434692859649658, + 0.9433966875076294, + 0.9435101747512817 + ], + "credit_costate_cos": [ + 0.9391632676124573, + 0.9400047659873962, + 0.9408236742019653, + 0.9413831233978271, + 0.9420697689056396, + 0.942909836769104, + 0.9431338906288147, + 0.943551778793335, + 0.9441136121749878, + 0.9448702335357666, + 0.9456644654273987, + 0.9463527202606201 + ], + "dfa_rho": [ + 0.0134794432669878, + -0.042476922273635864, + 0.04209040105342865, + 0.06388744711875916, + -0.012325622141361237, + -0.025234051048755646, + -0.020182523876428604, + -0.02071167342364788, + -0.049487367272377014, + -0.05043957754969597, + 0.04616815596818924, + 0.0634283572435379 + ], + "state_rho": [ + 0.9241164922714233, + 0.9311657547950745, + 0.926814079284668, + 0.9336568117141724, + 0.9266120791435242, + 0.9352933764457703, + 0.9264969825744629, + 0.9290511012077332, + 0.9249886870384216, + 0.9313560128211975, + 0.9301149845123291, + 0.9301021099090576 + ], + "credit_rho": [ + 0.9276995658874512, + 0.9273138046264648, + 0.9248120784759521, + 0.9268039464950562, + 0.92667555809021, + 0.9278458952903748, + 0.9272637367248535, + 0.9345529079437256, + 0.9366906881332397, + 0.9292744398117065, + 0.9313026070594788, + 0.9339879751205444 + ], + "dfa_nudge": [ + -0.017539501190185547, + 0.01593128778040409, + -0.0030720066279172897, + -0.020152313634753227, + -0.009087346494197845, + 0.007799159735441208, + -0.010878749191761017, + 0.013225046917796135, + 0.011669810861349106, + 0.017475932836532593, + -0.006174879148602486, + -0.016747483983635902 + ], + "state_nudge": [ + -0.32301613688468933, + -0.3241724371910095, + -0.32460731267929077, + -0.32475656270980835, + -0.325019896030426, + -0.3253987431526184, + -0.32468554377555847, + -0.3243948817253113, + -0.3248230516910553, + -0.32554829120635986, + -0.3256106674671173, + -0.3258340656757355 + ], + "credit_nudge": [ + -0.32093775272369385, + -0.32208389043807983, + -0.32268720865249634, + -0.3229762613773346, + -0.3233621120452881, + -0.324078768491745, + -0.32360684871673584, + -0.32358717918395996, + -0.3243335783481598, + -0.32536792755126953, + -0.3258592486381531, + -0.32639598846435547 + ] + } +}
\ No newline at end of file diff --git a/results/toy_lq_frozen/toy_lq_v2_seed42_lam0.1_sig0.1_tgw1.0_fm0.0.json b/results/toy_lq_frozen/toy_lq_v2_seed42_lam0.1_sig0.1_tgw1.0_fm0.0.json new file mode 100644 index 0000000..bbcd5c4 --- /dev/null +++ b/results/toy_lq_frozen/toy_lq_v2_seed42_lam0.1_sig0.1_tgw1.0_fm0.0.json @@ -0,0 +1,266 @@ +{ + "config": { + "d_hidden": 64, + "output_dim": 10, + "num_layers": 12, + "sigma": 0.03, + "batch_size": 256, + "num_steps": 8000, + "lr_fb": 0.001, + "lam": 0.1, + "K": 8, + "ema_momentum": 0.995, + "sigma_bridge": 0.1, + "eval_every": 2000, + "seed": 42, + "gpu": 0, + "output_dir": "results/toy_lq_frozen", + "vnet_hidden": 256, + "vnet_layers": 3, + "term_grad_weight": 1.0, + "fm_weight": 0.0 + }, + "log": { + "steps": [ + 1, + 2000, + 4000, + 6000, + 8000 + ], + "dfa_costate_cos": [ + 0.001022340264171362, + 0.001144224622597297, + 0.0035498210539420447, + 0.0025704174380128584, + 0.0012041970621794462 + ], + "state_costate_cos": [ + 0.009041048353537917, + 0.9367498010396957, + 0.9443944742282232, + 0.9488719999790192, + 0.9465398589769999 + ], + "credit_costate_cos": [ + 0.024892715892444055, + 0.9009914000829061, + 0.9385832945505778, + 0.947337324420611, + 0.9453924099604288 + ], + "dfa_rho": [ + 0.015879416760678094, + 0.003749566695963343, + 0.0025427089616035423, + 0.0041017483454197645, + -0.006658251901778082 + ], + "state_rho": [ + 0.0029661240599428615, + 0.9205784201622009, + 0.9331746151049932, + 0.9367670218149821, + 0.9348721752564112 + ], + "credit_rho": [ + 0.02234963719577839, + 0.8549301077922186, + 0.9257398645083109, + 0.9335627655188242, + 0.9330280274152756 + ], + "dfa_nudge": [ + -0.0003799900102118651, + -0.0001569713931530714, + -0.0012285423775513966, + -0.00047482581188281375, + -0.0003635381193210681 + ], + "state_nudge": [ + -0.002246703254058957, + -0.3365800951917966, + -0.3378218387564023, + -0.34102949251731235, + -0.3362140009800593 + ], + "credit_nudge": [ + -0.0079942528779308, + -0.32416996111472446, + -0.3345658630132675, + -0.3391987532377243, + -0.33437975496053696 + ], + "bridge_residual": [], + "state_bridge_loss": [ + 1.0073249340057373, + 0.03208087012171745, + 0.02979956567287445, + 0.03251900523900986, + 0.03256681188941002 + ], + "credit_bridge_loss": [ + 132.09298706054688, + 10.374980926513672, + 10.61994743347168, + 10.229816436767578, + 9.931343078613281 + ], + "term_loss": [ + 111.63633728027344, + 5.137801647186279, + 5.388574600219727, + 5.321071147918701, + 4.950850486755371 + ], + "bridge_loss": [ + 6.45359421014291e-07, + 0.2699485719203949, + 0.12590564787387848, + 0.13655179738998413, + 0.15239471197128296 + ], + "term_grad_loss": [ + 20.456655502319336, + 4.967230796813965, + 5.105466842651367, + 4.772193431854248, + 4.828097343444824 + ], + "fm_loss": [ + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "final_per_layer": { + "dfa_costate_cos": [ + -0.053928110748529434, + -0.03558344021439552, + -0.002497725188732147, + -0.025605209171772003, + -0.0015886849723756313, + -0.004757361486554146, + 0.038880251348018646, + 0.04505593329668045, + 0.044440463185310364, + 0.049856118857860565, + -0.036305028945207596, + -0.0035168412141501904 + ], + "state_costate_cos": [ + 0.943811297416687, + 0.9446508884429932, + 0.9451277256011963, + 0.9456416368484497, + 0.9462511539459229, + 0.9469271898269653, + 0.9473466873168945, + 0.947996973991394, + 0.9481196999549866, + 0.9477524757385254, + 0.9474242925643921, + 0.947428286075592 + ], + "credit_costate_cos": [ + 0.941976010799408, + 0.9424219727516174, + 0.94321209192276, + 0.9437947273254395, + 0.9448409080505371, + 0.9454640746116638, + 0.9459144473075867, + 0.9465770721435547, + 0.9470815062522888, + 0.9474484920501709, + 0.947708010673523, + 0.9482696056365967 + ], + "dfa_rho": [ + -0.04425683990120888, + -0.06072389334440231, + -0.02133849635720253, + -0.009745828807353973, + 0.012875140644609928, + -0.06230748072266579, + -0.011334436014294624, + 0.06567166745662689, + 0.05127769336104393, + 0.02585187926888466, + -0.02806694805622101, + 0.0021985196508467197 + ], + "state_rho": [ + 0.9318734407424927, + 0.9358463883399963, + 0.9371962547302246, + 0.932350754737854, + 0.9360877871513367, + 0.9400110840797424, + 0.9344450235366821, + 0.9253479242324829, + 0.9369418621063232, + 0.9354310035705566, + 0.9379286170005798, + 0.9350059628486633 + ], + "credit_rho": [ + 0.925601065158844, + 0.9282341599464417, + 0.9294254779815674, + 0.9282456040382385, + 0.9352800846099854, + 0.9381647109985352, + 0.9306818246841431, + 0.9283095598220825, + 0.9359391331672668, + 0.9364811182022095, + 0.940323531627655, + 0.9396500587463379 + ], + "dfa_nudge": [ + 0.018354831263422966, + 0.012472891248762608, + 0.0010786037892103195, + 0.008631331846117973, + -0.000161781907081604, + 0.0025226473808288574, + -0.013589534908533096, + -0.017021682113409042, + -0.01592499390244484, + -0.017948923632502556, + 0.015213390812277794, + 0.0020107626914978027 + ], + "state_nudge": [ + -0.3381166160106659, + -0.33782684803009033, + -0.33681023120880127, + -0.3365652561187744, + -0.3364033102989197, + -0.336093544960022, + -0.33575671911239624, + -0.3358075022697449, + -0.33578699827194214, + -0.3356783986091614, + -0.3347625136375427, + -0.33496007323265076 + ], + "credit_nudge": [ + -0.3348296880722046, + -0.33472180366516113, + -0.33402615785598755, + -0.3340165615081787, + -0.33416393399238586, + -0.33410122990608215, + -0.33391931653022766, + -0.3341727554798126, + -0.334547221660614, + -0.33483123779296875, + -0.3342774510383606, + -0.33494970202445984 + ] + } +}
\ No newline at end of file diff --git a/results/toy_lq_frozen/toy_lq_v2_seed456_lam0.1_sig0.1_tgw1.0_fm0.0.json b/results/toy_lq_frozen/toy_lq_v2_seed456_lam0.1_sig0.1_tgw1.0_fm0.0.json new file mode 100644 index 0000000..7684971 --- /dev/null +++ b/results/toy_lq_frozen/toy_lq_v2_seed456_lam0.1_sig0.1_tgw1.0_fm0.0.json @@ -0,0 +1,266 @@ +{ + "config": { + "d_hidden": 64, + "output_dim": 10, + "num_layers": 12, + "sigma": 0.03, + "batch_size": 256, + "num_steps": 8000, + "lr_fb": 0.001, + "lam": 0.1, + "K": 8, + "ema_momentum": 0.995, + "sigma_bridge": 0.1, + "eval_every": 2000, + "seed": 456, + "gpu": 0, + "output_dir": "results/toy_lq_frozen", + "vnet_hidden": 256, + "vnet_layers": 3, + "term_grad_weight": 1.0, + "fm_weight": 0.0 + }, + "log": { + "steps": [ + 1, + 2000, + 4000, + 6000, + 8000 + ], + "dfa_costate_cos": [ + -0.008305357536301017, + -0.008392414000506202, + -0.0038773335108999163, + -0.005692236203079422, + -0.0027285031198213496 + ], + "state_costate_cos": [ + 0.010795300283158818, + 0.9460556507110596, + 0.9393202712138494, + 0.9483461380004883, + 0.9449077347914377 + ], + "credit_costate_cos": [ + 0.010942678588132063, + 0.9265013436476389, + 0.9366317639748255, + 0.947089821100235, + 0.9429272959629694 + ], + "dfa_rho": [ + -0.0028248391657446823, + -0.0069896553953488665, + 0.006519075793524583, + -0.0016956791902581851, + 0.009361718820097545 + ], + "state_rho": [ + 0.02673721546307206, + 0.9346788177887598, + 0.9264062345027924, + 0.9364438454310099, + 0.928318440914154 + ], + "credit_rho": [ + 0.015292729716748, + 0.8930107355117798, + 0.9212059676647186, + 0.9316875636577606, + 0.9271238495906194 + ], + "dfa_nudge": [ + 0.004384364855165283, + 0.004451872392868002, + 0.0023875126304725804, + 0.0029402777242163816, + 0.0018359140182534854 + ], + "state_nudge": [ + -0.005124294043829043, + -0.34853988885879517, + -0.36369936913251877, + -0.3535121629635493, + -0.3701842874288559 + ], + "credit_nudge": [ + -0.003232262640570601, + -0.3407190019885699, + -0.36137687663237256, + -0.35145895431439084, + -0.3679164672891299 + ], + "bridge_residual": [], + "state_bridge_loss": [ + 1.0078721046447754, + 0.029677797108888626, + 0.03204238414764404, + 0.0327574647963047, + 0.033611781895160675 + ], + "credit_bridge_loss": [ + 158.73072814941406, + 11.051497459411621, + 9.754555702209473, + 10.701624870300293, + 9.23304557800293 + ], + "term_loss": [ + 132.93673706054688, + 5.0680437088012695, + 4.583424091339111, + 5.3644843101501465, + 4.062508583068848 + ], + "bridge_loss": [ + 7.166463547036983e-07, + 0.25247713923454285, + 0.14709019660949707, + 0.1511959433555603, + 0.12251871824264526 + ], + "term_grad_loss": [ + 25.793991088867188, + 5.730976581573486, + 5.024041175842285, + 5.185944557189941, + 5.048018932342529 + ], + "fm_loss": [ + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "final_per_layer": { + "dfa_costate_cos": [ + 0.005115414969623089, + -0.0511106476187706, + 0.026345418766140938, + -0.06129831820726395, + 0.023028161376714706, + 0.043917812407016754, + -0.02071939967572689, + 0.020611021667718887, + -0.025742489844560623, + -0.052854984998703, + 0.004462959244847298, + 0.05550301447510719 + ], + "state_costate_cos": [ + 0.9431805610656738, + 0.9437761306762695, + 0.9443435072898865, + 0.9446961879730225, + 0.9448176622390747, + 0.9449890851974487, + 0.945353627204895, + 0.9453505277633667, + 0.9454029202461243, + 0.9456251859664917, + 0.945793867111206, + 0.945563554763794 + ], + "credit_costate_cos": [ + 0.9382357001304626, + 0.9392683506011963, + 0.9404538869857788, + 0.9414603114128113, + 0.9420560598373413, + 0.9428950548171997, + 0.9436970353126526, + 0.9444013833999634, + 0.9445676803588867, + 0.9454110860824585, + 0.9460842609405518, + 0.9465967416763306 + ], + "dfa_rho": [ + 0.0005743983201682568, + -0.06480635702610016, + 0.04855071008205414, + -0.09910713136196136, + 0.0678277313709259, + 0.07211608439683914, + -0.024130607023835182, + 0.001894976943731308, + -0.009040179662406445, + -0.02709592692553997, + 0.047522202134132385, + 0.09803472459316254 + ], + "state_rho": [ + 0.9245786666870117, + 0.9240697026252747, + 0.9293171167373657, + 0.9301248788833618, + 0.9324039220809937, + 0.9262233376502991, + 0.9288182854652405, + 0.9328013062477112, + 0.926672101020813, + 0.928871750831604, + 0.9281368255615234, + 0.9278033971786499 + ], + "credit_rho": [ + 0.9264800548553467, + 0.9184226989746094, + 0.9257187247276306, + 0.9245353937149048, + 0.9274380803108215, + 0.9219262599945068, + 0.9251310229301453, + 0.9257712960243225, + 0.9327481985092163, + 0.9326720833778381, + 0.9336825013160706, + 0.9309598803520203 + ], + "dfa_nudge": [ + -0.0008005127310752869, + 0.01917375810444355, + -0.009830990806221962, + 0.02491075173020363, + -0.007071066647768021, + -0.017435496672987938, + 0.009654557332396507, + -0.005623402073979378, + 0.01048743724822998, + 0.022874275222420692, + -0.0009297188371419907, + -0.02337862364947796 + ], + "state_nudge": [ + -0.3704739809036255, + -0.3704678416252136, + -0.36917200684547424, + -0.36994534730911255, + -0.3694732189178467, + -0.37023210525512695, + -0.3705016076564789, + -0.37048155069351196, + -0.36992865800857544, + -0.37050265073776245, + -0.37076336145401, + -0.37026911973953247 + ], + "credit_nudge": [ + -0.3661743402481079, + -0.3663756549358368, + -0.3655211329460144, + -0.3667157292366028, + -0.3666227161884308, + -0.36782804131507874, + -0.36846989393234253, + -0.3688392639160156, + -0.3685477077960968, + -0.36957746744155884, + -0.37019991874694824, + -0.37012574076652527 + ] + } +}
\ No newline at end of file |
