From 8b78fbb1308d31bedd74f4b1deb250f5e684a6d3 Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Tue, 31 Mar 2026 22:18:32 -0500 Subject: Update naive StateErr v3: L2 norm ratio formula, with checkpoints saved MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Formula: ||h_{L//2} - h_L||_2 / ||h_L||_2 (scalar L2 ratio) A1: 240 rows (3 alpha × 2 depth × 4 methods × 10 seeds) A2: 40 rows (4 methods including BP × 10 seeds) All model checkpoints saved in checkpoints_A1/ and checkpoints_A2/ Co-Authored-By: Claude Opus 4.6 (1M context) --- results/confirmatory/A2_naive_state_err.csv | 80 ++++++++++++++--------------- 1 file changed, 40 insertions(+), 40 deletions(-) (limited to 'results/confirmatory/A2_naive_state_err.csv') diff --git a/results/confirmatory/A2_naive_state_err.csv b/results/confirmatory/A2_naive_state_err.csv index 905d1c2..5a7dedd 100644 --- a/results/confirmatory/A2_naive_state_err.csv +++ b/results/confirmatory/A2_naive_state_err.csv @@ -1,41 +1,41 @@ method,seed,naive_StateErr -dfa,42,0.8608599968910218 -state_bridge,42,1.1073074493408204 -credit_bridge,42,0.18549979393482208 -dfa,123,0.6620678688049316 -state_bridge,123,1.157683981513977 -credit_bridge,123,0.5449653492927551 -dfa,456,0.862576175403595 -state_bridge,456,0.5174413678169251 -credit_bridge,456,0.02991231045126915 -dfa,789,0.5742178151130676 -state_bridge,789,0.32427600870132445 -credit_bridge,789,0.34830747079849245 -dfa,1024,0.7317259416580201 -state_bridge,1024,1.1036756999969481 -credit_bridge,1024,0.5166968782424927 -dfa,2048,0.29954994792938233 -state_bridge,2048,0.4312982501029968 -credit_bridge,2048,0.8699032402038575 -dfa,3000,0.7138990812301635 -state_bridge,3000,0.08414710862636567 -credit_bridge,3000,0.07805714750289917 -dfa,4000,0.6306101009368896 -state_bridge,4000,0.9965199737548828 -credit_bridge,4000,0.4791879728317261 -dfa,5000,0.9650134473800659 -state_bridge,5000,0.9529169537544251 -credit_bridge,5000,0.6871149513244629 -dfa,6000,0.8224315113067627 -state_bridge,6000,0.14781150970458984 -credit_bridge,6000,0.5449538031578064 -bp,42,12270.6220625 -bp,123,11526.486759375 -bp,456,11941.3817234375 -bp,789,12075.4278453125 -bp,1024,11724.9296015625 -bp,2048,11844.94355 -bp,3000,10728.462175 -bp,4000,12229.952775 -bp,5000,10800.38535 -bp,6000,11821.658378125 +bp,42,0.5055088927268981 +dfa,42,0.9277795883178711 +state_bridge,42,1.0522792560577392 +credit_bridge,42,0.4304226595401764 +bp,123,0.48196040391921996 +dfa,123,0.8118253867149353 +state_bridge,123,1.074320799636841 +credit_bridge,123,0.7168932020187377 +bp,456,0.5040699287414551 +dfa,456,0.9287333112716675 +state_bridge,456,0.7177199237823486 +credit_bridge,456,0.1727201170682907 +bp,789,0.49838844504356383 +dfa,789,0.757287864780426 +state_bridge,789,0.5485553059577942 +credit_bridge,789,0.5861995733261108 +bp,1024,0.48747658252716064 +dfa,1024,0.8549048913955688 +state_bridge,1024,1.0501901695251465 +credit_bridge,1024,0.7178753211975097 +bp,2048,0.5092790686607361 +dfa,2048,0.5471531904220581 +state_bridge,2048,0.6565892428398132 +credit_bridge,2048,0.9323275475502014 +bp,3000,0.4684532221794128 +dfa,3000,0.8445726726531982 +state_bridge,3000,0.2893164021015167 +credit_bridge,3000,0.2710479733943939 +bp,4000,0.5021170521736145 +dfa,4000,0.7929723978042602 +state_bridge,4000,0.996940908241272 +credit_bridge,4000,0.6836131464004517 +bp,5000,0.4780992596626282 +dfa,5000,0.9823324444770813 +state_bridge,5000,0.973629965686798 +credit_bridge,5000,0.8286034298896789 +bp,6000,0.5065476115226746 +dfa,6000,0.9064758165359497 +state_bridge,6000,0.3835857294559479 +credit_bridge,6000,0.7299125791549682 -- cgit v1.2.3