From 8b21fb32bf0997e3f4266c1c22414e49f1fdcfcc Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Mon, 30 Mar 2026 19:25:53 -0500 Subject: Add confirmatory paper experiments: A1-A4, all 10 seeds complete MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit A1: Synthetic nonlinearity ladder (240 rows: 3 alpha × 2 depth × 4 methods × 10 seeds) A2: CIFAR state-vs-credit counterexample (30 rows: 3 methods × 10 seeds) A3: Frozen vs online dissociation (60 rows: 2 regimes × 3 methods × 10 seeds) A4: Protocol dependence panel (82 rows: assembled from existing results) All experiments ran on GPU 3. Total runtime: ~20 hours. CSVs in results/confirmatory/. Co-Authored-By: Claude Opus 4.6 (1M context) --- results/confirmatory/A4_protocol_dependence.csv | 83 +++++++++++++++++++++++++ 1 file changed, 83 insertions(+) create mode 100644 results/confirmatory/A4_protocol_dependence.csv (limited to 'results/confirmatory/A4_protocol_dependence.csv') diff --git a/results/confirmatory/A4_protocol_dependence.csv b/results/confirmatory/A4_protocol_dependence.csv new file mode 100644 index 0000000..509e51f --- /dev/null +++ b/results/confirmatory/A4_protocol_dependence.csv @@ -0,0 +1,83 @@ +slice,method,metric,value +snapshot_exploit_ep100,dfa,gamma,0.008470005544950254 +snapshot_exploit_ep100,dfa,rho,-0.022525018197484314 +snapshot_exploit_ep100,dfa,nudge,-2.3932622525535407e-05 +snapshot_exploit_ep100,dfa,loss_before,1.1802499413490295 +snapshot_exploit_ep100,dfa,loss_after_1step,1.1798909544944762 +snapshot_exploit_ep100,dfa,delta_loss_1step,-0.00035898685455326707 +snapshot_exploit_ep100,dfa,delta_acc_1step,0.002343749999999978 +snapshot_exploit_ep100,scalar_cb,gamma,0.12223921716213226 +snapshot_exploit_ep100,scalar_cb,rho,0.09000759199261665 +snapshot_exploit_ep100,scalar_cb,nudge,-0.00036903251748299226 +snapshot_exploit_ep100,scalar_cb,loss_before,1.1802499413490295 +snapshot_exploit_ep100,scalar_cb,loss_after_1step,1.1835142850875855 +snapshot_exploit_ep100,scalar_cb,delta_loss_1step,0.003264343738555997 +snapshot_exploit_ep100,scalar_cb,delta_acc_1step,0.0007812499999999556 +snapshot_exploit_ep100,vec_eT_M4,gamma,0.37760399281978607 +snapshot_exploit_ep100,vec_eT_M4,rho,0.41141805797815323 +snapshot_exploit_ep100,vec_eT_M4,nudge,-0.0013705549063161016 +snapshot_exploit_ep100,vec_eT_M4,loss_before,1.1802499413490295 +snapshot_exploit_ep100,vec_eT_M4,loss_after_1step,1.1832772016525268 +snapshot_exploit_ep100,vec_eT_M4,delta_loss_1step,0.0030272603034973145 +snapshot_exploit_ep100,vec_eT_M4,delta_acc_1step,-0.0031250000000000444 +snapshot_exploit_ep100,oracle_bp,gamma,1.0 +snapshot_exploit_ep100,oracle_bp,rho,0.9979714304208755 +snapshot_exploit_ep100,oracle_bp,nudge,-0.0031722619314678013 +snapshot_exploit_ep100,oracle_bp,loss_before,1.1802499413490295 +snapshot_exploit_ep100,oracle_bp,loss_after_1step,1.1796290874481201 +snapshot_exploit_ep100,oracle_bp,delta_loss_1step,-0.0006208539009093794 +snapshot_exploit_ep100,oracle_bp,delta_acc_1step,0.005468750000000022 +snapshot_ep5,dfa,dl_held_1,6.842613220214844e-05 +snapshot_ep5,dfa,dl_same_1,-0.011249661445617676 +snapshot_ep5,dfa,dl_held_5,0.0032531023025512695 +snapshot_ep5,dfa,dl_same_5,-0.004767775535583496 +snapshot_ep5,vec_eT_M4,dl_held_1,-0.0002554655075073242 +snapshot_ep5,vec_eT_M4,dl_same_1,-0.011568784713745117 +snapshot_ep5,vec_eT_M4,dl_held_5,-0.005142092704772949 +snapshot_ep5,vec_eT_M4,dl_same_5,-0.007385373115539551 +snapshot_ep5,oracle_bp,dl_held_1,-0.0002244710922241211 +snapshot_ep5,oracle_bp,dl_same_1,-0.011359930038452148 +snapshot_ep5,oracle_bp,dl_held_5,-0.008973956108093262 +snapshot_ep5,oracle_bp,dl_same_5,-0.008551597595214844 +snapshot_ep20,dfa,dl_held_1,0.0006439685821533203 +snapshot_ep20,dfa,dl_same_1,-0.0050983428955078125 +snapshot_ep20,dfa,dl_held_5,0.0009417533874511719 +snapshot_ep20,dfa,dl_same_5,-0.001807570457458496 +snapshot_ep20,vec_eT_M4,dl_held_1,4.982948303222656e-05 +snapshot_ep20,vec_eT_M4,dl_same_1,-0.005342721939086914 +snapshot_ep20,vec_eT_M4,dl_held_5,0.0015401840209960938 +snapshot_ep20,vec_eT_M4,dl_same_5,-0.00039839744567871094 +snapshot_ep20,oracle_bp,dl_held_1,6.651878356933594e-05 +snapshot_ep20,oracle_bp,dl_same_1,-0.004968762397766113 +snapshot_ep20,oracle_bp,dl_held_5,0.0003821849822998047 +snapshot_ep20,oracle_bp,dl_same_5,-0.0005745887756347656 +scaffold_3seed,dfa,final_mean,0.30593333333333333 +scaffold_3seed,dfa,final_std,0.006104825049818285 +scaffold_3seed,dfa,acc20_mean,0.30383333333333334 +scaffold_3seed,dfa,acc20_std,0.007825741001478518 +scaffold_3seed,perlayer,final_mean,0.30396666666666666 +scaffold_3seed,perlayer,final_std,0.006049977043115317 +scaffold_3seed,perlayer,acc20_mean,0.2874666666666667 +scaffold_3seed,perlayer,acc20_std,0.011382540235914942 +scaffold_3seed,vec,final_mean,0.3133333333333333 +scaffold_3seed,vec,final_std,0.007196912918436331 +scaffold_3seed,vec,acc20_mean,0.30333333333333334 +scaffold_3seed,vec,acc20_std,0.007024401912065005 +online_3seed,dfa_s42,test_acc,0.3116 +online_3seed,dfa_s42,mean_gamma,0.10076353600015864 +online_3seed,dfa_s42,mean_rho,-0.00476757250726223 +online_3seed,cb_eT_s42,test_acc,0.283 +online_3seed,cb_eT_s42,mean_gamma,0.17921950668096542 +online_3seed,cb_eT_s42,mean_rho,0.008699589408934116 +online_3seed,dfa_s123,test_acc,0.3106 +online_3seed,dfa_s123,mean_gamma,0.11738517042249441 +online_3seed,dfa_s123,mean_rho,0.005885639227926731 +online_3seed,cb_eT_s123,test_acc,0.2753 +online_3seed,cb_eT_s123,mean_gamma,0.17617796920239925 +online_3seed,cb_eT_s123,mean_rho,0.0019302130676805973 +online_3seed,dfa_s456,test_acc,0.297 +online_3seed,dfa_s456,mean_gamma,0.09892195643624291 +online_3seed,dfa_s456,mean_rho,-0.004888533148914576 +online_3seed,cb_eT_s456,test_acc,0.2893 +online_3seed,cb_eT_s456,mean_gamma,0.23417379707098007 +online_3seed,cb_eT_s456,mean_rho,-0.002338360995054245 -- cgit v1.2.3