summaryrefslogtreecommitdiff
path: root/research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
committerYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
commit66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch)
treec29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv
rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipelineHEADmain
Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv')
-rw-r--r--research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv25
1 files changed, 25 insertions, 0 deletions
diff --git a/research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv b/research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv
new file mode 100644
index 0000000..5e1db0a
--- /dev/null
+++ b/research/flossing/directional_lyap_perturb/trm_baseline_best_step58590_n1000_c8_dirlyap.summary.csv
@@ -0,0 +1,25 @@
+label,perturb_after,sigma,n_samples,candidates,fd_eps,ckpt_root,ckpt_name,clean_acc,mean_sign_exact,mean_sign_token_acc,worst_sign_exact,best_sign_exact,selected_growth_mean,selected_growth_q90,retain_mean_on_clean_success,retain_worst_on_clean_success,rescue_mean_on_clean_fail,rescue_best_on_clean_fail
+trm_baseline_best,0,0.0,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8579999804496765,0.9472222328186035,0.8579999804496765,0.8579999804496765,-3.885612726211548,-3.8856122493743896,1.0,1.0,0.0,0.0
+trm_baseline_best,0,0.001,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8579999804496765,0.9472222328186035,0.8579999804496765,0.8579999804496765,-3.885612726211548,-3.8856122493743896,1.0,1.0,0.0,0.0
+trm_baseline_best,0,0.003,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8535000085830688,0.9457222819328308,0.8289999961853027,0.878000020980835,-3.885612726211548,-3.8856122493743896,0.9825174808502197,0.9650349617004395,0.07394365966320038,0.14084507524967194
+trm_baseline_best,0,0.01,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8615000247955322,0.9481049180030823,0.8240000009536743,0.8989999890327454,-3.885612726211548,-3.8856122493743896,0.9603729844093323,0.9382284283638,0.26408451795578003,0.39436620473861694
+trm_baseline_best,0,0.03,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8560000061988831,0.9467840790748596,0.8119999766349792,0.8999999761581421,-3.885612726211548,-3.8856122493743896,0.9545454382896423,0.9219114184379578,0.26056337356567383,0.3732394278049469
+trm_baseline_best,0,0.1,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8579999804496765,0.8619999885559082,0.9479444622993469,0.8240000009536743,0.8999999761581421,-3.885612726211548,-3.8856122493743896,0.9586247205734253,0.939393937587738,0.27816900610923767,0.42957746982574463
+trm_baseline_best,4,0.0,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8489999771118164,0.9435185194015503,0.8489999771118164,0.8489999771118164,-1.2879749536514282,0.8905364871025085,1.0,1.0,0.0,0.0
+trm_baseline_best,4,0.001,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8510000109672546,0.944135844707489,0.8379999995231628,0.8640000224113464,-1.2879749536514282,0.8905364871025085,0.9929328560829163,0.9858657121658325,0.05298013240098953,0.09933774918317795
+trm_baseline_best,4,0.003,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8554999828338623,0.9452839493751526,0.8270000219345093,0.8840000033378601,-1.2879749536514282,0.8905364871025085,0.9734982252120972,0.9611307382583618,0.19205297529697418,0.3112582862377167
+trm_baseline_best,4,0.01,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8565000295639038,0.9460123181343079,0.828000009059906,0.8849999904632568,-1.2879749536514282,0.8905364871025085,0.9723203778266907,0.9587750434875488,0.20529800653457642,0.3178808093070984
+trm_baseline_best,4,0.03,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8560000061988831,0.9458826184272766,0.828000009059906,0.8840000033378601,-1.2879749536514282,0.8905364871025085,0.9699646830558777,0.9564192891120911,0.215231791138649,0.3245033025741577
+trm_baseline_best,4,0.1,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8489999771118164,0.8550000190734863,0.9454135894775391,0.8289999961853027,0.8809999823570251,-1.2879749536514282,0.8905364871025085,0.9699646830558777,0.9552414417266846,0.20860926806926727,0.29801324009895325
+trm_baseline_best,8,0.0,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8539999723434448,0.9449505805969238,0.8539999723434448,0.8539999723434448,-1.811623215675354,1.4589354991912842,1.0,1.0,0.0,0.0
+trm_baseline_best,8,0.001,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8544999957084656,0.9452963471412659,0.8429999947547913,0.8659999966621399,-1.811623215675354,1.4589354991912842,0.993559718132019,0.9871194362640381,0.04109589010477066,0.08219178020954132
+trm_baseline_best,8,0.003,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8600000143051147,0.9476419687271118,0.8420000076293945,0.878000020980835,-1.811623215675354,1.4589354991912842,0.983021080493927,0.976580798625946,0.14041095972061157,0.22602739930152893
+trm_baseline_best,8,0.01,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8544999957084656,0.9457098245620728,0.8320000171661377,0.8769999742507935,-1.811623215675354,1.4589354991912842,0.9783372282981873,0.966042160987854,0.13013698160648346,0.21232876181602478
+trm_baseline_best,8,0.03,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8529999852180481,0.9448826909065247,0.8360000252723694,0.8700000047683716,-1.811623215675354,1.4589354991912842,0.9783372282981873,0.9695550203323364,0.11986301094293594,0.18493150174617767
+trm_baseline_best,8,0.1,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8539999723434448,0.8544999957084656,0.9452345371246338,0.8379999995231628,0.8709999918937683,-1.811623215675354,1.4589354991912842,0.9800936579704285,0.9730679392814636,0.11986301094293594,0.19178082048892975
+trm_baseline_best,12,0.0,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8550000190734863,0.9453826546669006,0.8550000190734863,0.8550000190734863,-3.6991007328033447,2.8621342182159424,1.0,1.0,0.0,0.0
+trm_baseline_best,12,0.001,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8525000214576721,0.944302499294281,0.847000002861023,0.8579999804496765,-3.6991007328033447,2.8621342182159424,0.9947368502616882,0.9906432628631592,0.013793103396892548,0.027586206793785095
+trm_baseline_best,12,0.003,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8519999980926514,0.9443457126617432,0.8429999947547913,0.8610000014305115,-3.6991007328033447,2.8621342182159424,0.988304078578949,0.984795331954956,0.04827586188912392,0.08965517580509186
+trm_baseline_best,12,0.01,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8489999771118164,0.9430555105209351,0.8460000157356262,0.8519999980926514,-3.6991007328033447,2.8621342182159424,0.988304078578949,0.9871345162391663,0.027586206793785095,0.04137931019067764
+trm_baseline_best,12,0.03,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8554999828338623,0.945648193359375,0.8479999899864197,0.8629999756813049,-3.6991007328033447,2.8621342182159424,0.9888888597488403,0.9859648942947388,0.06896551698446274,0.1034482792019844
+trm_baseline_best,12,0.1,1000,8,0.001,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8550000190734863,0.8500000238418579,0.9435864090919495,0.8460000157356262,0.8539999723434448,-3.6991007328033447,2.8621342182159424,0.988304078578949,0.9871345162391663,0.03448275849223137,0.05517241358757019