From 66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Sat, 13 Jun 2026 12:35:36 -0500 Subject: rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipeline Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 --- .../official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 research/flossing/official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv (limited to 'research/flossing/official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv') diff --git a/research/flossing/official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv b/research/flossing/official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv new file mode 100644 index 0000000..742ac68 --- /dev/null +++ b/research/flossing/official_gbs768_spectrum/headline_trm_multi4_dynamics_table.csv @@ -0,0 +1,4 @@ +model,step,full_exact,full_token_acc,lm_loss,dyn_sample_exact,lambda1_all,mean8_all,tail4_all,pos_count_all +TRM baseline best,58590,0.8686309456825256,0.9508475661277772,0.1155559569597244,0.875,0.02823458132615997,0.013457294571722192,0.0075273313675370546,7.841796875 +TRM multi4 best,35805,0.8964653611183167,0.9604493975639344,0.0945562794804573,0.900390625,0.020381716455975862,0.0065844104191477015,0.001402141885882835,3.841796875 +TRM multi4 final,65100,0.8350536823272705,0.9350366592407228,0.1547555029392242,0.82421875,0.03232463403946895,0.018508151198432188,0.013372940185377047,8.0 -- cgit v1.2.3