diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-13 12:35:36 -0500 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-13 12:35:36 -0500 |
| commit | 66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch) | |
| tree | c29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json | |
Curated export for clone-and-run Maze training (2x A6000) + diagnostics.
trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible).
Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md.
Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json')
| -rw-r--r-- | research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json | 105 |
1 files changed, 105 insertions, 0 deletions
diff --git a/research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json b/research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json new file mode 100644 index 0000000..3b11879 --- /dev/null +++ b/research/flossing/analysis_2x2/results_trm_singleGPU_step260410_n512.json @@ -0,0 +1,105 @@ +{ + "npz": "/home/yurenh2/rrm/research/flossing/diag_trm_singleGPU_step260410_512.npz", + "n": 512, + "exact_acc": 0.76953125, + "late_drift_def": "mean(drift_zH[:, -4:])", + "otsu_tau_log10": 1.406412158338842, + "frac_converged": 0.748046875, + "cells": { + "A_conv_correct": { + "n": 383, + "lam1_median": 0.004744160454720259, + "lam1_mean": 0.01041777972714804, + "lam1_iqr": [ + 0.0007444327347911894, + 0.013659899588674307 + ], + "lam8_median": -0.004219561815261841, + "spectrum_median": [ + 0.004744160454720259, + 0.0016308835474774241, + 0.00021728611318394542, + -0.0006795059307478368, + -0.001709386589936912, + -0.002729899948462844, + -0.0034774676896631718, + -0.004219561815261841 + ], + "token_acc_median": 1.0, + "halted_at_median": 2.0 + }, + "B_conv_wrong": { + "n": 0 + }, + "C_nonconv_correct": { + "n": 11, + "lam1_median": 0.09982780367136002, + "lam1_mean": 0.08986719998277047, + "lam1_iqr": [ + 0.09067171066999435, + 0.10350960865616798 + ], + "lam8_median": 0.013320312835276127, + "spectrum_median": [ + 0.09982780367136002, + 0.06963343918323517, + 0.051610760390758514, + 0.03814869746565819, + 0.022425860166549683, + 0.01762143149971962, + 0.012642345391213894, + 0.013320312835276127 + ], + "token_acc_median": 1.0, + "halted_at_median": 15.0 + }, + "D_nonconv_wrong": { + "n": 118, + "lam1_median": 0.10232088342308998, + "lam1_mean": 0.10288177159125522, + "lam1_iqr": [ + 0.09352006390690804, + 0.11121566034853458 + ], + "lam8_median": 0.021454622969031334, + "spectrum_median": [ + 0.10232088342308998, + 0.07419029250741005, + 0.05829045735299587, + 0.047421256080269814, + 0.040371473878622055, + 0.032383667305111885, + 0.027303663082420826, + 0.021454622969031334 + ], + "token_acc_median": 0.6419752836227417, + "halted_at_median": 0.0 + } + }, + "mixture": { + "wrong_that_converged": 0.0, + "correct_that_nonconverged": 0.027918781725888325 + }, + "contrasts": { + "dlam1_correct_minus_wrong_overall": -0.09725644066929817, + "dlam1_within_converged": NaN, + "dlam1_within_nonconverged": -0.002493079751729965, + "dlam1_wrong_conv_minus_wrong_nonconv": NaN + }, + "auc": { + "neg_lam1_predicts_correct_overall": 0.9893530069689409, + "neg_lam1_predicts_correct_within_conv": NaN, + "neg_lam1_predicts_correct_within_nonconv": 0.6186440677966102, + "neg_logdrift_predicts_correct": 0.9747913619547449, + "neg_lam1_predicts_converged": 0.9955269496225231 + }, + "aux": { + "late_drift_zL_corr_with_zH_log": 0.9724686803222311, + "q_halt_final_median_by_cell": { + "A_conv_correct": 7.4375, + "B_conv_wrong": NaN, + "C_nonconv_correct": 7.40625, + "D_nonconv_wrong": -11.125 + } + } +}
\ No newline at end of file |
