From 66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Sat, 13 Jun 2026 12:35:36 -0500 Subject: rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipeline Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 --- .../results_trm_official58590_n2048.json | 105 +++++++++++++++++++++ 1 file changed, 105 insertions(+) create mode 100644 research/flossing/analysis_2x2/results_trm_official58590_n2048.json (limited to 'research/flossing/analysis_2x2/results_trm_official58590_n2048.json') diff --git a/research/flossing/analysis_2x2/results_trm_official58590_n2048.json b/research/flossing/analysis_2x2/results_trm_official58590_n2048.json new file mode 100644 index 0000000..bc000b2 --- /dev/null +++ b/research/flossing/analysis_2x2/results_trm_official58590_n2048.json @@ -0,0 +1,105 @@ +{ + "npz": "retest/trm_gbs768_step58590_full_n2048.npz", + "n": 2048, + "exact_acc": 0.8759765625, + "late_drift_def": "mean(drift_zH[:, -4:])", + "otsu_tau_log10": 1.3628430376123835, + "frac_converged": 0.841796875, + "cells": { + "A_conv_correct": { + "n": 1724, + "lam1_median": 0.011281780432909727, + "lam1_mean": 0.015547435924631226, + "lam1_iqr": [ + 0.008467044215649366, + 0.01652396097779274 + ], + "lam8_median": 0.0020897792419418693, + "spectrum_median": [ + 0.011281780432909727, + 0.008820333052426577, + 0.007248040288686752, + 0.0058647627010941505, + 0.004666940309107304, + 0.003820874495431781, + 0.0028478524181991816, + 0.0020897792419418693 + ], + "token_acc_median": 1.0, + "halted_at_median": 2.0 + }, + "B_conv_wrong": { + "n": 0 + }, + "C_nonconv_correct": { + "n": 70, + "lam1_median": 0.0819745659828186, + "lam1_mean": 0.07783016583749226, + "lam1_iqr": [ + 0.06863085739314556, + 0.09041773155331612 + ], + "lam8_median": 0.008648575283586979, + "spectrum_median": [ + 0.0819745659828186, + 0.052037810906767845, + 0.039651695638895035, + 0.028503953479230404, + 0.023648646660149097, + 0.016836480237543583, + 0.011321825440973043, + 0.008648575283586979 + ], + "token_acc_median": 1.0, + "halted_at_median": 14.0 + }, + "D_nonconv_wrong": { + "n": 254, + "lam1_median": 0.10287182405591011, + "lam1_mean": 0.10287220525283983, + "lam1_iqr": [ + 0.09241268038749695, + 0.11242476664483547 + ], + "lam8_median": 0.01879305113106966, + "spectrum_median": [ + 0.10287182405591011, + 0.0741146095097065, + 0.05705060437321663, + 0.045855674892663956, + 0.03607587888836861, + 0.029474849812686443, + 0.023949903436005116, + 0.01879305113106966 + ], + "token_acc_median": 0.6296296119689941, + "halted_at_median": 0.0 + } + }, + "mixture": { + "wrong_that_converged": 0.0, + "correct_that_nonconverged": 0.03901895206243032 + }, + "contrasts": { + "dlam1_correct_minus_wrong_overall": -0.09140016930177808, + "dlam1_within_converged": NaN, + "dlam1_within_nonconverged": -0.020897258073091507, + "dlam1_wrong_conv_minus_wrong_nonconv": NaN + }, + "auc": { + "neg_lam1_predicts_correct_overall": 0.9934800165029538, + "neg_lam1_predicts_correct_within_conv": NaN, + "neg_lam1_predicts_correct_within_nonconv": 0.8484814398200224, + "neg_logdrift_predicts_correct": 0.9719340057409211, + "neg_lam1_predicts_converged": 0.9923716736845121 + }, + "aux": { + "late_drift_zL_corr_with_zH_log": 0.9854614526028403, + "q_halt_final_median_by_cell": { + "A_conv_correct": 7.78125, + "B_conv_wrong": NaN, + "C_nonconv_correct": 7.71875, + "D_nonconv_wrong": -11.125 + } + } +} \ No newline at end of file -- cgit v1.2.3