summaryrefslogtreecommitdiff
path: root/research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
committerYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
commit66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch)
treec29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json
rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipelineHEADmain
Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json')
-rw-r--r--research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json105
1 files changed, 105 insertions, 0 deletions
diff --git a/research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json b/research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json
new file mode 100644
index 0000000..460e407
--- /dev/null
+++ b/research/flossing/analysis_2x2/results_trm_official_gbs768_step58590_n512.json
@@ -0,0 +1,105 @@
+{
+ "npz": "../official_gbs768_spectrum/trm_gbs768_base_step58590_n512_k8_seed20260602.npz",
+ "n": 512,
+ "exact_acc": 0.875,
+ "late_drift_def": "mean(drift_zH[:, -4:])",
+ "otsu_tau_log10": 1.364234039179148,
+ "frac_converged": 0.84765625,
+ "cells": {
+ "A_conv_correct": {
+ "n": 434,
+ "lam1_median": 0.011052772868424654,
+ "lam1_mean": 0.015589851711679268,
+ "lam1_iqr": [
+ 0.008054324658587575,
+ 0.017474188469350338
+ ],
+ "lam8_median": 0.0021472229855135083,
+ "spectrum_median": [
+ 0.011052772868424654,
+ 0.008679452817887068,
+ 0.007291494170203805,
+ 0.005999391432851553,
+ 0.004774029366672039,
+ 0.0037459908053278923,
+ 0.0029579862020909786,
+ 0.0021472229855135083
+ ],
+ "token_acc_median": 1.0,
+ "halted_at_median": 2.0
+ },
+ "B_conv_wrong": {
+ "n": 0
+ },
+ "C_nonconv_correct": {
+ "n": 14,
+ "lam1_median": 0.08274861052632332,
+ "lam1_mean": 0.0802882562524506,
+ "lam1_iqr": [
+ 0.07004822231829166,
+ 0.09586159884929657
+ ],
+ "lam8_median": 0.00618100818246603,
+ "spectrum_median": [
+ 0.08274861052632332,
+ 0.05459940806031227,
+ 0.039645833894610405,
+ 0.026364507153630257,
+ 0.020821912214159966,
+ 0.015413322485983372,
+ 0.010960425715893507,
+ 0.00618100818246603
+ ],
+ "token_acc_median": 1.0,
+ "halted_at_median": 14.0
+ },
+ "D_nonconv_wrong": {
+ "n": 64,
+ "lam1_median": 0.10339764878153801,
+ "lam1_mean": 0.10259491263423115,
+ "lam1_iqr": [
+ 0.09241705574095249,
+ 0.1118917465209961
+ ],
+ "lam8_median": 0.02135413885116577,
+ "spectrum_median": [
+ 0.10339764878153801,
+ 0.07536708191037178,
+ 0.057968027889728546,
+ 0.0463954322040081,
+ 0.03947761468589306,
+ 0.03304685465991497,
+ 0.026251215487718582,
+ 0.02135413885116577
+ ],
+ "token_acc_median": 0.6296296119689941,
+ "halted_at_median": 0.0
+ }
+ },
+ "mixture": {
+ "wrong_that_converged": 0.0,
+ "correct_that_nonconverged": 0.03125
+ },
+ "contrasts": {
+ "dlam1_correct_minus_wrong_overall": -0.09217484341934323,
+ "dlam1_within_converged": NaN,
+ "dlam1_within_nonconverged": -0.02064903825521469,
+ "dlam1_wrong_conv_minus_wrong_nonconv": NaN
+ },
+ "auc": {
+ "neg_lam1_predicts_correct_overall": 0.99267578125,
+ "neg_lam1_predicts_correct_within_conv": NaN,
+ "neg_lam1_predicts_correct_within_nonconv": 0.7667410714285714,
+ "neg_logdrift_predicts_correct": 0.9767020089285714,
+ "neg_lam1_predicts_converged": 0.9906947890818859
+ },
+ "aux": {
+ "late_drift_zL_corr_with_zH_log": 0.983883308834529,
+ "q_halt_final_median_by_cell": {
+ "A_conv_correct": 7.78125,
+ "B_conv_wrong": NaN,
+ "C_nonconv_correct": 7.71875,
+ "D_nonconv_wrong": -11.125
+ }
+ }
+} \ No newline at end of file