summaryrefslogtreecommitdiff
path: root/research/flossing/analysis_2x2/results_hrm26040_n8192.json
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
committerYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
commit66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch)
treec29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/analysis_2x2/results_hrm26040_n8192.json
rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipelineHEADmain
Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/analysis_2x2/results_hrm26040_n8192.json')
-rw-r--r--research/flossing/analysis_2x2/results_hrm26040_n8192.json124
1 files changed, 124 insertions, 0 deletions
diff --git a/research/flossing/analysis_2x2/results_hrm26040_n8192.json b/research/flossing/analysis_2x2/results_hrm26040_n8192.json
new file mode 100644
index 0000000..bf4c711
--- /dev/null
+++ b/research/flossing/analysis_2x2/results_hrm26040_n8192.json
@@ -0,0 +1,124 @@
+{
+ "npz": "/home/yurenh2/rrm/research/flossing/diag_8k.npz",
+ "n": 8192,
+ "exact_acc": 0.524658203125,
+ "late_drift_def": "mean(drift_zH[:, -4:])",
+ "otsu_tau_log10": 0.766353451713377,
+ "frac_converged": 0.508544921875,
+ "cells": {
+ "A_conv_correct": {
+ "n": 4103,
+ "lam1_median": -0.8617429137229919,
+ "lam1_mean": -0.8564737750180547,
+ "lam1_iqr": [
+ -0.9020151197910309,
+ -0.815339982509613
+ ],
+ "lam8_median": -0.9746241569519043,
+ "spectrum_median": [
+ -0.8617429137229919,
+ -0.8905690908432007,
+ -0.9112593531608582,
+ -0.9292124509811401,
+ -0.9435566663742065,
+ -0.9553980827331543,
+ -0.9662551879882812,
+ -0.9746241569519043
+ ],
+ "token_acc_median": 1.0,
+ "halted_at_median": 4.0
+ },
+ "B_conv_wrong": {
+ "n": 63,
+ "lam1_median": -0.5912281274795532,
+ "lam1_mean": -0.6317614662268806,
+ "lam1_iqr": [
+ -0.809065192937851,
+ -0.5061159133911133
+ ],
+ "lam8_median": -0.7379652261734009,
+ "spectrum_median": [
+ -0.5912281274795532,
+ -0.6236273050308228,
+ -0.6583524942398071,
+ -0.681266725063324,
+ -0.6938952207565308,
+ -0.7069988250732422,
+ -0.7344604730606079,
+ -0.7379652261734009
+ ],
+ "token_acc_median": 0.6296296119689941,
+ "halted_at_median": 0.0
+ },
+ "C_nonconv_correct": {
+ "n": 195,
+ "lam1_median": -0.694297194480896,
+ "lam1_mean": -0.6856319598662548,
+ "lam1_iqr": [
+ -0.7354169189929962,
+ -0.6466438174247742
+ ],
+ "lam8_median": -0.7886528372764587,
+ "spectrum_median": [
+ -0.694297194480896,
+ -0.7198933362960815,
+ -0.7372102737426758,
+ -0.7535885572433472,
+ -0.7657074928283691,
+ -0.7715225219726562,
+ -0.7826006412506104,
+ -0.7886528372764587
+ ],
+ "token_acc_median": 1.0,
+ "halted_at_median": 14.0
+ },
+ "D_nonconv_wrong": {
+ "n": 3831,
+ "lam1_median": -0.5997700691223145,
+ "lam1_mean": -0.5970111100099877,
+ "lam1_iqr": [
+ -0.64748615026474,
+ -0.548848420381546
+ ],
+ "lam8_median": -0.7142836451530457,
+ "spectrum_median": [
+ -0.5997700691223145,
+ -0.634728193283081,
+ -0.6558717489242554,
+ -0.6714187860488892,
+ -0.6842536330223083,
+ -0.6956309676170349,
+ -0.7056014537811279,
+ -0.7142836451530457
+ ],
+ "token_acc_median": 0.6296296119689941,
+ "halted_at_median": 0.0
+ }
+ },
+ "mixture": {
+ "wrong_that_converged": 0.016178736517719568,
+ "correct_that_nonconverged": 0.04536993950674732
+ },
+ "contrasts": {
+ "dlam1_correct_minus_wrong_overall": -0.2586202025413513,
+ "dlam1_within_converged": -0.2705147862434387,
+ "dlam1_within_nonconverged": -0.09452712535858154,
+ "dlam1_wrong_conv_minus_wrong_nonconv": 0.00854194164276123
+ },
+ "auc": {
+ "neg_lam1_predicts_correct_overall": 0.9841127835524125,
+ "neg_lam1_predicts_correct_within_conv": 0.8520014391328065,
+ "neg_lam1_predicts_correct_within_nonconv": 0.8180149790173282,
+ "neg_logdrift_predicts_correct": 0.9639893544685683,
+ "neg_lam1_predicts_converged": 0.9859867295607834
+ },
+ "aux": {
+ "late_drift_zL_corr_with_zH_log": 0.9985142270869076,
+ "q_halt_final_median_by_cell": {
+ "A_conv_correct": 7.46875,
+ "B_conv_wrong": -8.6875,
+ "C_nonconv_correct": 7.46875,
+ "D_nonconv_wrong": -9.625
+ }
+ }
+} \ No newline at end of file