1
2
3
|
corr_neg_lambda1_correct,corr_neg_spec_count_pos_correct,corr_neg_spec_lambda1_correct,corr_neg_spec_mean_correct,corr_neg_spec_pos_l2_correct,corr_neg_spec_pos_mass_correct,corr_neg_spec_spread_correct,corr_q_correct,corr_q_lambda1,corr_q_spec_count_pos,corr_q_spec_lambda1,corr_q_spec_mean,corr_q_spec_pos_l2,corr_q_spec_pos_mass,corr_q_spec_spread,deterministic/exact,file,lambda1_both_fail,lambda1_feature_wins,lambda1_min/exact,lambda1_min/token_acc,lambda1_q_wins,mean_rollout/exact,n_samples,oracle_pass/exact,q_max/exact,q_max/token_acc,rollouts,spec_count_pos_both_fail,spec_count_pos_feature_wins,spec_count_pos_min/exact,spec_count_pos_min/token_acc,spec_count_pos_q_wins,spec_lambda1_both_fail,spec_lambda1_feature_wins,spec_lambda1_min/exact,spec_lambda1_min/token_acc,spec_lambda1_q_wins,spec_mean_both_fail,spec_mean_feature_wins,spec_mean_min/exact,spec_mean_min/token_acc,spec_mean_q_wins,spec_pos_l2_both_fail,spec_pos_l2_feature_wins,spec_pos_l2_min/exact,spec_pos_l2_min/token_acc,spec_pos_l2_q_wins,spec_pos_mass_both_fail,spec_pos_mass_feature_wins,spec_pos_mass_min/exact,spec_pos_mass_min/token_acc,spec_pos_mass_q_wins,spec_spread_both_fail,spec_spread_feature_wins,spec_spread_min/exact,spec_spread_min/token_acc,spec_spread_q_wins
0.8814938732175305,nan,0.8814938732175305,0.881548727791444,0.8816329740738039,0.881548727791444,0.7016889487515001,0.9656375405401326,-0.9166162782344888,nan,-0.9166162782344888,-0.916666132347328,-0.9167544021264978,-0.916666132347328,-0.7300307437150374,0.734375,research/flossing/ptrm_spectrum_k4_trm_base260410_k100_d64_sigma03_Lonly_n64.npz,3.0,2.0,0.890625,0.9523533582687378,4.0,0.78296875,64.0,0.953125,0.921875,0.9720293283462524,100.0,3.0,2.0,0.71875,0.899498462677002,15.0,3.0,2.0,0.890625,0.9523533582687378,4.0,3.0,2.0,0.890625,0.9511959552764893,4.0,3.0,2.0,0.890625,0.9511959552764893,4.0,3.0,2.0,0.890625,0.9511959552764893,4.0,3.0,2.0,0.890625,0.953125,4.0
0.9158759787150939,nan,0.9158759787150939,0.9174927024166323,0.9174867637523325,0.9174927024166323,0.8654349435118633,0.9987222810222618,-0.9132736884879366,nan,-0.9132736884879366,-0.9147807220489171,-0.9147768468622256,-0.9147807220489171,-0.8639983425079254,0.828125,research/flossing/ptrm_spectrum_k4_trm_multi4_104164_k100_d64_sigma03_Lonly_n64.npz,3.0,0.0,0.953125,0.9826388955116272,0.0,0.87265625,64.0,0.953125,0.953125,0.9814814925193787,100.0,3.0,0.0,0.84375,0.9394290447235107,7.0,3.0,0.0,0.953125,0.9826388955116272,0.0,3.0,0.0,0.953125,0.9814814925193787,0.0,3.0,0.0,0.953125,0.9814814925193787,0.0,3.0,0.0,0.953125,0.9814814925193787,0.0,3.0,0.0,0.953125,0.9814814925193787,0.0
|