{ "aggregate": { "uph": { "rougeL": 0.12591913138908858, "meteor": 0.15704431994591794, "sfd_nolen": 0.9380754971612366, "avg_len": 165.04 }, "lm_head_update": { "rougeL": 0.1381619922784921, "meteor": 0.14988041373383443, "sfd_nolen": 1.2312511738320773, "avg_len": 142.135 } }, "significance": { "lm_head_update": { "rougeL": { "mean_a": 0.12591913138908858, "mean_b": 0.1381619922784921, "mean_diff": -0.012242860889403491, "ci_low": -0.015769665293717965, "ci_high": -0.008716056485089017, "t_pval": 1.1679421884663955e-10, "w_pval": 5.342212114561821e-11 }, "sfd_nolen": { "mean_a": 0.9380754971612366, "mean_b": 1.2312511738320773, "mean_diff": -0.2931756766708408, "ci_low": -1.0036757003149965, "ci_high": 0.41732434697331494, "t_pval": 0.41961878992446333, "w_pval": 0.04049481176403265 } } }, "num_examples": 200, "task": "review", "setting": "user", "K": 4, "methods": [ "uph", "lm_head_update" ] }