summaryrefslogtreecommitdiff
path: root/resulets/outputs/injection_ablation_rerun/review_user_K4/summary.json
blob: 4f1bce593cb629297b7c69dcef8cc8a72da8ba0b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
{
  "aggregate": {
    "uph": {
      "rougeL": 0.12591913138908858,
      "meteor": 0.15704431994591794,
      "sfd_nolen": 0.9380754971612366,
      "avg_len": 165.04
    },
    "lm_head_update": {
      "rougeL": 0.1381619922784921,
      "meteor": 0.14988041373383443,
      "sfd_nolen": 1.2312511738320773,
      "avg_len": 142.135
    }
  },
  "significance": {
    "lm_head_update": {
      "rougeL": {
        "mean_a": 0.12591913138908858,
        "mean_b": 0.1381619922784921,
        "mean_diff": -0.012242860889403491,
        "ci_low": -0.015769665293717965,
        "ci_high": -0.008716056485089017,
        "t_pval": 1.1679421884663955e-10,
        "w_pval": 5.342212114561821e-11
      },
      "sfd_nolen": {
        "mean_a": 0.9380754971612366,
        "mean_b": 1.2312511738320773,
        "mean_diff": -0.2931756766708408,
        "ci_low": -1.0036757003149965,
        "ci_high": 0.41732434697331494,
        "t_pval": 0.41961878992446333,
        "w_pval": 0.04049481176403265
      }
    }
  },
  "num_examples": 200,
  "task": "review",
  "setting": "user",
  "K": 4,
  "methods": [
    "uph",
    "lm_head_update"
  ]
}