1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
|
{
"aggregate": {
"uph": {
"rougeL": 0.12591913138908858,
"meteor": 0.15704431994591794,
"sfd_nolen": 0.9380754971612366,
"avg_len": 165.04
},
"lm_head_update": {
"rougeL": 0.1381619922784921,
"meteor": 0.14988041373383443,
"sfd_nolen": 1.2312511738320773,
"avg_len": 142.135
}
},
"significance": {
"lm_head_update": {
"rougeL": {
"mean_a": 0.12591913138908858,
"mean_b": 0.1381619922784921,
"mean_diff": -0.012242860889403491,
"ci_low": -0.015769665293717965,
"ci_high": -0.008716056485089017,
"t_pval": 1.1679421884663955e-10,
"w_pval": 5.342212114561821e-11
},
"sfd_nolen": {
"mean_a": 0.9380754971612366,
"mean_b": 1.2312511738320773,
"mean_diff": -0.2931756766708408,
"ci_low": -1.0036757003149965,
"ci_high": 0.41732434697331494,
"t_pval": 0.41961878992446333,
"w_pval": 0.04049481176403265
}
}
},
"num_examples": 200,
"task": "review",
"setting": "user",
"K": 4,
"methods": [
"uph",
"lm_head_update"
]
}
|