1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
|
{
"aggregate": {
"uph": {
"rougeL": 0.11947665707568338,
"meteor": 0.2031354029453746,
"sfd_nolen": 0.8995390462886158,
"avg_len": 246.47
},
"lm_head_update": {
"rougeL": 0.12993177009628162,
"meteor": 0.19363473440376885,
"sfd_nolen": 0.9707037426803997,
"avg_len": 253.99
}
},
"significance": {
"lm_head_update": {
"rougeL": {
"mean_a": 0.11947665707568338,
"mean_b": 0.12993177009628162,
"mean_diff": -0.010455113020598263,
"ci_low": -0.013828552374635705,
"ci_high": -0.0070816736665608206,
"t_pval": 6.213636827361804e-09,
"w_pval": 1.1330271751337874e-11
},
"sfd_nolen": {
"mean_a": 0.8995390462886158,
"mean_b": 0.9707037426803997,
"mean_diff": -0.07116469639178391,
"ci_low": -0.1589445052822547,
"ci_high": 0.016615112498686885,
"t_pval": 0.1136461024786351,
"w_pval": 0.7252815218848135
}
}
},
"num_examples": 200,
"task": "topic",
"setting": "user",
"K": 4,
"methods": [
"uph",
"lm_head_update"
]
}
|