@@ -19,10 +19,12 @@ mixin squad_2_model_display(group, is_test)
19
19
th Model
20
20
th first_acc
21
21
th end_acc
22
- th expected wins
23
- - var largest_sent1_acc = Math .max .apply (null , group .map (function (model ) { return model .sent1_acc ; }))
24
- - var largest_eoq_acc = Math .max .apply (null , group .map (function (model ) { return model .eoq_acc ; }))
25
- - var largest_curve = Math .max .apply (null , group .map (function (model ) { return model .curve ; }))
22
+ th EW
23
+ th EW_OPT
24
+ - var largest_first_acc = Math .max .apply (null , group .map (function (model ) { return model .first_acc ; }))
25
+ - var largest_end_acc = Math .max .apply (null , group .map (function (model ) { return model .end_acc ; }))
26
+ - var largest_ew = Math .max .apply (null , group .map (function (model ) { return model .ew ; }))
27
+ - var largest_ew_opt = Math .max .apply (null , group .map (function (model ) { return model .ew_opt ; }))
26
28
each model in group
27
29
tr
28
30
if is_test
@@ -35,20 +37,25 @@ mixin squad_2_model_display(group, is_test)
35
37
if model .link
36
38
a.link ( href =model .link ) #{model .link }
37
39
td
38
- if model .sent1_acc == largest_sent1_acc
39
- b #{model .sent1_acc .toPrecision (5 )}
40
+ if model .first_acc == largest_first_acc
41
+ b #{model .first_acc .toPrecision (3 )}
40
42
else
41
- | #{model .sent1_acc .toPrecision (5 )}
43
+ | #{model .first_acc .toPrecision (3 )}
42
44
td
43
- if model .eoq_acc == largest_eoq_acc
44
- b #{model .eoq_acc .toPrecision (5 )}
45
+ if model .end_acc == largest_end_acc
46
+ b #{model .end_acc .toPrecision (3 )}
45
47
else
46
- | #{model .eoq_acc .toPrecision (5 )}
48
+ | #{model .end_acc .toPrecision (3 )}
47
49
td
48
- if model .curve == largest_curve
49
- b #{model .curve .toPrecision (5 )}
50
+ if model .ew == largest_ew
51
+ b #{model .ew .toPrecision (3 )}
50
52
else
51
- | #{model .curve .toPrecision (5 )}
53
+ | #{model .ew .toPrecision (3 )}
54
+ td
55
+ if model .ew_opt == largest_ew_opt
56
+ b #{model .ew_opt .toPrecision (3 )}
57
+ else
58
+ | #{model .ew_opt .toPrecision (3 )}
52
59
block content
53
60
.cover #contentCover
54
61
.container
@@ -128,6 +135,7 @@ block content
128
135
.infoHeadline
129
136
h2 Leaderboard
130
137
p
131
- | We evaluate each system with three metrics: accuracy at the end of the first sentence (first_acc) and at the end of the question (end_acc), and the
132
- a( href ="https://worksheets.codalab.org/worksheets/0xfb3d16165dd24f69bb1ba9420fca9212/" ) expected wins.
138
+ | We evaluate each system with four metrics: accuracy at the end of the first sentence (first_acc) and at the end of the question (end_acc), and two new metrics:
139
+ a( href ="https://worksheets.codalab.org/worksheets/0xfb3d16165dd24f69bb1ba9420fca9212/" ) expected wins
140
+ | with system buzzer (EW) and with optimal buzzer (EW_OPT).
133
141
+ squad_2_model_display(test2, true )
0 commit comments