forked from castorini/anserini
-
Notifications
You must be signed in to change notification settings - Fork 0
/
mb11.yaml
137 lines (137 loc) · 2.9 KB
/
mb11.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
---
# Regression configuration for the `mb11` collection.
name: mb11

# Commands used for indexing, index inspection and searching.
index_command: target/appassembler/bin/IndexCollection
index_utils_command: target/appassembler/bin/IndexUtils
search_command: target/appassembler/bin/SearchCollection

# Directories containing the topic and qrels files.
topic_root: src/main/resources/topics-and-qrels/
qrels_root: src/main/resources/topics-and-qrels/

# Not set in this file; spelled as explicit nulls instead of bare empty values.
index_root: null
ranking_root: null

# Candidate root directories for `input`, one per known machine.
input_roots:
  - /tuna1/  # on tuna
  - /store/  # on orca
  - /scratch2/  # on damiano
input: collections/twitter/Tweets2011-corpus/json.gold/

# Path to the existing index, used in regression test if `--index` option is
# absent.
index_path: indexes/lucene-index.mb11.pos+docvectors+rawdocs

collection: TweetCollection
threads: 44
generator: TweetGenerator

# Extra flags for the index command. Each entry is a plain string that starts
# with `-` (no space after it), so no quoting is required.
index_options:
  - -storePositions
  - -storeDocvectors
  - -storeRawDocs
  - -uniqueDocid
  - -tweet.keepUrls
  - -tweet.stemming

# Index statistics recorded for this collection.
# NOTE(review): presumably compared against the built index — confirm against
# the regression script.
index_stats:
  documents: 14950477
  documents (non-empty): 14950449
  total terms: 175050212

topic_reader: Microblog
# Topic sets used in this regression. Each entry has a Markdown-formatted
# display `name`, the topics file (`path`) and its relevance judgments (`qrel`).
# NOTE(review): `path` and `qrel` are presumably resolved relative to
# `topic_root` / `qrels_root` — confirm against the regression script.
topics:
  - name: "[TREC 2011 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2011.txt)"
    path: topics.microblog2011.txt
    qrel: qrels.microblog2011.txt
  - name: "[TREC 2012 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2012.txt)"
    path: topics.microblog2012.txt
    qrel: qrels.microblog2012.txt
# Evaluation metrics. Each entry names the evaluation binary, its arguments,
# and how the metric value is extracted from the output.
# NOTE(review): `separator` / `parse_index` presumably select the field of the
# tab-split output line that holds the score — confirm against the regression
# script.
evals:
  - command: eval/trec_eval.9.0.4/trec_eval
    params:
      - -m map
    separator: "\t"  # double quotes required so that \t is a real tab
    parse_index: 2
    metric: map
    metric_precision: 4
    can_combine: true
  - command: eval/trec_eval.9.0.4/trec_eval
    params:
      - -m P.30
    separator: "\t"  # double quotes required so that \t is a real tab
    parse_index: 2
    metric: p30
    metric_precision: 4
    can_combine: true
# Retrieval models under regression. Each entry has an identifier (`name`),
# a display label, the search-command flags (`params`) and the recorded scores
# (`results`), keyed by metric name (`map`, `p30`).
# NOTE(review): each metric lists two scores, presumably one per topic set in
# the order they are declared under `topics` — confirm against the regression
# script.
models:
  - name: bm25
    display: BM25
    params:
      - -searchtweets
      - -bm25
    results:
      map:
        - 0.3384
        - 0.1948
      p30:
        - 0.3959
        - 0.3316
  - name: bm25+rm3
    display: +RM3
    params:
      - -searchtweets
      - -bm25
      - -rm3
    results:
      map:
        - 0.3650
        - 0.2193
      p30:
        - 0.4170
        - 0.3463
  - name: bm25+ax
    display: +Ax
    params:
      - -searchtweets
      - -bm25
      - -axiom
      - -axiom.beta 1.0
      - -axiom.deterministic
      - -rerankCutoff 20
    results:
      map:
        - 0.4008
        - 0.2309
      p30:
        - 0.4612
        - 0.3554
  - name: ql
    display: QL
    params:
      - -searchtweets
      - -qld
    results:
      map:
        - 0.3584
        - 0.2102
      p30:
        - 0.4061
        - 0.3333
  - name: ql+rm3
    display: +RM3
    params:
      - -searchtweets
      - -qld
      - -rm3
    results:
      map:
        - 0.3923
        - 0.2389
      p30:
        - 0.4435
        - 0.3514
  - name: ql+ax
    display: +Ax
    params:
      - -searchtweets
      - -qld
      - -axiom
      - -axiom.beta 1.0
      - -axiom.deterministic
      - -rerankCutoff 20
    results:
      map:
        - 0.4201
        - 0.2474
      p30:
        - 0.4408
        - 0.3842