Information Technology Reference
In-Depth Information
Table 10.3
Features for the OHSUMED corpus
ID
Feature description
1
$\sum_{t_i \in q \cap d} \mathrm{TF}(t_i, d)$ in title
2
$\sum_{t_i \in q \cap d} \log\left(\mathrm{TF}(t_i, d) + 1\right)$ in title
3
$\sum_{t_i \in q \cap d} \frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)}$ in title
4
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} + 1\right)$ in title
5
$\sum_{t_i \in q} \log\left(|C| \cdot \mathrm{IDF}(t_i)\right)$ in title
6
$\sum_{t_i \in q} \log\left(\log\left(|C| \cdot \mathrm{IDF}(t_i)\right)\right)$ in title
7
$\sum_{t_i \in q} \log\left(\frac{|C|}{\mathrm{TF}(t_i, C)} + 1\right)$ in title
8
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} \cdot \log\left(|C| \cdot \mathrm{IDF}(t_i)\right) + 1\right)$ in title
9
$\sum_{t_i \in q \cap d} \mathrm{TF}(t_i, d) \cdot \log\left(|C| \cdot \mathrm{IDF}(t_i)\right)$ in title
10
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} \cdot \frac{|C|}{\mathrm{TF}(t_i, C)} + 1\right)$ in title
11
BM25 of title
12
log(BM25) of title
13
LMIR.DIR of title
14
LMIR.JM of title
15
LMIR.ABS of title
16
$\sum_{t_i \in q \cap d} \mathrm{TF}(t_i, d)$ in abstract
17
$\sum_{t_i \in q \cap d} \log\left(\mathrm{TF}(t_i, d) + 1\right)$ in abstract
18
$\sum_{t_i \in q \cap d} \frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)}$ in abstract
19
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} + 1\right)$ in abstract
20
$\sum_{t_i \in q} \log\left(|C| \cdot \mathrm{IDF}(t_i)\right)$ in abstract
21
$\sum_{t_i \in q} \log\left(\log\left(|C| \cdot \mathrm{IDF}(t_i)\right)\right)$ in abstract
22
$\sum_{t_i \in q} \log\left(\frac{|C|}{\mathrm{TF}(t_i, C)} + 1\right)$ in abstract
23
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} \cdot \log\left(|C| \cdot \mathrm{IDF}(t_i)\right) + 1\right)$ in abstract
24
$\sum_{t_i \in q \cap d} \mathrm{TF}(t_i, d) \cdot \log\left(|C| \cdot \mathrm{IDF}(t_i)\right)$ in abstract
25
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} \cdot \frac{|C|}{\mathrm{TF}(t_i, C)} + 1\right)$ in abstract
26
BM25 of abstract
27
log(BM25) of abstract
28
LMIR.DIR of abstract
29
LMIR.JM of abstract
30
LMIR.ABS of abstract
31
$\sum_{t_i \in q \cap d} \mathrm{TF}(t_i, d)$ in 'title + abstract'
32
$\sum_{t_i \in q \cap d} \log\left(\mathrm{TF}(t_i, d) + 1\right)$ in 'title + abstract'
33
$\sum_{t_i \in q \cap d} \frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)}$ in 'title + abstract'
34
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} + 1\right)$ in 'title + abstract'
35
$\sum_{t_i \in q} \log\left(|C| \cdot \mathrm{IDF}(t_i)\right)$ in 'title + abstract'
36
$\sum_{t_i \in q} \log\left(\log\left(|C| \cdot \mathrm{IDF}(t_i)\right)\right)$ in 'title + abstract'
37
$\sum_{t_i \in q} \log\left(\frac{|C|}{\mathrm{TF}(t_i, C)} + 1\right)$ in 'title + abstract'
38
$\sum_{t_i \in q \cap d} \log\left(\frac{\mathrm{TF}(t_i, d)}{\mathrm{LEN}(d)} \cdot \log\left(|C| \cdot \mathrm{IDF}(t_i)\right) + 1\right)$ in 'title + abstract'