Professional Documents
Culture Documents
Thorsten Joachims
GMD Forschungszentrum IT, AIS.KD
Schloss Birlinghoven, 53754 Sankt Augustin, Germany
Thorsten.Joachims@gmd.de
"
>
$
!
?$ 0
" '
*
=<$<<<
*
High Level of Redundancy. &
"
" '
$
Sparse Document Vectors. &
$
"
"
* - ,--/
*
G
>
!
?
" 1
"
*"
%EE
E
9
* ,-./
step step step
2 3 1
1
0
0
1
4
0
1
"
200 positive
600 irrelevant
11
00
00
11
1 00
11 10
00
11 11
00
9
300011 1
00
positive
00
11 3000 negative 4000 irrelevant
. " /
! * *"
:
;<<
" )
$
*
$
"
" ,-./ 1"
$
. 8 .$
"
"
" -
* *
G
"$
. ,;<%;<%-<</ P !
,.%-%;<</ ,-%.%;<</ ,3%3%4<</ P !
"
,N%-%=<<</ ,-%N%=<<</ ,-<%-<%.<<</ P !
, (
"$
-<$<<<
!"
$
*
&
$
*
.$<<<
-<
:
(
*
H
=$<<<
" Empirical Validation. :
!" N
G
;-3C5 $
&*KH $
A
-
"
" *
*
:
=( F
" >?
&*KH
8
$
0
01 2 + --$-<<
$
$
$
#
" ,-./
*"
$
N5 !"
+ 1 3 9
" 3<
$
--$<3< ; 3; !"
<3 1
8 3 "$
.=- =.-
0 , " #
!"
. !" N !"
3
<;
: !"
3$<.3
3< $
"
-< ;.$;C4
"
<- 1
*"
0 4 " H
"
;<< *
$
!" =$<<< !"
"
"
8
* *
" $ >
?
*
.
!" N
" 1
&*KH
;CC
!"
: 8
" ??$
"
!" $
;CCQ
;CC
N5
* 3<
!"
!"
%EE
EE
;-3C5
"
%EE EEE0
E
;<EE
=
%EE E*E
"(
"(
"(
7& .* $8.$
"
*
<<; <<N << << <-
* * *
<- <; <=
<= <=
<.
" * *
* !- !;
"
!=
"*
*
"
"
0
"
" "
" "
" "
"
"
< <* <*- < < < <
" <5; .' -<< -<< -<<
Æ
-<;<4;< -<; -<=
"
*
*
"
*
* "
*
*
"
"
" " "
<<
$! *. !.!%9
"(
"(
"(
6 N
A
Æ
7 ; 7
" >
"? ¾
6
,; % - % -</ ,- % . % ;;/ P !
,; % - % N;/ ,- % ; % N./ P !
,3%-%.<5</ ,-%-<%;<N;;/ P !
B 6 6 $
,-NC % -N< % -=.3N/ P
!
"
!
$ £
-N
<
%$¼
*
6 <
6 ' & ! &' - ;<
* %
- *
-N "
6 " -< %
; -
, / - £ 6 - ' & ! &' -
$¼ # ;-
;
' & ! &'
*
--
, / -
' & ! &' 6
! !
;;
"
£
Æ 6 ; £ H"
*$
*
"
6
!
!
;=
*
F
6
-
;.
!
*
6 # !#
#
"
--
* H"
$
*
;-
*
"
$
!
"
:
$
# - $
"$ #
-
*
" " *
@
*
"
&
"
¼ # 6 " # !#
- -;
" $ ,-./
; *
# - -=
*
9
*
*
"
#
- -. - :"$
(
F
# *
£ # $
¼ £ £
9
( @
$
Æ ; ¼ #£ * ¼ £
*
"
*
* #
*
!
"
"
*
F
$ OL
¼ #£ !
$# £ 1
!
"
OL ,-3/
-
$# 6 # !# # - 7 # 7 - -3
; ! 6 ;3
7 )
< <
F
"
) 3$ * -=$
-= -. #
*
OL
"
%$# !"
"
R
"
%#
6< -4
!
#
!"
* OL
$
# 6 ! , / -C
OL
"$
"
8
!
"
!"$
"
9
# 6 ! &' -5
& & " # )
& 6 $ ' 6 %- -$ 6 % ! !
(
" *
F "
*+
- ! 6 7 ) ;4
$ 6 - -N
; ' & ! &'
! % ! (
"
!
6 *0
< <
" *
$
*
< < G
"
*0
7
%
6(
) 7 )
$¼ £
8
*
!"
*
!"
!
G
¾
ƾ
&*KH
¾
ƾ
3-N
<
--.= <
" -4=4 <
! 6 ;C 0
C.- <
7 ) ! -5.5 <
%
! ! $
9
"
-.5N
353
;C
<
A
-355
¾
ƾ
<
5-< .
54N N +
" --4-. <
6 ;5
;<5; == :
.=5C <
7 ) .35 < @ ;545 <
.<3 ; @
" ==<= <
=C5 < ;334 <
:* F - F ;
-
! =>
" # !%?9$& "? :
;<
&
) $%$ # *&?*$7 "? @ *&?9%7
, % % / , % % /
" " 6 3<
(
? 21 "
*+ ! 6
# @? "
& '
:
;<
= "
@
6
¾
8
$ * ;
A
$
7; 7 6
¾ &*KH
$
G
;-3C5
7- " *
6 <
6
"
6
"$
*
" G
*
"
% 6 % 6 ( *
$ *
" *
*
-
'
$
-
;N
""
7- Æ
*
:
"
"
Æ
"
F
-
* Æ *
*
7 ; 7
=<
5. COMPARING THE THEORETICAL
Æ MODEL WITH EXPERIMENTAL
RESULTS
*
" *
9
"
!
F ;
*
OL ! 6
$
*
8
$
"
:
$
"
"
*
:
"
0
$ *
Empirical Validation. :
0
" " *
6 <$
$
*"
Æ
*
.; :
&*KH
"
@ (
D
"
$
*
$
&*KH >? --;Q ..Q
!"
G
>? -3Q -=Q
A >
"? N.3Q ;=-Q 1 B " +
* /
*" ' *
' *
"
*
A
" $
'
:
;<
')? # !
')? @
' , " #
"$
) 6 -<<< =
*
*
"
"$
*
"
'
>?
8
$
8B8
'
OL
&*KH
6 .C<<<<$
,-./
) 6 3$ * 6 -;3 *0
;$ *
*
7. LIMITATIONS OF THE MODEL AND
OPEN QUESTIONS
<;==- -5NNC
..= =- 9
" *
"
7- 7-
"
*
:!
"$ 8
$
"
=N3C
OL $
--;Q
"
1
G
" >?
$
* !
<-5<; C4;N
-=5 $
*
=;
:
&
7- 7-
*
*
N4<=
$
* *
"
-3Q "$
*
*
$ *
"
A
" >
"? *
C.-;= -;C35
N.3C )
$
*
==
$
* &
7- 7-
" ,-./
N.3Q
*
$
*
-<$<<<
*
1
$
* =
*
"
*"
*
*
&
* 8"$
"
" *
&
*
$ * =
Æ
Æ
*
"
$ * " *
$
"
"
!
>?
$ >?
$
*
>
"?
Æ
&
:
**"
*
* 8. RELATED WORK
,-=/$
:
&
* "
"
$
""
*
"
* ,-./
0
H" @
6. SENSITIVITY ANALYSIS: DIFFICULT H" " 0
,=/ )
$
AND EASY LEARNING TASKS
"
*
*
&
* :
,-C/$ *
D
'
8
$
*
"
"
Æ
>"? > Æ
?
$
,-./
$ *
"
"
*0
*
*
" 1)-5$ 4<4S4;=$ -NN-
"
*
,4/ @ 8 D K G
*
E" :
1
*
G0*$
$ 1 ."
;+ ,-/ )
$
H )
1" 2
,
0
*"
,5$ N/ B
6# -#
$ =N-S.<5
,C/ ,4/ ,3/
:* #
" +$ M" -N5.
$ *
!
,C/ @ DT
$ F$ @ 8 1 **
"
&*
& '
$
2
#)/33 4 -#
+
)
#
)
,-4/ "
/
$ .C3S.5;$ K :
"$
*
$ #$ -NNN 1: +$ @ I$ #
*
*
,5/ + )
1 **
"
' " +
%
*
*
)
$
"
"
,
-
)
$
"
* ;4.%-NCS;<4$ -NC3
,N/ + )
1 **
9. SUMMARY AND CONCLUSIONS " +
% 1
**
,
-
*
!
"
)
$ ;43%;5<S;5N$ -NC3
,-</ M B ) +**
#
-) $
#
-NNN
$
,--/ M
% F
"
Æ
2
(
#
$
7$ -=C S -.;$ H$ -NN5
"
,-;/ M
H
$
H T$ : H$ 1 $
$ -" /
7$
-- +$ :* $ 1$
*
-NNN
,-=/ M 9
*
Æ
" 2
*
"
S
" S "$ )
#
7$
$
8$ ;<<< K
!" Æ
,-./ M -
8"$
7 #$
*
-
+B
$ #
T
B
$ ;<<-
K$
,-3/ H *
1
*
10. REFERENCES
% 1"
! *" ) 1
,-/ 1 H
B G +**
)
#
$ ;-%N<SNN$ 1
,
- -N3N
)
$ ;33%=-;S=-5$ -NC. ,-4/ : ) +
$ + G
$ ) $
,;/ : H 1
F
% 1 **
. /
" 1:$
$ 25. +34 2
.
"$ ;;%-;-S-4C$ -NN5 -# )0-#)05.)0-1
,=/ & :
2
. , 8334
**
)
9
$ -3NS-45$ @ I$ @I -<<=4$
-# )0)1 #
1 #1$ -NN5 1: +
."
)
1"$ 3CS4-$ ,-C/ : 7
)
"
-NN- )
- +B
$
#
"$
,./ B$ M +
$ B )$ -NN5
,-5/ 7
&"$
2
-##)/34$ :
$ DH$ -NN5
@
* -NN5 ,-N/ D K O ; 6"
2
,3/ @ 8$ )
$ D F
$
$ 7 (<
- )
; (
K $ D K 1E * 1 &"$ :* $ 1$ #1$ -N.N