½
½
¾
½
!" # $%
¾
&'()* +,% '*,** -./+$%
$''0'+''' 1+
2 31 !$4* 5 ' ' 0 %
''+166311
"' 6#1+* +'
7 2%' 1 + +' 1 8+ 1
+ 1 0 1 * 4 + 1 + % 9
1+ 80 0 ** : 80
%; + 1 7 * 4 7 0 0
1++ 1 +80 07 1
+* <1 ' + !$421
!+0' * $0%
% 1 1++* $ '' 1 %2
1 ' 1 '1 %'1 8 +* 5
6 ''1+% 20*
4'+ 11++21:Æ
6 8= 0 6 1 '+ +'* 4 2 1
$1+"$#>-?%++0 +
91+6' 7 %* $7 18%'
'1 @1+7 %+''11+
8=8=+%+*
A8= ' %'% 8 0 8 % 1 * 4
+ +2 8 6 1+ % 0* B0
+8 +%:0%6''*
$ % 8+ 0 + 1 +
+* 4 8+ + 0 + 8 (
6' 8 1 ( 1 Æ *
! +81''1+1
0: 18+ 8*
4$8+'01 11+ ++
+2 82 3* 4 0 8%
1+ 1' 8'1
%+1+ 8%''0%16'
01 * "#%+1
0 0+ +'1 *
4 206'01++ +
0'' 5 +"5#%* A
1%0''+ 2* < 8++ 1
!+!$4*
4 '' 10* $$ 8 +% 1
* $$$$08+ !$46'+ * $
$0'++200 *
$1+ 6 2 ' 0' '* 5 +
'0 3 ' +0 % '3
+ +* $ % " # ' +' 1 +
2'8%%1+' 6'20*
6+'1 0 '' 0 0+ 1% 0
6 0* $ 3' 0 6 1% % C
8=* % 0&20) %
'0= +81% ++('3+1
* A 6+'1 0' ' 0 0( 8=1
682 % *
< % + 0% % D
80++%''3 11+* $0
'' 0 6 Æ% % 1+1 7 "** 6#*
0 8 1+ + 1+ " + # 0 0 %
61+7 E 40 7 11+8*
B ' + 3 ' ' 0
+ + 1% 1+ *
<10$1+4''>F?* $$1+4%"$4#0
&1+) 7 %' + +% &'%) 1 * $
'%+ +7 * '' '
1 ' '%'88%1 * $1
0'88%"%# ' 0 8(* A
1'88%1 1 07 + '0 8
''%*
$'8631'%110
%1 * 400%(60 ;
'' 20* + +% 7 3 1 '% 8
1 G++'6%++'6%" 1
>/?#C
*
+'61+'6% '' * 4 3 % 8C 1
+'8 '' 3 '+>/?* 3
8+8'+ 2' 7 8
+6 '+ % '
" %3# +*
4+Æ %1+ '%11
0+'%80'%+6+ ++'17
½
¾
¿
#6''80 %+8* $1 17
'8 +' 7 "0 '8 0
%+8#0(+;* 41 +8181
<06+6'%''+
1 '+ * 4 3 +' (''* $ %'
(''8 '3 '++% 8
'%+* 48+'+ 1(''3
++'+ 80 8+ 1'%'
8% (''* $ 0 20 +' + ' '01 1
+ 1'% +%1+ 1 +' + 1
+'6%>?*
%+ +'%"8++'6%#1
1"08% ''#% %'* 4
'+0 8'80
%''17 "** 6#+'* <'+
%8''+>H?1663
1 1 1+* +'7
2%'1 + +' 1 8+ 1+1081
20* 4 8 1 ' 8 3 8
807 1 '%*
4 2% ' 1 0 + +'* '' % 0 + &)
" +%# 80 6 + 1 1+ * 5 1
060 : "** $#&) +
1 Æ %6' 8% %' '21 + 6
0 * % + + +800
8%+ 8006'10 *
'80%++80068''>H?+1
'%>.?* ( 1''6+08
' 10* <26 0'' $ 6 0
(' 6* 4(''831+ 61
08"+#'+%3"+1+'
' #* <$'8(''0%0'+
1* 3'1$30* 10
(''&)$ * 4111$3&+
) : 80 " 8# 1 ('' I$ 6
"8#16(''0+ 1))80
06* 5 '0 JHH+>? 1
8 20 +' +* < +% 01
>HK?*
Sequential zipping of an A+B file
encoding A better and better
Matching process on A Matching process on B
encoding B with a code optimal for A
optimizing progressively the code on B (measuring the relative entropy)
B file A file
(Learning A)
(Learning B)
5 C + '107 ('''+(1 1
800: 7 0 ('' 7 I 88% +'%
8001'01 +'+ 8
+1(&6)17 "16+'17 1
' 6 0+ 2 ( 0 0 8=
#*
$1+0215-0'' +!$428
!+* 5+ ' 10 1 + !$4 2 8 ++(
10* < ' 1 20 + "L /K# ' 1 '
" LH#* 5 1 '
0 +' 3 ' 6
0
' 13 1 + "L/K#* 4 13
' 01 3 1 + ' '3 0 8
6* 41 36101
1 %101+'1 +* $
3 6 '' '1 1 + 1
'3 *
$ +' +'+1 + 6
7 7 1"$$1+#0 ' +2
8+* % '"!+# 8
+*
5'316 "
+ #
' 21 +* $ 13
' 6
0 2 +" 3 #
1'%'803'6
3 16* < '%806 6
8%++ +81 8 % 1% 6 0 '+1 6
">K?1#*
4!+$6 "!$4#+'360
+1 *
4!$4 15-+'/K +80
' ' + + !+"!$4F # "!$4F
#* $ +' 8% 0 8C 5A$ A$* 5A$ "
$1+%+#:1++''=
!+% 0(* ,= 1+ + 1+ *
1 1+ % * A$ "
$1+%+#1+!+ "=
+'% * $ +' +'
//= 6+ 1#* 8 !+* 4
1 1% + 8 HM1 +
8*
1 +88'1+" 1 +
' 8%#+1+368*+
6 + 8% 6'D + 6+*
3 + ++'31'* $ 6'+
0 %8 +*
4 ' + 'C ' +
+'6'1%+* $ 6'+0
% ''*
*/-. *F/ */KF *H.H *KK
48C " '#1 3 * < ' 1
80 +81 +"'%1
' 2# +816 +*
5!+ 20'1+10 C
$ 3' 6+' %8%* A
3 1 6 8 8% '' 1
16+*
$ +% 3 '6 +' %8%
'' ' 1 '* 4 3 1 6
88%''81 116+*
$ 3'6+'%8%* 4
316+' 8%8116*
5 20'1+10 C
$ 3' 6+'%8%* A
3 1 6 8 8% '' 1
16+*
$ +% 3 ' 6 +' % 8%
'' ' 1 '* 4 3 1 6
88%''81 116+*
$ 7 1, 4 '% 8 HM1
1 + 8* 4 0 8 6
8 +0 80 8*
48'1: "'#**
80 +8 1 +"'% 1 '
2# +816 +*
5*- 3* ' 1 81 ' 1
1!+'%*
<' 5*F 1'81' 1
+'0'1+*
10+2 ++ * $ 0 0 + 8
+'%** 1+1+ '10'
0* A0 +%'01 1%C 0''%
0 0 % 21 +3 * 1 1
81+ %+2 + +11+ 86'
8% 1 ' 3 6 8 +'* < 0
0%+'+ 810
75 77 79 81 83 85 87 89 91 93 95 97 99 101
Topic number
0 0.2 0.4 0.6 0.8 1 1.2
Recall
ENEASAPETDC ENEASAPETC
5 -C C 81' 1 *
Æ % 0 +8 ' 0 8 +'* 4 ' 8+
0 1 68+'%+" 100#
15'*
<2''1 +006'
7 % 1 ' 1 087
0 '% '* $ '% 1 +''
0 02* <+0'8'* A '8%'1+
+6'' 17 ;16
8 6+1 +8+'* A
++%8' +2:88012'
+ 1+ '81 %'*
>? =8 N"KHK#$1+ * 0*
>-? 1"*# "-# $1+ 1+
1$$1+*G 0+, 8*
>? "KF.#++ %1 ++ *4 %+4
N -HCHKF--O/*
>F? J 2<B"#"KK#+'6%'%,%1$1+*<%
0 %*
>/? P%,"KKH# G++'6%''*
'-**
>? G$"K/H# +5 1$1+4%* 0Q2*
>H? "--# (''*,%0
75 77 79 81 83 85 87 89 91 93 95 97 99 101
Topic number
0 0.2 0.4 0.6 0.8 1 1.2
Recall
ENEASAPDTDC ENEASAPDTC ENEASAPDTA
5 C !+C 81 ' 1 *
>.? JN "KK#+ 1'%80 7 0
'' 3*$4$1+4%KC-.
-K-*
>K? , '"-# +'
+7 %*,% .CK-H*
>? "-# J'' 1+* $
+ )+' ,') $,;$ =
N %58 % *
>? JN+'"KHH#+17 +'*$
4*$1* 4*-C HF*
>-? '' "-# ++ +' 1 !+ 46
*$1+,1-/ '1
$$ -,$%*
75 77 79 81 83 85 87 89 91 93 95 97 99 101 0
0.2 0.4 0.6 0.8
1 AVERAGE
ENEASAPETDC ENEASAPETC
75 77 79 81 83 85 87 89 91 93 95 97 99 101
0 0.2 0.4 0.6 0.8 1
AVERAGE ENEASAPDTDC ENEASAPDTC ENEASAPDTA
ENGLISH
GERMAN
5 FC '81' 1 +'0
'1+* '''C * 0'C !+*