Zornitsa Kozareva USC/ISI Marina del Rey, CA · The first debate was in Oxford. A draw for Obama...
Transcript of Zornitsa Kozareva USC/ISI Marina del Rey, CA · The first debate was in Oxford. A draw for Obama...
CS544: Named Entity Discrimination
Zornitsa Kozareva!USC/ISI!
Marina del Rey, [email protected]!
www.isi.edu/~kozareva!
7(-8(50&9:;&9<==&
Search Engine
>?6&23&7*550&@6AA3B'!"##$&CD&%&''(,'-..$"//0'1!234!4'5676'-.8+$#9:;'<#;',,,'!"##$'=,'%&''()*&''(>+/+',".?'
-@<,%A8'7*550&@6AA3BC?*+DE"'-8"$+%#F/'@A/:'<#):".'+/'#'9A)*B$?))+)*'-8"$+%#)'GH'
/&AI'J$A.?%".'K;'LM:&'2"):?$;'CANO'#).'+/':&"'9A)*"/:B$?))+)*'J$A*$#8'AP'#);'Q+).'+)'
:&"'&+/:A$;'AP':&"'DDD'-99"*".'R+99"$'S#.'S")+".'TA).O'!"$E+%"/'!":' PA$'GIA'U+V9"'W+$9.,'-' ' X?.*"'&#.'.")+".'
KA).' PA$' !"##$) %&''(,' DDD' !"##$) %&''(O' I&A' +/' #%%?/".' AP' Q+99+)*' &+/' YB;"#$BA9.+)' :&+/'?).#:".'DDD'
7*550&@6AA3B'<+Q+J".+#O' :&"'P$""'")%;%9AJ".+#&S$,'!"##$'=,'%&''(' ZKA$)'L['\#)?#$;']Y5L^'+/'#'J$A8+)"):'$"/"#$%&"$'+)':&"'_"9./'AP'9''<A$9.'@#$D#9'-$:/'W#8"/'=#)Q0'`$.'S#)O'S+/%+J9+)"0'\?B\?:/?'4//?".'T;0'!"##$)%&''('
]M:&'S#)'=#)Q0']/:'
&&&E2/?&'()*+&,-./0&C*46F-2.6-& GCH&I,C&
a'
''''a'
a'
L'
NE Recognition vs. NE Discrimination
• NE Recognition = detection and classification of entity mentions into a predefined set of categories.
→ achieves only a partial disambiguation of names
• NE Discrimination = finding the actual entity denoted
by a particular name occurrence in text.
I,C&
a'
''''a'
a'
`'
Ideally, we want
Jerry Hobbs, a fifth generation farmer,
Wayne Cryts finished harvesting his crop
Jerry Hobbs is the rage-filled, domestic-
abusing career criminal who killed his
Jerry Hobbs, who is accused of killing his 8-year-old daughter and her best
Dr. Jerry R. Hobbs is a prominent researcher
in the fields of computational linguistic
Jerry R. Hobbs. Address: USC/ISI 4676 Admiralty Way .
5'
http://search.intelius.com/
U.S. Census Bureau states 90,000 names are shared by 100,000,000 people
The first debate was in Oxford.
The first debate was in Oxford. A draw for Obama would be considered a win.
He is seen as a national hero by those who live in Georgia after the independence from the USSR.
Importance of NE Discrimination
• Queries about NEs constitute a significant portion of Web queries:
– 11-17% contain person name*
– 4% are about a person name
• Ideally, search results should be clustered such that each cluster corresponds to the same individual
– faster fact extraction
– more accurate information retrieval
8 * study by Javier Artiles, 2009
On the Web …
• Nobody knows how many senses (meanings) are
there for a given person name
• It is impossible to estimate and trace the most
frequent sense
– the task is time consuming and tedious for humans
– new Web pages constantly appear
– old Web pages might be deleted over time
9
Why is it called “Discrimination”?
Discrimination
- the total number of senses is unknown
- the meaning of each sense is unknown
- no specific mapping of cluster → sense
Disambiguation
- the total number of senses is known
- the meaning of each sense is known
- the order is based on the frequency
meaning 1:
           the slope beside a body of water
meaning 2:
           depository financial institution
T&
bank   Jerry Hobbs
group1
group 2
group 3
]M'
]]'
http://search.carrot2.org/stable/search
Carrot Search Results Clustering Engine
Today
12
http://search.carrot-search.com/carrot2-webapp/search
Carrot Search
Today
Clustering
Unsupervised Learning
• Labels must be automatically discovered
• Method: clustering
• Tasks which can be resolved: Named Entity
Disambiguation, any type of Text Classification
task
14
Clustering
• Are there any “groups” in the data?  • What is each group?
• How many?
• How to identify them?
15
What is Clustering?
• Clustering is the process of grouping a set of objects into classes of similar objects
• A common and important task that finds many
applications in Science, Engineering among
others
– group genes that perform the same function
– group individuals that have similar political views
– identify similar objects from pictures
– categorize documents of similar topics
– disambiguate named entities (in our case) 16
Issues in Clustering
• What is a natural grouping among these objects?
• What makes objects “related”?
– “similarity/distance” metric
• Representation for objects → through vector space
• How many clusters?
 - fixed a priori
 - completely data driven
 - avoid “trivial” clusters - too large or small
• Clustering Algorithms
 → Partition algorithms
 → Hierarchical algorithms 17
What is the natural grouping
among these objects?
18
What is the natural grouping
among these objects?
19
19
Clustering by
color  size
What is Similarity?
20
• Hard to define, but we know it when we see it. • Easier to think in terms of the distance between vectors
Properties of distance measure
• D(A,B) = D(B,A)   Symmetry
• D(A,A) = 0   Constancy of Self-Similarity
• D(A,B) = 0 if A = B   Positivity Separation
• D(A,B) ≤ D(A,C) + D(B,C)   Triangular Inequality
21
Properties of distance measure
• D(A,B) = D(B,A)   Symmetry   Otherwise you could claim that “Alex looks like Bob, but
Bob looks nothing like Alex”
• D(A,A) = 0   Constancy of Self-Similarity
• D(A,B) = 0 if A = B   Positivity Separation
• D(A,B) ≤ D(A,C) + D(B,C)   Triangular Inequality
22
Properties of distance measure
• D(A,B) = D(B,A)   Symmetry   Otherwise you could claim that “Alex looks like Bob, but
Bob looks nothing like Alex”
• D(A,A) = 0   Constancy of Self-Similarity   Otherwise you could claim that “Alex looks more like Bob,
than Bob does”
• D(A,B) = 0 if A = B   Positivity Separation
• D(A,B) ≤ D(A,C) + D(B,C)   Triangular Inequality
23
Properties of distance measure
• D(A,B) = D(B,A)   Symmetry   Otherwise you could claim that “Alex looks like Bob, but
Bob looks nothing like Alex”
• D(A,A) = 0   Constancy of Self-Similarity   Otherwise you could claim that “Alex looks more like Bob,
than Bob does”
• D(A,B) = 0 if A = B   Positivity Separation   Otherwise there are objects in your world that are
different, but you cannot tell apart
• D(A,B) ≤ D(A,C) + D(B,C)   Triangular Inequality  24
Properties of distance measure
• D(A,B) = D(B,A)   Symmetry   Otherwise you could claim that “Alex looks like Bob, but
Bob looks nothing like Alex”
• D(A,A) = 0   Constancy of Self-Similarity   Otherwise you could claim that “Alex looks more like Bob,
than Bob does”
• D(A,B) = 0 if A = B   Positivity Separation   Otherwise there are objects in your world that are
different, but you cannot tell apart
• D(A,B) ≤ D(A,C) + D(B,C)   Triangular Inequality   Otherwise you could claim that “Alex is very like Bob and
Alex is very like Carl, but Bob is very unlike Carl”  25
Distance measures
• Given two objects x and y both with n values

calculate the Euclidean distance as
L6'
$$d(x, y) = \sqrt{\sum_{i=1}^{p} \left( x_i - y_i \right)^2}$$
$$x = (x_1, x_2, \ldots, x_n)$$
$$y = (y_1, y_2, \ldots, y_n)$$
Bottom-up Clustering
- Begin with each element in a separate cluster
- Merge clusters into successively larger clusters
- Repeat until one cluster is left
27
Recommended reading: Chapter 14 on Clustering from the book by Manning & Schütze
Top-down Clustering
- Begin with all elements in a whole cluster
- Divide clusters into successively smaller
clusters
- Repeat until all elements are in singleton
clusters
28
Recommended reading: Chapter 14 on Clustering from the book by Manning & Schütze
Cluster Proximity Estimate
• Single-Link – Nearest Neighbor: the closest members
• Complete-Link
– Furthest Neighbor: the furthest members
• Centroid – Centers of gravity
29
Partitioning Clustering
• Constructs a partition of n objects into a set of K clusters • K-means algorithm:
Input: Desired number of clusters, k
Initialize: the k cluster centers (random if necessary)
Iterate:
1. Decide the class memberships of the N objects by assigning them to the
nearest cluster centroids (mean)
2. Re-estimate the k clusters, by assuming the memberships found above are
correct
Terminate:
If none of the N objects changed membership in the last iteration, exit
30
$$\mu_k = \frac{1}{c_k} \sum_{i \in C_k} x_i$$
Back to NE Discrimination
Text Snippet
• A small fragment of text that contains from
one to three sentences
32
Dr. Jerry R. Hobbs (born 25 January 1942) is a prominent researcher in the fields of computational linguistics, discourse analysis, and artificial
Jerry Hobbs is the rage-filled, domestic-abusing career criminal who killed his 8-year-old daughter and her 9-year-old friend, with scarcely ...
Problem Formulation
• Input: – N text snippets that mention a particular proper
name (it can be person, organization or location)
• Output: – K clusters, where each cluster has text snippets that are similar to each other and different from
the snippets in the rest of the clusters
33
Input
• Dr. Jerry R. Hobbs (born 25 January 1942) is a prominent researcher in the fields of computational linguistics, discourse analysis, and artificial
• Jerry Hobbs is the rage-filled, domestic-abusing career criminal who killed his 8-year-old daughter and her 9-year-old friend, with scarcely ...
• Jerry Hobbs, Author. A fifth generation farmer, Wayne Cryts finished harvesting his crop in the fall of 1980 and hauled more than 32000 bushels of soybeans ...
• Jerry Hobbs, who is accused of killing his 8-year-old daughter and her best ... On Wednesday, a judge denied bail for Jerry Hobbs, 34, ...
• Fugitives | Jerry Hobbs - Brief - Father Denied Bail Awaits Trial For Children's Murders Jerry Branton Hobbs accused of the stabbing deaths ...
• Jerry R. Hobbs. Address: USC/ISI 4676 Admiralty Way ... Jerry R. Hobbs hobbs@isi.edu. USC/ISI, 4676 Admiralty Way, Marina del Rey, CA 90292
34
Output • Cluster 1:
– Dr. Jerry R. Hobbs (born 25 January 1942) is a prominent researcher in the fields of computational linguistics, discourse analysis, and artificial
– Jerry R. Hobbs. Address: USC/ISI 4676 Admiralty Way ... Jerry R. Hobbs hobbs@isi.edu. USC/ISI, 4676 Admiralty Way, Marina del Rey, CA 90292
• Cluster 2: – Jerry Hobbs is the rage-filled, domestic-abusing career criminal who killed his
8-year-old daughter and her 9-year-old friend, with scarcely ... – Jerry Hobbs, who is accused of killing his 8-year-old daughter and her best ...
On Wednesday, a judge denied bail for Jerry Hobbs, 34, … – Fugitives | Jerry Hobbs - Brief - Father Denied Bail Awaits Trial For Children's
Murders Jerry Branton Hobbs accused of the stabbing deaths ...
• Cluster 3: – Jerry Hobbs, Author. A fifth generation farmer, Wayne Cryts finished
harvesting his crop in the fall of 1980 and hauled more than 32000 bushels of soybeans ....
35
Underlying Premise*
• You shall know a word by the company it keeps
– Firth, 1957 (Studies in Linguistic Analysis)
• Meanings of words are determined by their
distributional patterns (Distributional Hypothesis)
– Harris, 1968 (Mathematical Structures of Language)
• Words that occur in similar contexts will have similar
meanings (Strong Contextual Hypothesis)
– Miller and Charles, 1991 (Language and Cognitive
    Processes)
36 * This slide is adapted from a tutorial of Ted Pedersen
37
cluster snippets
Jerry Hobbs is the rage-filled, domestic-
abusing career criminal who killed his  Jerry Hobbs, who is accused of killing his 9-year-old daughter and her best
Dr. Jerry R. Hobbs is a prominent researcher in
the fields of computational linguistic
Jerry R. Hobbs. Address: USC/ISI 4676 Admiralty Way .
Jerry Hobbs, a fifth generation farmer,
Wayne Cryts finished harvesting his crop
s1 s2 … sn
teach 2 0 … 7
kill 10 2 … 3
child 1 3 … 0 text snippet representation
snippet similarity
Collection of text snippets containing the name of interest
Text Snippet Representation
• The context of each snippet is represented by a vector with M dimensions
• Each dimension indicates whether a particular feature
occurred in the context
– the value can be binary, frequency count etc.
• The features capture the characteristics of the context to be clustered
• Intuitively, vectors/contexts that share the same
features will be similar to each other
38
Contexts (input text snippets)
• Cnt1: Dr. Jerry R. Hobbs (born 25 January 1942) is a prominent researcher in the fields of computational linguistics, discourse analysis, and artificial
• Cnt2: Jerry Hobbs is the rage-filled, domestic-abusing career criminal who killed his 8-year-old daughter and her 9-year-old friend, with scarcely ...
• Cnt3: Jerry Hobbs, Author. A fifth generation farmer, Wayne Cryts finished harvesting his crop in the fall of 1980 and hauled more than 32000 bushels of soybeans ...
• Cnt4: Jerry Hobbs, who is accused of killing his 9-year-old daughter and her best ... On Wednesday, a judge denied bail for Jerry Hobbs, 34, ...
39
Text Snippet Features (1)
• Unigram → a single word that occurs more
than a given number of times
40
kill   artificial   researcher   …   daughter
Cnt1:  0  1  1  0
Cnt2:  1  0  0  1
Cnt3:  0  0  0  0
Cnt4:  1  0  0  1
binary values
Text Snippet Features (1)
• Unigram → a single word that occurs more
than a given number of times

41
• kill   1000
• artificial   500
• researcher   200
…
• daughter   100
frequency estimated from corpus
kill   artificial   researcher   …   daughter
Cnt1:  0  500  200  0
Cnt2:  1000  0  0  100
Cnt3:  0  0  0  0
Cnt4:  1000  0  0  100
frequency values
Text Snippet Features (2)
• Bigram → an ordered pair of words that occur
together more often than expected by chance
42
kill his   prominent researcher   criminal who   …   8-year-old daughter
Cnt1:  0  1  0  0
Cnt2:  1  0  1  1
Cnt3:  0  0  0  0
Cnt4:  1  0  0  1
binary values
Text Snippet Features (2) • Bigram → an ordered pair of words that occur
together more often than expected by chance
43
kill his   prominent researcher   criminal who   …   8-year-old daughter
Cnt1:  0  102.9  0  0
Cnt2:  21.2  0  68.5  35.9
Cnt3:  0  0  0  0
Cnt4:  21.2  0  0  35.9
frequency weights
• kill his   21.2
• prominent researcher   102.9
• criminal who   68.5
…
• 8-year-old daughter   35.9
, log-likelihood scores based on
frequency estimated from corpus
$$-\log P(w_1 \mid w_0)$$
Text Snippet Clustering
• group text snippets by similar meaning
• snippet similarity is calculated as
44
kill   artificial   researcher   daughter
Cnt1:  0  1  1  0
Cnt2:  1  0  0  1
Cnt3:  0  0  0  0
Cnt4:  1  0  0  1
$$\mathrm{sim}(Cnt_1, Cnt_2) = \sum_{i=1}^{n} w_{1i} \cdot w_{2i}$$
sim(Cnt1,Cnt2)=(0*1)+(1*0)+(1*0)+(0*1)=0
sim(Cnt1,Cnt3)=(0*0)+(1*0)+(1*0)+(0*0)=0
sim(Cnt1,Cnt4)=(0*1)+(1*0)+(1*0)+(0*1)=0
sim(Cnt2,Cnt3)=(1*0)+(0*0)+(0*0)+(0*0)=0
sim(Cnt2,Cnt4)=(1*1)+(0*0)+(0*0)+(1*1)=2
sim(Cnt3,Cnt4)=(0*1)+(0*0)+(0*0)+(0*1)=0
Final Output
• Each cluster consists of a certain number of text snippets, i.e. small text fragments
• For each cluster assign cluster labels: – top 10 most significant bigrams of each cluster act
as a descriptive label
– top 10 most unique bigrams for each cluster act as
discriminating label
45
Cluster Evaluation
• Internal criterion – intra-class high similarity
– inter-class low similarity
– the quality depends on the object representation and the similarity measure used
• External criterion for clustering quality – measure the ability to discover the named entity groups in the gold standard data
– assess the clustering with respect to ground truth
46
47
What other features can one use?
Ideas for more features if we use structured text
like Wikipedia
Page Titles (ID)
Disambiguation text
Ideas for more features if we use structured text
like Wikipedia
Category
Ideas for more features if we use structured text
like Wikipedia
Redirect page titles
Ideas for more features if we use structured text
like Wikipedia
Hyperlinks
Ideas for more features if we use structured text
like Wikipedia
Web People Search Challenge
• The first challenge was organized in 2007
• WePS focuses on person and organization name
disambiguation of Web pages
• For each ambiguous name, the system must return the
documents and the attributes which are relevant for the
different senses of the name
• Last such challenge was on 1st of July 2010
• More information at: http://nlp.uned.es/weps/
53
Name Discrimination Demo
• SenseClusters by Ted Pedersen http://marimba.d.umn.edu/cgi-bin/SC-cgi/index.cgi
• The software can be used for: – proper name discrimination
– word sense discrimination
– e-mail clustering
– synonym finding
54
What would you do with clustering?
55
What would you do with clustering?
• E-mail spam classification
• Organize the documents into multiple
categories like Google news
• Trace what two people would talk about • Sentiment analysis
• Tweet trend identification • Tweet topic detection • …
56