!"# $
Thierry Dutoit
Faculté Polytechnique de Mons
TCTS Lab
Ave. Copernic Ph: +32 65 374774
Parc Initialis Fax: +32 65 374729
B-7000 Mons Thierry.Dutoit at fpms.ac.be
Belgium http://tcts.fpms.ac.be/~dutoit
!"#
% & '( $)*+ ,( $)* ((+ -
%%($)* $$+'
. ,%. ( ( .
.$( + $ $ $
$, . ( ( %$ $ $
. ,&$/( (.$($
( $$/$0,
$ ($1+(2)34(., 522%
$ , . '$ ' ,
%. $0,((,4-1+
-67 $$ $
$ $+),$$,
%%( $ +)($,2"4
$ ( '4 $ 2'.$
%%$(,$ $"0- (1$+
-67(80'82'1.(
$ 2 ,$ ,$+ 8
($ . ( ( ( $
+ -67 ( $$% # 0-(. 9. :;;1
, / $ ((. / $ $ ,
4-+
$ %"&$'(%$'"
8$$<2,,$0++
,$ , ( ( $ & %. .
$=%. $ $=% $%1 $ > 0 ?1+
( . $ 8 ($
2+), ($.$%$$.
8%.( (.$(+
!)%(28
?
$'" (%$'"
3(0
(<>.<%>.$<$>1
(<>@A
(<>$
<%>
<>.<>.<>
(<$>.<>
$<( >
0($1
$=%.$ <>@A
: <><>@A
$=%$% <>@A
B$% 0($1
:$% 0($1
(.( <C>
$ <$>
$ <>
B(.: ( <>
"0<>$<>
D%1
<>
<> <>
<>0$ %1 <>
" 0%1 <>
9% <,>
) # . ( $. 2 8+#
$ (.., $//8&
“[Gengling on the genglish gengle of John gengle] It is gengle
gengle; gengle gengle is the gengle of gengling the gengle on the
gengle…”
$(8.,%$4- .
genglish_load_corpus.m.genglish_corpus, E8
0 ,$1,,$$,..
$ F 0+ ?1+ ( .
genglish_test_corpus 0 G ,$1. , , $ +
6?,$genglish_corpus&
» genglish_load_corpus;
» genglish_corpus(1:10,:)
ans =
'gengles' 'noun' 'gEN_l_z'
?
(% $ 28 $+ 2
,,$%$ $H%$$+
'are' 'auxiliary' 'a__'
'gengly' 'adverb' 'gEN_lI'
'the' 'determiner' 'D_@'
'gengle' 'noun' 'gEN_l_'
'of' 'of' 'Qv'
'gengle' 'noun' 'gEN_l_'
'.' 'punctuation' '_'
'on' 'preposition' 'Qn'
'the' 'determiner' 'D_@'
,. 8( (20$
( (1. ( . . $ $
(+) .8( 0%(21.
% $ % ( 0 $ 1+ 8
( ( 2. , &
,$($.$+).8+
,(/ $/( (.,/(=
& +$$ (.
,%$# $ ,+
genglish_corpus = {
% Trigrams are simply an extension of bigrams.
% Gengles are gengly the gengle of gengle.
'gengles' 'noun' 'gEN_l_z'
'are' 'auxiliary' 'Ar_'
'gengly' 'adverb' 'gEN_lI'
'the' 'determiner' 'D_@'
'gengle' 'noun' 'gEN_l_'
'of' 'of' 'Qv'
'gengle' 'noun' 'gEN_l_'
'.' 'punctuation' '_'
% In the corresponding automaton, states correspond to a
% couple of part-of-speech categories.
% On the genglish gengle, gengles gengle on the gengle
% of gengle gengles.
'on' 'preposition' 'Qn'
'the' 'determiner' 'D_@'
'genglish' 'adjective' 'gEN_lIS_'
'gengle' 'noun' 'gEN_l_'
',' 'punctuation' '_'
'gengles' 'noun' 'gEN_l_z'
'gengle' 'verb' 'JEN_l_'
'on' 'preposition' 'Qn'
'the' 'determiner' 'D_@'
'gengle' 'noun' 'gEN_l_'
'of' 'of' 'Qv'
'gengle' 'noun' 'gEN_l_'
'gengles' 'noun' 'gEN_l_z'
'.' 'punctuation' '_'
. . .
*'8 01+
+,-.-
, , I $ . (
# ,$ , /,$ .
,F . , $$
# %%$+
"(($((.
(,$0((# $1.,%$
. $$ , $ 0/ < .
<.<.2.$<81+
(($ ( ($&