Mentions légales du service

Skip to content
Snippets Groups Projects
Commit f5490ccd authored by Benoît Sagot
Browse files

git-svn-id: https://scm.gforge.inria.fr/authscm/cfourrie/svn/lingwb/MElt/trunk@5711 dc05b511-7f1d-0410-9f1c-d6f32a2df9e4
parent 0147686d
No related branches found
No related tags found
No related merge requests found
...@@ -673,7 +673,7 @@ sub tokenize_sequence { ...@@ -673,7 +673,7 @@ sub tokenize_sequence {
} }
s/(?<=[^\}]) Mr +\. / {Mr .} Mr. /go; s/(?<=[^\}]) Mr +\. / {Mr .} Mr. /go;
s/(?<=[^\}]) (autocad) / {$1} _SPECWORD_AutoCAD /gi; s/(?<=[^\}]) (autocad) / {$1} _SPECWORD_AutoCAD /gi;
if ($lang eq "en") { if ($lang eq "en") {
if ($expand_contractions) { if ($expand_contractions) {
s/(?<=[^\}]) ([cC]a)n't / {\1n't} \1n _UNSPLIT_not /goi; s/(?<=[^\}]) ([cC]a)n't / {\1n't} \1n _UNSPLIT_not /goi;
...@@ -686,7 +686,9 @@ sub tokenize_sequence { ...@@ -686,7 +686,9 @@ sub tokenize_sequence {
s/(?<=[^\}]) (I|you|he|she|we|they|there)'(ll) / {\1'll} \1 _UNSPLIT_will /goi; s/(?<=[^\}]) (I|you|he|she|we|they|there)'(ll) / {\1'll} \1 _UNSPLIT_will /goi;
s/(?<=[^\}]) (they)'(re) / {\1're} \1 _UNSPLIT_are /goi; s/(?<=[^\}]) (they)'(re) / {\1're} \1 _UNSPLIT_are /goi;
s/(?<=[^\}]) ([^ ]*[^ s_])'s / {\1's} \1 _UNSPLIT_'s /goi; s/(?<=[^\}]) ([^ ]*[^ s_])'s / {\1's} \1 _UNSPLIT_'s /goi;
s/(?<=[^\}]) ([^ _][^ ]*s)'(?=[a-z] )/ \1 _REGLUE___APOS__/goi;
s/(?<=[^\}]) ([^ _][^ ]*s)'(?!s |\}.)/ {\1'} \1 _UNSPLIT_'s /goi; s/(?<=[^\}]) ([^ _][^ ]*s)'(?!s |\}.)/ {\1'} \1 _UNSPLIT_'s /goi;
s/__APOS__/'/g;
} else { } else {
s/(?<=[^\}]) ([cC]a)n't / {\1n't} \1n _UNSPLIT_n't /goi; s/(?<=[^\}]) ([cC]a)n't / {\1n't} \1n _UNSPLIT_n't /goi;
s/(?<=[^\}]) ([Ww])on't / {\1on't} \1ill _UNSPLIT_n't /goi; s/(?<=[^\}]) ([Ww])on't / {\1on't} \1ill _UNSPLIT_n't /goi;
...@@ -698,7 +700,9 @@ sub tokenize_sequence { ...@@ -698,7 +700,9 @@ sub tokenize_sequence {
s/(?<=[^\}]) (they)'(re) / \1 '\2 /goi; s/(?<=[^\}]) (they)'(re) / \1 '\2 /goi;
s/(?<=[^\}]) ([^ ]*[^ s_])'s / \1 's /goi; s/(?<=[^\}]) ([^ ]*[^ s_])'s / \1 's /goi;
s/(?<=[^\}]) ([^ ]*[^ s_]){''} " ((?:_REGLUE_)?)s / {\1''s} \1 \2's /goi; s/(?<=[^\}]) ([^ ]*[^ s_]){''} " ((?:_REGLUE_)?)s / {\1''s} \1 \2's /goi;
s/(?<=[^\}]) ([^ _][^ ]*s)'(?=[a-z] )/ \1 _REGLUE___APOS__/goi;
s/(?<=[^\}]) ([^ _][^ ]*s)'(?!s |\}.)/ \1 {'} 's /goi; s/(?<=[^\}]) ([^ _][^ ]*s)'(?!s |\}.)/ \1 {'} 's /goi;
s/__APOS__/'/g;
} }
} elsif ($lang eq "fr") { } elsif ($lang eq "fr") {
s/(?<=[^\}]) ([Ss]) ' (\S+)/ {\1 '} \1' \2/goi; s/(?<=[^\}]) ([Ss]) ' (\S+)/ {\1 '} \1' \2/goi;
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment