Mentions légales du service

Skip to content
Snippets Groups Projects
Commit fbc4a960 authored by Clémence Laurent
Browse files

debug

parent 1a7279ca
No related branches found
No related tags found
No related merge requests found
......@@ -90,7 +90,7 @@ def altok_split_sentences(s, lang, weak_sbound = 0, less_lists = 0, noxml = 0, a
s = re.sub(r" ([:;:;]|)( +)", r" \1</s>\2<s>", s)
elif re.search(r"^km(_|$)", lang):
s = re.sub(r" ([។៕])( +)", r" \1</s>\2<s>", s)
- elif re.search(r"^th(_|$)", lang)::
+ elif re.search(r"^th(_|$)", lang):
pass
else:
s = re.sub(rf"([…\.:;\?\!])( +)([\"“”\˝] {maj.pattern}[^\"“”\˝<>]*[\.:;\?\!] [\"“”\˝])( +)({maj.pattern})", r"\1</s>\2<s>\3</s>\4<s>\5", s) # detection of sentences entirely surrounded by double quotes
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment