We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c924822 commit d181905 Copy full SHA for d181905
src/sentences/sentence_splitting.jl
@@ -120,7 +120,8 @@ function postproc_splits(sentences::AbstractString)
120
sentences = replace(sentences, r"(\bMs\.)\n" => s"\1 ")
121
sentences = replace(sentences, r"(\bMrs\.)\n" => s"\1 ")
122
123
-
+ # no sentence break between two words when no punctuation separates them
124
+ sentences=replace(sentences,r"([a-zA-Z0-9])\n([a-zA-Z0-9])"=>s"\1 \2")
125
126
127
# possible TODO: filter excessively long / short sentences
0 commit comments