Skip to content

Commit

Permalink
Added missing defaults in Tokenizer
Browse files: browse the repository at this point in the history
  • Loading branch information
saif-ellafi committed Aug 18, 2019
1 parent 51f1f19 commit 76eaf77
Showing 1 changed file with 6 additions and 0 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -96,6 +96,12 @@ class Tokenizer(override val uid: String) extends AnnotatorApproach[TokenizerMod
$(splitChars)
}

// Registers default values for three Tokenizer parameters, so each has a
// value even when the caller never sets it explicitly.
// NOTE(review): how these params are consumed is outside this hunk — confirm
// against buildRuleFactory and the fitted model before changing any default.
setDefault(
// Regex source is `\S+` (backslash escaped for the string literal):
// one or more consecutive non-whitespace characters.
targetPattern -> "\\S+",
// Twelve single-character strings: . , ; : ! ? * - ( ) " '
// (the double quote is escaped inside its literal).
contextChars -> Array(".", ",", ";", ":", "!", "?", "*", "-", "(", ")", "\"", "'"),
// Default is true; presumably exception matching is case-sensitive unless
// overridden — TODO confirm where this flag is read.
caseSensitiveExceptions -> true
)

def buildRuleFactory: RuleFactory = {
val rules = ArrayBuffer.empty[String]

Expand Down

0 comments on commit 76eaf77

Please sign in to comment.