Module: PragmaticSegmenter::Languages::Common::SubSymbolsRules

Defined in:
lib/pragmatic_segmenter/languages/common.rb

Constant Summary

Period =
Rule.new(/∯/, '.')
ArabicComma =
Rule.new(/♬/, '،')
SemiColon =
Rule.new(/♭/, ':')
FullWidthPeriod =
Rule.new(/&ᓰ&/, '。')
SpecialPeriod =
Rule.new(/&ᓱ&/, '．')
FullWidthExclamation =
Rule.new(/&ᓳ&/, '！')
ExclamationPoint =
Rule.new(/&ᓴ&/, '!')
QuestionMark =
Rule.new(/&ᓷ&/, '?')
FullWidthQuestionMark =
Rule.new(/&ᓸ&/, '？')
MixedDoubleQE =
Rule.new(/☉/, '?!')
MixedDoubleQQ =
Rule.new(/☇/, '??')
MixedDoubleEQ =
Rule.new(/☈/, '!?')
MixedDoubleEE =
Rule.new(/☄/, '!!')
LeftParens =
Rule.new(/&✂&/, '(')
RightParens =
Rule.new(/&⌬&/, ')')
TemporaryEndingPunctutation =
Rule.new('ȸ', '')
Newline =
Rule.new(/ȹ/, "\n")
All =
[ Period, ArabicComma,
SemiColon, FullWidthPeriod,
SpecialPeriod, FullWidthExclamation,
ExclamationPoint, QuestionMark,
FullWidthQuestionMark, MixedDoubleQE,
MixedDoubleQQ, MixedDoubleEQ,
MixedDoubleEE, LeftParens,
RightParens, TemporaryEndingPunctutation,
Newline ]