Module: PragmaticSegmenter::Languages::Common::SubSymbolsRules
- Defined in:
- lib/pragmatic_segmenter/languages/common.rb
Constant Summary
- Period =
Rule.new(/∯/, '.')
- ArabicComma =
Rule.new(/♬/, '،')
- SemiColon =
Rule.new(/♭/, ':')
- FullWidthPeriod =
Rule.new(/&ᓰ&/, '。')
- SpecialPeriod =
Rule.new(/&ᓱ&/, '．')
- FullWidthExclamation =
Rule.new(/&ᓳ&/, '！')
- ExclamationPoint =
Rule.new(/&ᓴ&/, '!')
- QuestionMark =
Rule.new(/&ᓷ&/, '?')
- FullWidthQuestionMark =
Rule.new(/&ᓸ&/, '？')
- MixedDoubleQE =
Rule.new(/☉/, '?!')
- MixedDoubleQQ =
Rule.new(/☇/, '??')
- MixedDoubleEQ =
Rule.new(/☈/, '!?')
- MixedDoubleEE =
Rule.new(/☄/, '!!')
- LeftParens =
Rule.new(/&✂&/, '(')
- RightParens =
Rule.new(/&⌬&/, ')')
- TemporaryEndingPunctutation =
Rule.new('ȸ', '')
- Newline =
Rule.new(/ȹ/, "\n")
- All =
[ Period, ArabicComma, SemiColon, FullWidthPeriod, SpecialPeriod, FullWidthExclamation, ExclamationPoint, QuestionMark, FullWidthQuestionMark, MixedDoubleQE, MixedDoubleQQ, MixedDoubleEQ, MixedDoubleEE, LeftParens, RightParens, TemporaryEndingPunctutation, Newline ]