Copyright | (c) Edward Kmett 2010 |
---|---|
License | BSD3 |
Maintainer | ekmett@gmail.com |
Stability | experimental |
Portability | portable |
Safe Haskell | Safe |
Language | Haskell98 |
Data.CharSet.Unicode
Contents
Description
Provides Unicode general categories, which are typically denoted by `\p{Ll}` or `\p{Modifier_Letter}`. Lookups can be constructed using `unicodeCategories`, or individual character sets can be used directly.
- data UnicodeCategory = UnicodeCategory String String CharSet String
- unicodeCategories :: [UnicodeCategory]
- modifierLetter :: CharSet
- otherLetter :: CharSet
- letter :: CharSet
- lowercaseLetter :: CharSet
- uppercaseLetter :: CharSet
- titlecaseLetter :: CharSet
- letterAnd :: CharSet
- nonSpacingMark :: CharSet
- spacingCombiningMark :: CharSet
- enclosingMark :: CharSet
- mark :: CharSet
- space :: CharSet
- lineSeparator :: CharSet
- paragraphSeparator :: CharSet
- separator :: CharSet
- mathSymbol :: CharSet
- currencySymbol :: CharSet
- modifierSymbol :: CharSet
- otherSymbol :: CharSet
- symbol :: CharSet
- decimalNumber :: CharSet
- letterNumber :: CharSet
- otherNumber :: CharSet
- number :: CharSet
- dashPunctuation :: CharSet
- openPunctuation :: CharSet
- closePunctuation :: CharSet
- initialQuote :: CharSet
- finalQuote :: CharSet
- connectorPunctuation :: CharSet
- otherPunctuation :: CharSet
- punctuation :: CharSet
- control :: CharSet
- format :: CharSet
- privateUse :: CharSet
- surrogate :: CharSet
- notAssigned :: CharSet
- other :: CharSet
Unicode General Category
Lookup
CharSets by UnicodeCategory
Letter
Letter&
Mark
Separator
Symbol
`mathSymbol :: CharSet`
Number
Punctuation
`finalQuote :: CharSet`
Other
`privateUse :: CharSet`