perl

 view release on metacpan or  search on metacpan

lib/unicore/auxiliary/SentenceBreakProperty.txt  view on Meta::CPAN

1611E..16129  ; Extend # Mn  [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK
1612A..1612C  ; Extend # Mc   [3] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL HA
1612D..1612F  ; Extend # Mn   [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA
16AF0..16AF4  ; Extend # Mn   [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE
16B30..16B36  ; Extend # Mn   [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM
16F4F         ; Extend # Mn       MIAO SIGN CONSONANT MODIFIER BAR
16F51..16F87  ; Extend # Mc  [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
16F8F..16F92  ; Extend # Mn   [4] MIAO TONE RIGHT..MIAO TONE BELOW
16FE4         ; Extend # Mn       KHITAN SMALL SCRIPT FILLER
16FF0..16FF1  ; Extend # Mc   [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY
1BC9D..1BC9E  ; Extend # Mn   [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK
1CF00..1CF2D  ; Extend # Mn  [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT
1CF30..1CF46  ; Extend # Mn  [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG
1D165..1D166  ; Extend # Mc   [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM
1D167..1D169  ; Extend # Mn   [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3
1D16D..1D172  ; Extend # Mc   [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5
1D17B..1D182  ; Extend # Mn   [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE
1D185..1D18B  ; Extend # Mn   [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE
1D1AA..1D1AD  ; Extend # Mn   [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO
1D242..1D244  ; Extend # Mn   [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME
1DA00..1DA36  ; Extend # Mn  [55] SIGNWRITING HEAD RIM..SIGNWRITING AIR SUCKING IN
1DA3B..1DA6C  ; Extend # Mn  [50] SIGNWRITING MOUTH CLOSED NEUTRAL..SIGNWRITING EXCITEMENT
1DA75         ; Extend # Mn       SIGNWRITING UPPER BODY TILTING FROM HIP JOINTS
1DA84         ; Extend # Mn       SIGNWRITING LOCATION HEAD NECK
1DA9B..1DA9F  ; Extend # Mn   [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6
1DAA1..1DAAF  ; Extend # Mn  [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16
1E000..1E006  ; Extend # Mn   [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE
1E008..1E018  ; Extend # Mn  [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU
1E01B..1E021  ; Extend # Mn   [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI
1E023..1E024  ; Extend # Mn   [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS
1E026..1E02A  ; Extend # Mn   [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA
1E08F         ; Extend # Mn       COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
1E130..1E136  ; Extend # Mn   [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D
1E2AE         ; Extend # Mn       TOTO SIGN RISING TONE
1E2EC..1E2EF  ; Extend # Mn   [4] WANCHO TONE TUP..WANCHO TONE KOINI
1E4EC..1E4EF  ; Extend # Mn   [4] NAG MUNDARI SIGN MUHOR..NAG MUNDARI SIGN SUTUH
1E5EE..1E5EF  ; Extend # Mn   [2] OL ONAL SIGN MU..OL ONAL SIGN IKIR
1E8D0..1E8D6  ; Extend # Mn   [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS
1E944..1E94A  ; Extend # Mn   [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA
E0020..E007F  ; Extend # Cf  [96] TAG SPACE..CANCEL TAG
E0100..E01EF  ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256

# Total code points: 2601

# ================================================

0085          ; Sep # Cc       <control-0085>
2028          ; Sep # Zl       LINE SEPARATOR
2029          ; Sep # Zp       PARAGRAPH SEPARATOR

# Total code points: 3

# ================================================

00AD          ; Format # Cf       SOFT HYPHEN
061C          ; Format # Cf       ARABIC LETTER MARK
070F          ; Format # Cf       SYRIAC ABBREVIATION MARK
180E          ; Format # Cf       MONGOLIAN VOWEL SEPARATOR
200B          ; Format # Cf       ZERO WIDTH SPACE
200E..200F    ; Format # Cf   [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK
202A..202E    ; Format # Cf   [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE
2060..2064    ; Format # Cf   [5] WORD JOINER..INVISIBLE PLUS
2066..206F    ; Format # Cf  [10] LEFT-TO-RIGHT ISOLATE..NOMINAL DIGIT SHAPES
FEFF          ; Format # Cf       ZERO WIDTH NO-BREAK SPACE
FFF9..FFFB    ; Format # Cf   [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATION TERMINATOR
13430..1343F  ; Format # Cf  [16] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE
1BCA0..1BCA3  ; Format # Cf   [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP
1D173..1D17A  ; Format # Cf   [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE
E0001         ; Format # Cf       LANGUAGE TAG

# Total code points: 60

# ================================================

0009          ; Sp # Cc       <control-0009>
000B..000C    ; Sp # Cc   [2] <control-000B>..<control-000C>
0020          ; Sp # Zs       SPACE
00A0          ; Sp # Zs       NO-BREAK SPACE
1680          ; Sp # Zs       OGHAM SPACE MARK
2000..200A    ; Sp # Zs  [11] EN QUAD..HAIR SPACE
202F          ; Sp # Zs       NARROW NO-BREAK SPACE
205F          ; Sp # Zs       MEDIUM MATHEMATICAL SPACE
3000          ; Sp # Zs       IDEOGRAPHIC SPACE

# Total code points: 20

# ================================================

0061..007A    ; Lower # L&  [26] LATIN SMALL LETTER A..LATIN SMALL LETTER Z
00AA          ; Lower # Lo       FEMININE ORDINAL INDICATOR
00B5          ; Lower # L&       MICRO SIGN
00BA          ; Lower # Lo       MASCULINE ORDINAL INDICATOR
00DF..00F6    ; Lower # L&  [24] LATIN SMALL LETTER SHARP S..LATIN SMALL LETTER O WITH DIAERESIS
00F8..00FF    ; Lower # L&   [8] LATIN SMALL LETTER O WITH STROKE..LATIN SMALL LETTER Y WITH DIAERESIS
0101          ; Lower # L&       LATIN SMALL LETTER A WITH MACRON
0103          ; Lower # L&       LATIN SMALL LETTER A WITH BREVE
0105          ; Lower # L&       LATIN SMALL LETTER A WITH OGONEK
0107          ; Lower # L&       LATIN SMALL LETTER C WITH ACUTE
0109          ; Lower # L&       LATIN SMALL LETTER C WITH CIRCUMFLEX
010B          ; Lower # L&       LATIN SMALL LETTER C WITH DOT ABOVE
010D          ; Lower # L&       LATIN SMALL LETTER C WITH CARON
010F          ; Lower # L&       LATIN SMALL LETTER D WITH CARON
0111          ; Lower # L&       LATIN SMALL LETTER D WITH STROKE
0113          ; Lower # L&       LATIN SMALL LETTER E WITH MACRON
0115          ; Lower # L&       LATIN SMALL LETTER E WITH BREVE
0117          ; Lower # L&       LATIN SMALL LETTER E WITH DOT ABOVE
0119          ; Lower # L&       LATIN SMALL LETTER E WITH OGONEK
011B          ; Lower # L&       LATIN SMALL LETTER E WITH CARON
011D          ; Lower # L&       LATIN SMALL LETTER G WITH CIRCUMFLEX
011F          ; Lower # L&       LATIN SMALL LETTER G WITH BREVE
0121          ; Lower # L&       LATIN SMALL LETTER G WITH DOT ABOVE
0123          ; Lower # L&       LATIN SMALL LETTER G WITH CEDILLA
0125          ; Lower # L&       LATIN SMALL LETTER H WITH CIRCUMFLEX
0127          ; Lower # L&       LATIN SMALL LETTER H WITH STROKE
0129          ; Lower # L&       LATIN SMALL LETTER I WITH TILDE
012B          ; Lower # L&       LATIN SMALL LETTER I WITH MACRON
012D          ; Lower # L&       LATIN SMALL LETTER I WITH BREVE
012F          ; Lower # L&       LATIN SMALL LETTER I WITH OGONEK
0131          ; Lower # L&       LATIN SMALL LETTER DOTLESS I
0133          ; Lower # L&       LATIN SMALL LIGATURE IJ
0135          ; Lower # L&       LATIN SMALL LETTER J WITH CIRCUMFLEX



( run in 0.809 second using v1.01-cache-2.11-cpan-71847e10f99 )