| 1 | # PropertyValueAliases-4.1.0.txt |
| 2 | # Date: 2005-03-28, 17:21:48 GMT [MD] |
| 3 | # |
| 4 | # Unicode Character Database |
| 5 | # Copyright (c) 1991-2005 Unicode, Inc. |
| 6 | # For terms of use, see http://www.unicode.org/terms_of_use.html |
| 7 | # For documentation, see UCD.html |
| 8 | # |
| 9 | # This file contains aliases for property values used in the UCD. |
| 10 | # These names can be used for XML formats of UCD data, for regular-expression |
| 11 | # property tests, and other programmatic textual descriptions of Unicode data. |
| 12 | # For information on which properties are normative, see UCD.html. |
| 13 | # |
| 14 | # The names may be translated in appropriate environments, and additional |
| 15 | # aliases may be useful. |
| 16 | # |
| 17 | # FORMAT |
| 18 | # |
| 19 | # Each line describes a property value name. |
| 20 | # This consists of three or more fields, separated by semicolons. |
| 21 | # |
| 22 | # First Field: The first field describes the property for which that |
| 23 | # property value name is used. |
| 24 | # |
| 25 | # Second Field: The second field is an abbreviated name. |
| 26 | # If there is no abbreviated name available, the field is marked with "n/a". |
| 27 | # |
| 28 | # Third Field: The third field is a long name. |
| 29 | # |
| 30 | # In the case of ccc, there are 4 fields. The second field is numeric, third |
| 31 | # is abbreviated, and fourth is long. |
| 32 | # |
| 33 | # The above are the preferred aliases. Other aliases may be listed in additional fields. |
| 34 | # |
| 35 | # Loose matching should be applied to all property names and property values, with |
| 36 | # the exception of String Property values. With loose matching of property names and |
| 37 | # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property |
| 38 | # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1". |
| 39 | # |
| 40 | # NOTE: Property value names are NOT unique across properties. For example: |
| 41 | # |
| 42 | # AL means Arabic Letter for the Bidi_Class property, and |
| 43 | # AL means Above_Left for the Canonical_Combining_Class property, and |
| 44 | # AL means Alphabetic for the Line_Break property. |
| 45 | # |
| 46 | # In addition, some property names may be the same as some property value names. |
| 47 | # For example: |
| 48 | # |
| 49 | # sc means the Script property, and |
| 50 | # Sc means the General_Category property value Currency_Symbol (Sc) |
| 51 | # |
| 52 | # The combination of property value and property name is, however, unique. |
| 53 | # |
| 54 | # For more information, see UTS #18: Regular Expression Guidelines |
| 55 | # ================================================ |
| 56 | |
| 57 | |
| 58 | # Age (age) |
| 59 | |
| 60 | age; n/a ; 1.1 |
| 61 | age; n/a ; 2.0 |
| 62 | age; n/a ; 2.1 |
| 63 | age; n/a ; 3.0 |
| 64 | age; n/a ; 3.1 |
| 65 | age; n/a ; 3.2 |
| 66 | age; n/a ; 4.0 |
| 67 | age; n/a ; 4.1 |
| 68 | age; n/a ; unassigned |
| 69 | |
| 70 | # Bidi_Class (bc) |
| 71 | |
| 72 | bc ; AL ; Arabic_Letter |
| 73 | bc ; AN ; Arabic_Number |
| 74 | bc ; B ; Paragraph_Separator |
| 75 | bc ; BN ; Boundary_Neutral |
| 76 | bc ; CS ; Common_Separator |
| 77 | bc ; EN ; European_Number |
| 78 | bc ; ES ; European_Separator |
| 79 | bc ; ET ; European_Terminator |
| 80 | bc ; L ; Left_To_Right |
| 81 | bc ; LRE ; Left_To_Right_Embedding |
| 82 | bc ; LRO ; Left_To_Right_Override |
| 83 | bc ; NSM ; Nonspacing_Mark |
| 84 | bc ; ON ; Other_Neutral |
| 85 | bc ; PDF ; Pop_Directional_Format |
| 86 | bc ; R ; Right_To_Left |
| 87 | bc ; RLE ; Right_To_Left_Embedding |
| 88 | bc ; RLO ; Right_To_Left_Override |
| 89 | bc ; S ; Segment_Separator |
| 90 | bc ; WS ; White_Space |
| 91 | |
| 92 | # Block (blk) |
| 93 | |
| 94 | blk; n/a ; Aegean_Numbers |
| 95 | blk; n/a ; Alphabetic_Presentation_Forms |
| 96 | blk; n/a ; Ancient_Greek_Musical_Notation |
| 97 | blk; n/a ; Ancient_Greek_Numbers |
| 98 | blk; n/a ; Arabic |
| 99 | blk; n/a ; Arabic_Presentation_Forms-A |
| 100 | blk; n/a ; Arabic_Presentation_Forms-B |
| 101 | blk; n/a ; Arabic_Supplement |
| 102 | blk; n/a ; Armenian |
| 103 | blk; n/a ; Arrows |
| 104 | blk; n/a ; Basic_Latin |
| 105 | blk; n/a ; Bengali |
| 106 | blk; n/a ; Block_Elements |
| 107 | blk; n/a ; Bopomofo |
| 108 | blk; n/a ; Bopomofo_Extended |
| 109 | blk; n/a ; Box_Drawing |
| 110 | blk; n/a ; Braille_Patterns |
| 111 | blk; n/a ; Buginese |
| 112 | blk; n/a ; Buhid |
| 113 | blk; n/a ; Byzantine_Musical_Symbols |
| 114 | blk; n/a ; Cherokee |
| 115 | blk; n/a ; CJK_Compatibility |
| 116 | blk; n/a ; CJK_Compatibility_Forms |
| 117 | blk; n/a ; CJK_Compatibility_Ideographs |
| 118 | blk; n/a ; CJK_Compatibility_Ideographs_Supplement |
| 119 | blk; n/a ; CJK_Radicals_Supplement |
| 120 | blk; n/a ; CJK_Strokes |
| 121 | blk; n/a ; CJK_Symbols_and_Punctuation |
| 122 | blk; n/a ; CJK_Unified_Ideographs |
| 123 | blk; n/a ; CJK_Unified_Ideographs_Extension_A |
| 124 | blk; n/a ; CJK_Unified_Ideographs_Extension_B |
| 125 | blk; n/a ; Combining_Diacritical_Marks |
| 126 | blk; n/a ; Combining_Diacritical_Marks_for_Symbols |
| 127 | blk; n/a ; Combining_Diacritical_Marks_Supplement |
| 128 | blk; n/a ; Combining_Half_Marks |
| 129 | blk; n/a ; Control_Pictures |
| 130 | blk; n/a ; Coptic |
| 131 | blk; n/a ; Currency_Symbols |
| 132 | blk; n/a ; Cypriot_Syllabary |
| 133 | blk; n/a ; Cyrillic |
| 134 | blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary |
| 135 | blk; n/a ; Deseret |
| 136 | blk; n/a ; Devanagari |
| 137 | blk; n/a ; Dingbats |
| 138 | blk; n/a ; Enclosed_Alphanumerics |
| 139 | blk; n/a ; Enclosed_CJK_Letters_and_Months |
| 140 | blk; n/a ; Ethiopic |
| 141 | blk; n/a ; Ethiopic_Extended |
| 142 | blk; n/a ; Ethiopic_Supplement |
| 143 | blk; n/a ; General_Punctuation |
| 144 | blk; n/a ; Geometric_Shapes |
| 145 | blk; n/a ; Georgian |
| 146 | blk; n/a ; Georgian_Supplement |
| 147 | blk; n/a ; Glagolitic |
| 148 | blk; n/a ; Gothic |
| 149 | blk; n/a ; Greek_and_Coptic |
| 150 | blk; n/a ; Greek_Extended |
| 151 | blk; n/a ; Gujarati |
| 152 | blk; n/a ; Gurmukhi |
| 153 | blk; n/a ; Halfwidth_and_Fullwidth_Forms |
| 154 | blk; n/a ; Hangul_Compatibility_Jamo |
| 155 | blk; n/a ; Hangul_Jamo |
| 156 | blk; n/a ; Hangul_Syllables |
| 157 | blk; n/a ; Hanunoo |
| 158 | blk; n/a ; Hebrew |
| 159 | blk; n/a ; High_Private_Use_Surrogates |
| 160 | blk; n/a ; High_Surrogates |
| 161 | blk; n/a ; Hiragana |
| 162 | blk; n/a ; Ideographic_Description_Characters |
| 163 | blk; n/a ; IPA_Extensions |
| 164 | blk; n/a ; Kanbun |
| 165 | blk; n/a ; Kangxi_Radicals |
| 166 | blk; n/a ; Kannada |
| 167 | blk; n/a ; Katakana |
| 168 | blk; n/a ; Katakana_Phonetic_Extensions |
| 169 | blk; n/a ; Kharoshthi |
| 170 | blk; n/a ; Khmer |
| 171 | blk; n/a ; Khmer_Symbols |
| 172 | blk; n/a ; Lao |
| 173 | blk; n/a ; Latin-1_Supplement |
| 174 | blk; n/a ; Latin_Extended-A |
| 175 | blk; n/a ; Latin_Extended-B |
| 176 | blk; n/a ; Latin_Extended_Additional |
| 177 | blk; n/a ; Letterlike_Symbols |
| 178 | blk; n/a ; Limbu |
| 179 | blk; n/a ; Linear_B_Ideograms |
| 180 | blk; n/a ; Linear_B_Syllabary |
| 181 | blk; n/a ; Low_Surrogates |
| 182 | blk; n/a ; Malayalam |
| 183 | blk; n/a ; Mathematical_Alphanumeric_Symbols |
| 184 | blk; n/a ; Mathematical_Operators |
| 185 | blk; n/a ; Miscellaneous_Mathematical_Symbols-A |
| 186 | blk; n/a ; Miscellaneous_Mathematical_Symbols-B |
| 187 | blk; n/a ; Miscellaneous_Symbols |
| 188 | blk; n/a ; Miscellaneous_Symbols_and_Arrows |
| 189 | blk; n/a ; Miscellaneous_Technical |
| 190 | blk; n/a ; Modifier_Tone_Letters |
| 191 | blk; n/a ; Mongolian |
| 192 | blk; n/a ; Musical_Symbols |
| 193 | blk; n/a ; Myanmar |
| 194 | blk; n/a ; New_Tai_Lue |
| 195 | blk; n/a ; No_Block |
| 196 | blk; n/a ; Number_Forms |
| 197 | blk; n/a ; Ogham |
| 198 | blk; n/a ; Old_Italic |
| 199 | blk; n/a ; Old_Persian |
| 200 | blk; n/a ; Optical_Character_Recognition |
| 201 | blk; n/a ; Oriya |
| 202 | blk; n/a ; Osmanya |
| 203 | blk; n/a ; Phonetic_Extensions |
| 204 | blk; n/a ; Phonetic_Extensions_Supplement |
| 205 | blk; n/a ; Private_Use_Area |
| 206 | blk; n/a ; Runic |
| 207 | blk; n/a ; Shavian |
| 208 | blk; n/a ; Sinhala |
| 209 | blk; n/a ; Small_Form_Variants |
| 210 | blk; n/a ; Spacing_Modifier_Letters |
| 211 | blk; n/a ; Specials |
| 212 | blk; n/a ; Superscripts_and_Subscripts |
| 213 | blk; n/a ; Supplemental_Arrows-A |
| 214 | blk; n/a ; Supplemental_Arrows-B |
| 215 | blk; n/a ; Supplemental_Mathematical_Operators |
| 216 | blk; n/a ; Supplemental_Punctuation |
| 217 | blk; n/a ; Supplementary_Private_Use_Area-A |
| 218 | blk; n/a ; Supplementary_Private_Use_Area-B |
| 219 | blk; n/a ; Syloti_Nagri |
| 220 | blk; n/a ; Syriac |
| 221 | blk; n/a ; Tagalog |
| 222 | blk; n/a ; Tagbanwa |
| 223 | blk; n/a ; Tags |
| 224 | blk; n/a ; Tai_Le |
| 225 | blk; n/a ; Tai_Xuan_Jing_Symbols |
| 226 | blk; n/a ; Tamil |
| 227 | blk; n/a ; Telugu |
| 228 | blk; n/a ; Thaana |
| 229 | blk; n/a ; Thai |
| 230 | blk; n/a ; Tibetan |
| 231 | blk; n/a ; Tifinagh |
| 232 | blk; n/a ; Ugaritic |
| 233 | blk; n/a ; Unified_Canadian_Aboriginal_Syllabics |
| 234 | blk; n/a ; Variation_Selectors |
| 235 | blk; n/a ; Variation_Selectors_Supplement |
| 236 | blk; n/a ; Vertical_Forms |
| 237 | blk; n/a ; Yi_Radicals |
| 238 | blk; n/a ; Yi_Syllables |
| 239 | blk; n/a ; Yijing_Hexagram_Symbols |
| 240 | |
| 241 | # Canonical_Combining_Class (ccc) |
| 242 | |
| 243 | ccc; 0; NR ; Not_Reordered |
| 244 | ccc; 1; OV ; Overlay |
| 245 | ccc; 7; NK ; Nukta |
| 246 | ccc; 8; KV ; Kana_Voicing |
| 247 | ccc; 9; VR ; Virama |
| 248 | ccc; 200; ATBL ; Attached_Below_Left |
| 249 | ccc; 202; ATB ; Attached_Below |
| 250 | ccc; 216; ATAR ; Attached_Above_Right |
| 251 | ccc; 218; BL ; Below_Left |
| 252 | ccc; 220; B ; Below |
| 253 | ccc; 222; BR ; Below_Right |
| 254 | ccc; 224; L ; Left |
| 255 | ccc; 226; R ; Right |
| 256 | ccc; 228; AL ; Above_Left |
| 257 | ccc; 230; A ; Above |
| 258 | ccc; 232; AR ; Above_Right |
| 259 | ccc; 233; DB ; Double_Below |
| 260 | ccc; 234; DA ; Double_Above |
| 261 | ccc; 240; IS ; Iota_Subscript |
| 262 | |
| 263 | # Decomposition_Type (dt) |
| 264 | |
| 265 | dt ; can ; Canonical |
| 266 | dt ; com ; Compat |
| 267 | dt ; enc ; Circle |
| 268 | dt ; fin ; Final |
| 269 | dt ; font ; Font |
| 270 | dt ; fra ; Fraction |
| 271 | dt ; init ; Initial |
| 272 | dt ; iso ; Isolated |
| 273 | dt ; med ; Medial |
| 274 | dt ; nar ; Narrow |
| 275 | dt ; nb ; Nobreak |
| 276 | dt ; none ; None |
| 277 | dt ; sml ; Small |
| 278 | dt ; sqr ; Square |
| 279 | dt ; sub ; Sub |
| 280 | dt ; sup ; Super |
| 281 | dt ; vert ; Vertical |
| 282 | dt ; wide ; Wide |
| 283 | |
| 284 | # East_Asian_Width (ea) |
| 285 | |
| 286 | ea ; A ; Ambiguous |
| 287 | ea ; F ; Fullwidth |
| 288 | ea ; H ; Halfwidth |
| 289 | ea ; N ; Neutral |
| 290 | ea ; Na ; Narrow |
| 291 | ea ; W ; Wide |
| 292 | |
| 293 | # General_Category (gc) |
| 294 | |
| 295 | gc ; C ; Other # Cc | Cf | Cn | Co | Cs |
| 296 | gc ; Cc ; Control ; cntrl |
| 297 | gc ; Cf ; Format |
| 298 | gc ; Cn ; Unassigned |
| 299 | gc ; Co ; Private_Use |
| 300 | gc ; Cs ; Surrogate |
| 301 | gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu |
| 302 | gc ; LC ; Cased_Letter # Ll | Lt | Lu |
| 303 | gc ; Ll ; Lowercase_Letter |
| 304 | gc ; Lm ; Modifier_Letter |
| 305 | gc ; Lo ; Other_Letter |
| 306 | gc ; Lt ; Titlecase_Letter |
| 307 | gc ; Lu ; Uppercase_Letter |
| 308 | gc ; M ; Mark # Mc | Me | Mn |
| 309 | gc ; Mc ; Spacing_Mark |
| 310 | gc ; Me ; Enclosing_Mark |
| 311 | gc ; Mn ; Nonspacing_Mark |
| 312 | gc ; N ; Number # Nd | Nl | No |
| 313 | gc ; Nd ; Decimal_Number ; digit |
| 314 | gc ; Nl ; Letter_Number |
| 315 | gc ; No ; Other_Number |
| 316 | gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps |
| 317 | gc ; Pc ; Connector_Punctuation |
| 318 | gc ; Pd ; Dash_Punctuation |
| 319 | gc ; Pe ; Close_Punctuation |
| 320 | gc ; Pf ; Final_Punctuation |
| 321 | gc ; Pi ; Initial_Punctuation |
| 322 | gc ; Po ; Other_Punctuation |
| 323 | gc ; Ps ; Open_Punctuation |
| 324 | gc ; S ; Symbol # Sc | Sk | Sm | So |
| 325 | gc ; Sc ; Currency_Symbol |
| 326 | gc ; Sk ; Modifier_Symbol |
| 327 | gc ; Sm ; Math_Symbol |
| 328 | gc ; So ; Other_Symbol |
| 329 | gc ; Z ; Separator # Zl | Zp | Zs |
| 330 | gc ; Zl ; Line_Separator |
| 331 | gc ; Zp ; Paragraph_Separator |
| 332 | gc ; Zs ; Space_Separator |
| 333 | |
| 334 | # Grapheme_Cluster_Break (GCB) |
| 335 | |
| 336 | GCB; CN ; Control |
| 337 | GCB; CR ; CR |
| 338 | GCB; EX ; Extend |
| 339 | GCB; L ; L |
| 340 | GCB; LF ; LF |
| 341 | GCB; LV ; LV |
| 342 | GCB; LVT ; LVT |
| 343 | GCB; T ; T |
| 344 | GCB; V ; V |
| 345 | GCB; XX ; Other |
| 346 | |
| 347 | # Hangul_Syllable_Type (hst) |
| 348 | |
| 349 | hst; L ; Leading_Jamo |
| 350 | hst; LV ; LV_Syllable |
| 351 | hst; LVT ; LVT_Syllable |
| 352 | hst; NA ; Not_Applicable |
| 353 | hst; T ; Trailing_Jamo |
| 354 | hst; V ; Vowel_Jamo |
| 355 | |
| 356 | # Joining_Group (jg) |
| 357 | |
| 358 | jg ; n/a ; Ain |
| 359 | jg ; n/a ; Alaph |
| 360 | jg ; n/a ; Alef |
| 361 | jg ; n/a ; Beh |
| 362 | jg ; n/a ; Beth |
| 363 | jg ; n/a ; Dal |
| 364 | jg ; n/a ; Dalath_Rish |
| 365 | jg ; n/a ; E |
| 366 | jg ; n/a ; Fe |
| 367 | jg ; n/a ; Feh |
| 368 | jg ; n/a ; Final_Semkath |
| 369 | jg ; n/a ; Gaf |
| 370 | jg ; n/a ; Gamal |
| 371 | jg ; n/a ; Hah |
| 372 | jg ; n/a ; Hamza_On_Heh_Goal |
| 373 | jg ; n/a ; He |
| 374 | jg ; n/a ; Heh |
| 375 | jg ; n/a ; Heh_Goal |
| 376 | jg ; n/a ; Heth |
| 377 | jg ; n/a ; Kaf |
| 378 | jg ; n/a ; Kaph |
| 379 | jg ; n/a ; Khaph |
| 380 | jg ; n/a ; Knotted_Heh |
| 381 | jg ; n/a ; Lam |
| 382 | jg ; n/a ; Lamadh |
| 383 | jg ; n/a ; Meem |
| 384 | jg ; n/a ; Mim |
| 385 | jg ; n/a ; No_Joining_Group |
| 386 | jg ; n/a ; Noon |
| 387 | jg ; n/a ; Nun |
| 388 | jg ; n/a ; Pe |
| 389 | jg ; n/a ; Qaf |
| 390 | jg ; n/a ; Qaph |
| 391 | jg ; n/a ; Reh |
| 392 | jg ; n/a ; Reversed_Pe |
| 393 | jg ; n/a ; Sad |
| 394 | jg ; n/a ; Sadhe |
| 395 | jg ; n/a ; Seen |
| 396 | jg ; n/a ; Semkath |
| 397 | jg ; n/a ; Shin |
| 398 | jg ; n/a ; Swash_Kaf |
| 399 | jg ; n/a ; Syriac_Waw |
| 400 | jg ; n/a ; Tah |
| 401 | jg ; n/a ; Taw |
| 402 | jg ; n/a ; Teh_Marbuta |
| 403 | jg ; n/a ; Teth |
| 404 | jg ; n/a ; Waw |
| 405 | jg ; n/a ; Yeh |
| 406 | jg ; n/a ; Yeh_Barree |
| 407 | jg ; n/a ; Yeh_With_Tail |
| 408 | jg ; n/a ; Yudh |
| 409 | jg ; n/a ; Yudh_He |
| 410 | jg ; n/a ; Zain |
| 411 | jg ; n/a ; Zhain |
| 412 | |
| 413 | # Joining_Type (jt) |
| 414 | |
| 415 | jt ; C ; Join_Causing |
| 416 | jt ; D ; Dual_Joining |
| 417 | jt ; L ; Left_Joining |
| 418 | jt ; R ; Right_Joining |
| 419 | jt ; T ; Transparent |
| 420 | jt ; U ; Non_Joining |
| 421 | |
| 422 | # Line_Break (lb) |
| 423 | |
| 424 | lb ; AI ; Ambiguous |
| 425 | lb ; AL ; Alphabetic |
| 426 | lb ; B2 ; Break_Both |
| 427 | lb ; BA ; Break_After |
| 428 | lb ; BB ; Break_Before |
| 429 | lb ; BK ; Mandatory_Break |
| 430 | lb ; CB ; Contingent_Break |
| 431 | lb ; CL ; Close_Punctuation |
| 432 | lb ; CM ; Combining_Mark |
| 433 | lb ; CR ; Carriage_Return |
| 434 | lb ; EX ; Exclamation |
| 435 | lb ; GL ; Glue |
| 436 | lb ; H2 ; H2 |
| 437 | lb ; H3 ; H3 |
| 438 | lb ; HY ; Hyphen |
| 439 | lb ; ID ; Ideographic |
| 440 | lb ; IN ; Inseparable ; Inseperable |
| 441 | lb ; IS ; Infix_Numeric |
| 442 | lb ; JL ; JL |
| 443 | lb ; JT ; JT |
| 444 | lb ; JV ; JV |
| 445 | lb ; LF ; Line_Feed |
| 446 | lb ; NL ; Next_Line |
| 447 | lb ; NS ; Nonstarter |
| 448 | lb ; NU ; Numeric |
| 449 | lb ; OP ; Open_Punctuation |
| 450 | lb ; PO ; Postfix_Numeric |
| 451 | lb ; PR ; Prefix_Numeric |
| 452 | lb ; QU ; Quotation |
| 453 | lb ; SA ; Complex_Context |
| 454 | lb ; SG ; Surrogate |
| 455 | lb ; SP ; Space |
| 456 | lb ; SY ; Break_Symbols |
| 457 | lb ; WJ ; Word_Joiner |
| 458 | lb ; XX ; Unknown |
| 459 | lb ; ZW ; ZWSpace |
| 460 | |
| 461 | # NFC_Quick_Check (NFC_QC) |
| 462 | |
| 463 | NFC_QC; M ; Maybe |
| 464 | NFC_QC; N ; No |
| 465 | NFC_QC; Y ; Yes |
| 466 | |
| 467 | # NFD_Quick_Check (NFD_QC) |
| 468 | |
| 469 | NFD_QC; N ; No |
| 470 | NFD_QC; Y ; Yes |
| 471 | |
| 472 | # NFKC_Quick_Check (NFKC_QC) |
| 473 | |
| 474 | NFKC_QC; M ; Maybe |
| 475 | NFKC_QC; N ; No |
| 476 | NFKC_QC; Y ; Yes |
| 477 | |
| 478 | # NFKD_Quick_Check (NFKD_QC) |
| 479 | |
| 480 | NFKD_QC; N ; No |
| 481 | NFKD_QC; Y ; Yes |
| 482 | |
| 483 | # Numeric_Type (nt) |
| 484 | |
| 485 | nt ; De ; Decimal |
| 486 | nt ; Di ; Digit |
| 487 | nt ; None ; None |
| 488 | nt ; Nu ; Numeric |
| 489 | |
| 490 | # Script (sc) |
| 491 | |
| 492 | sc ; Arab ; Arabic |
| 493 | sc ; Armn ; Armenian |
| 494 | sc ; Beng ; Bengali |
| 495 | sc ; Bopo ; Bopomofo |
| 496 | sc ; Brai ; Braille |
| 497 | sc ; Bugi ; Buginese |
| 498 | sc ; Buhd ; Buhid |
| 499 | sc ; Cans ; Canadian_Aboriginal |
| 500 | sc ; Cher ; Cherokee |
| 501 | sc ; Copt ; Coptic ; Qaac |
| 502 | sc ; Cprt ; Cypriot |
| 503 | sc ; Cyrl ; Cyrillic |
| 504 | sc ; Deva ; Devanagari |
| 505 | sc ; Dsrt ; Deseret |
| 506 | sc ; Ethi ; Ethiopic |
| 507 | sc ; Geor ; Georgian |
| 508 | sc ; Glag ; Glagolitic |
| 509 | sc ; Goth ; Gothic |
| 510 | sc ; Grek ; Greek |
| 511 | sc ; Gujr ; Gujarati |
| 512 | sc ; Guru ; Gurmukhi |
| 513 | sc ; Hang ; Hangul |
| 514 | sc ; Hani ; Han |
| 515 | sc ; Hano ; Hanunoo |
| 516 | sc ; Hebr ; Hebrew |
| 517 | sc ; Hira ; Hiragana |
| 518 | sc ; Hrkt ; Katakana_Or_Hiragana |
| 519 | sc ; Ital ; Old_Italic |
| 520 | sc ; Kana ; Katakana |
| 521 | sc ; Khar ; Kharoshthi |
| 522 | sc ; Khmr ; Khmer |
| 523 | sc ; Knda ; Kannada |
| 524 | sc ; Laoo ; Lao |
| 525 | sc ; Latn ; Latin |
| 526 | sc ; Limb ; Limbu |
| 527 | sc ; Linb ; Linear_B |
| 528 | sc ; Mlym ; Malayalam |
| 529 | sc ; Mong ; Mongolian |
| 530 | sc ; Mymr ; Myanmar |
| 531 | sc ; Ogam ; Ogham |
| 532 | sc ; Orya ; Oriya |
| 533 | sc ; Osma ; Osmanya |
| 534 | sc ; Qaai ; Inherited |
| 535 | sc ; Runr ; Runic |
| 536 | sc ; Shaw ; Shavian |
| 537 | sc ; Sinh ; Sinhala |
| 538 | sc ; Sylo ; Syloti_Nagri |
| 539 | sc ; Syrc ; Syriac |
| 540 | sc ; Tagb ; Tagbanwa |
| 541 | sc ; Tale ; Tai_Le |
| 542 | sc ; Talu ; New_Tai_Lue |
| 543 | sc ; Taml ; Tamil |
| 544 | sc ; Telu ; Telugu |
| 545 | sc ; Tfng ; Tifinagh |
| 546 | sc ; Tglg ; Tagalog |
| 547 | sc ; Thaa ; Thaana |
| 548 | sc ; Thai ; Thai |
| 549 | sc ; Tibt ; Tibetan |
| 550 | sc ; Ugar ; Ugaritic |
| 551 | sc ; Xpeo ; Old_Persian |
| 552 | sc ; Yiii ; Yi |
| 553 | sc ; Zyyy ; Common |
| 554 | |
| 555 | # Sentence_Break (SB) |
| 556 | |
| 557 | SB ; AT ; ATerm |
| 558 | SB ; CL ; Close |
| 559 | SB ; FO ; Format |
| 560 | SB ; LE ; OLetter |
| 561 | SB ; LO ; Lower |
| 562 | SB ; NU ; Numeric |
| 563 | SB ; SE ; Sep |
| 564 | SB ; SP ; Sp |
| 565 | SB ; ST ; STerm |
| 566 | SB ; UP ; Upper |
| 567 | SB ; XX ; Other |
| 568 | |
| 569 | # Word_Break (WB) |
| 570 | |
| 571 | WB ; EX ; ExtendNumLet |
| 572 | WB ; FO ; Format |
| 573 | WB ; KA ; Katakana |
| 574 | WB ; LE ; ALetter |
| 575 | WB ; ML ; MidLetter |
| 576 | WB ; MN ; MidNum |
| 577 | WB ; NU ; Numeric |
| 578 | WB ; XX ; Other |