Commit | Line | Data |
---|---|---|
920dae64 AT |
1 | # PropertyValueAliases-4.1.0.txt |
2 | # Date: 2005-03-28, 17:21:48 GMT [MD] | |
3 | # | |
4 | # Unicode Character Database | |
5 | # Copyright (c) 1991-2005 Unicode, Inc. | |
6 | # For terms of use, see http://www.unicode.org/terms_of_use.html | |
7 | # For documentation, see UCD.html | |
8 | # | |
9 | # This file contains aliases for property values used in the UCD. | |
10 | # These names can be used for XML formats of UCD data, for regular-expression | |
11 | # property tests, and other programmatic textual descriptions of Unicode data. | |
12 | # For information on which properties are normative, see UCD.html. | |
13 | # | |
14 | # The names may be translated in appropriate environments, and additional | |
15 | # aliases may be useful. | |
16 | # | |
17 | # FORMAT | |
18 | # | |
19 | # Each line describes a property value name. | |
20 | # This consists of three or more fields, separated by semicolons. | |
21 | # | |
22 | # First Field: The first field describes the property for which that | |
23 | # property value name is used. | |
24 | # | |
25 | # Second Field: The second field is an abbreviated name. | |
26 | # If there is no abbreviated name available, the field is marked with "n/a". | |
27 | # | |
28 | # Third Field: The third field is a long name. | |
29 | # | |
30 | # In the case of ccc, there are 4 fields. The second field is numeric, third | |
31 | # is abbreviated, and fourth is long. | |
32 | # | |
33 | # The above are the preferred aliases. Other aliases may be listed in additional fields. | |
34 | # | |
35 | # Loose matching should be applied to all property names and property values, with | |
36 | # the exception of String Property values. With loose matching of property names and | |
37 | # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property | |
38 | # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1". | |
39 | # | |
40 | # NOTE: Property value names are NOT unique across properties. For example: | |
41 | # | |
42 | # AL means Arabic Letter for the Bidi_Class property, and | |
43 | # AL means Above_Left for the Canonical_Combining_Class property, and | |
44 | # AL means Alphabetic for the Line_Break property. | |
45 | # | |
46 | # In addition, some property names may be the same as some property value names. | |
47 | # For example: | |
48 | # | |
49 | # sc means the Script property, and | |
50 | # Sc means the General_Category property value Currency_Symbol (Sc) | |
51 | # | |
52 | # The combination of property value and property name is, however, unique. | |
53 | # | |
54 | # For more information, see UTS #18: Unicode Regular Expressions | |
55 | # ================================================ | |
56 | ||
57 | ||
58 | # Age (age) | |
59 | ||
60 | age; n/a ; 1.1 | |
61 | age; n/a ; 2.0 | |
62 | age; n/a ; 2.1 | |
63 | age; n/a ; 3.0 | |
64 | age; n/a ; 3.1 | |
65 | age; n/a ; 3.2 | |
66 | age; n/a ; 4.0 | |
67 | age; n/a ; 4.1 | |
68 | age; n/a ; unassigned | |
69 | ||
70 | # Bidi_Class (bc) | |
71 | ||
72 | bc ; AL ; Arabic_Letter | |
73 | bc ; AN ; Arabic_Number | |
74 | bc ; B ; Paragraph_Separator | |
75 | bc ; BN ; Boundary_Neutral | |
76 | bc ; CS ; Common_Separator | |
77 | bc ; EN ; European_Number | |
78 | bc ; ES ; European_Separator | |
79 | bc ; ET ; European_Terminator | |
80 | bc ; L ; Left_To_Right | |
81 | bc ; LRE ; Left_To_Right_Embedding | |
82 | bc ; LRO ; Left_To_Right_Override | |
83 | bc ; NSM ; Nonspacing_Mark | |
84 | bc ; ON ; Other_Neutral | |
85 | bc ; PDF ; Pop_Directional_Format | |
86 | bc ; R ; Right_To_Left | |
87 | bc ; RLE ; Right_To_Left_Embedding | |
88 | bc ; RLO ; Right_To_Left_Override | |
89 | bc ; S ; Segment_Separator | |
90 | bc ; WS ; White_Space | |
91 | ||
92 | # Block (blk) | |
93 | ||
94 | blk; n/a ; Aegean_Numbers | |
95 | blk; n/a ; Alphabetic_Presentation_Forms | |
96 | blk; n/a ; Ancient_Greek_Musical_Notation | |
97 | blk; n/a ; Ancient_Greek_Numbers | |
98 | blk; n/a ; Arabic | |
99 | blk; n/a ; Arabic_Presentation_Forms-A | |
100 | blk; n/a ; Arabic_Presentation_Forms-B | |
101 | blk; n/a ; Arabic_Supplement | |
102 | blk; n/a ; Armenian | |
103 | blk; n/a ; Arrows | |
104 | blk; n/a ; Basic_Latin | |
105 | blk; n/a ; Bengali | |
106 | blk; n/a ; Block_Elements | |
107 | blk; n/a ; Bopomofo | |
108 | blk; n/a ; Bopomofo_Extended | |
109 | blk; n/a ; Box_Drawing | |
110 | blk; n/a ; Braille_Patterns | |
111 | blk; n/a ; Buginese | |
112 | blk; n/a ; Buhid | |
113 | blk; n/a ; Byzantine_Musical_Symbols | |
114 | blk; n/a ; Cherokee | |
115 | blk; n/a ; CJK_Compatibility | |
116 | blk; n/a ; CJK_Compatibility_Forms | |
117 | blk; n/a ; CJK_Compatibility_Ideographs | |
118 | blk; n/a ; CJK_Compatibility_Ideographs_Supplement | |
119 | blk; n/a ; CJK_Radicals_Supplement | |
120 | blk; n/a ; CJK_Strokes | |
121 | blk; n/a ; CJK_Symbols_and_Punctuation | |
122 | blk; n/a ; CJK_Unified_Ideographs | |
123 | blk; n/a ; CJK_Unified_Ideographs_Extension_A | |
124 | blk; n/a ; CJK_Unified_Ideographs_Extension_B | |
125 | blk; n/a ; Combining_Diacritical_Marks | |
126 | blk; n/a ; Combining_Diacritical_Marks_for_Symbols | |
127 | blk; n/a ; Combining_Diacritical_Marks_Supplement | |
128 | blk; n/a ; Combining_Half_Marks | |
129 | blk; n/a ; Control_Pictures | |
130 | blk; n/a ; Coptic | |
131 | blk; n/a ; Currency_Symbols | |
132 | blk; n/a ; Cypriot_Syllabary | |
133 | blk; n/a ; Cyrillic | |
134 | blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary | |
135 | blk; n/a ; Deseret | |
136 | blk; n/a ; Devanagari | |
137 | blk; n/a ; Dingbats | |
138 | blk; n/a ; Enclosed_Alphanumerics | |
139 | blk; n/a ; Enclosed_CJK_Letters_and_Months | |
140 | blk; n/a ; Ethiopic | |
141 | blk; n/a ; Ethiopic_Extended | |
142 | blk; n/a ; Ethiopic_Supplement | |
143 | blk; n/a ; General_Punctuation | |
144 | blk; n/a ; Geometric_Shapes | |
145 | blk; n/a ; Georgian | |
146 | blk; n/a ; Georgian_Supplement | |
147 | blk; n/a ; Glagolitic | |
148 | blk; n/a ; Gothic | |
149 | blk; n/a ; Greek_and_Coptic | |
150 | blk; n/a ; Greek_Extended | |
151 | blk; n/a ; Gujarati | |
152 | blk; n/a ; Gurmukhi | |
153 | blk; n/a ; Halfwidth_and_Fullwidth_Forms | |
154 | blk; n/a ; Hangul_Compatibility_Jamo | |
155 | blk; n/a ; Hangul_Jamo | |
156 | blk; n/a ; Hangul_Syllables | |
157 | blk; n/a ; Hanunoo | |
158 | blk; n/a ; Hebrew | |
159 | blk; n/a ; High_Private_Use_Surrogates | |
160 | blk; n/a ; High_Surrogates | |
161 | blk; n/a ; Hiragana | |
162 | blk; n/a ; Ideographic_Description_Characters | |
163 | blk; n/a ; IPA_Extensions | |
164 | blk; n/a ; Kanbun | |
165 | blk; n/a ; Kangxi_Radicals | |
166 | blk; n/a ; Kannada | |
167 | blk; n/a ; Katakana | |
168 | blk; n/a ; Katakana_Phonetic_Extensions | |
169 | blk; n/a ; Kharoshthi | |
170 | blk; n/a ; Khmer | |
171 | blk; n/a ; Khmer_Symbols | |
172 | blk; n/a ; Lao | |
173 | blk; n/a ; Latin-1_Supplement | |
174 | blk; n/a ; Latin_Extended-A | |
175 | blk; n/a ; Latin_Extended-B | |
176 | blk; n/a ; Latin_Extended_Additional | |
177 | blk; n/a ; Letterlike_Symbols | |
178 | blk; n/a ; Limbu | |
179 | blk; n/a ; Linear_B_Ideograms | |
180 | blk; n/a ; Linear_B_Syllabary | |
181 | blk; n/a ; Low_Surrogates | |
182 | blk; n/a ; Malayalam | |
183 | blk; n/a ; Mathematical_Alphanumeric_Symbols | |
184 | blk; n/a ; Mathematical_Operators | |
185 | blk; n/a ; Miscellaneous_Mathematical_Symbols-A | |
186 | blk; n/a ; Miscellaneous_Mathematical_Symbols-B | |
187 | blk; n/a ; Miscellaneous_Symbols | |
188 | blk; n/a ; Miscellaneous_Symbols_and_Arrows | |
189 | blk; n/a ; Miscellaneous_Technical | |
190 | blk; n/a ; Modifier_Tone_Letters | |
191 | blk; n/a ; Mongolian | |
192 | blk; n/a ; Musical_Symbols | |
193 | blk; n/a ; Myanmar | |
194 | blk; n/a ; New_Tai_Lue | |
195 | blk; n/a ; No_Block | |
196 | blk; n/a ; Number_Forms | |
197 | blk; n/a ; Ogham | |
198 | blk; n/a ; Old_Italic | |
199 | blk; n/a ; Old_Persian | |
200 | blk; n/a ; Optical_Character_Recognition | |
201 | blk; n/a ; Oriya | |
202 | blk; n/a ; Osmanya | |
203 | blk; n/a ; Phonetic_Extensions | |
204 | blk; n/a ; Phonetic_Extensions_Supplement | |
205 | blk; n/a ; Private_Use_Area | |
206 | blk; n/a ; Runic | |
207 | blk; n/a ; Shavian | |
208 | blk; n/a ; Sinhala | |
209 | blk; n/a ; Small_Form_Variants | |
210 | blk; n/a ; Spacing_Modifier_Letters | |
211 | blk; n/a ; Specials | |
212 | blk; n/a ; Superscripts_and_Subscripts | |
213 | blk; n/a ; Supplemental_Arrows-A | |
214 | blk; n/a ; Supplemental_Arrows-B | |
215 | blk; n/a ; Supplemental_Mathematical_Operators | |
216 | blk; n/a ; Supplemental_Punctuation | |
217 | blk; n/a ; Supplementary_Private_Use_Area-A | |
218 | blk; n/a ; Supplementary_Private_Use_Area-B | |
219 | blk; n/a ; Syloti_Nagri | |
220 | blk; n/a ; Syriac | |
221 | blk; n/a ; Tagalog | |
222 | blk; n/a ; Tagbanwa | |
223 | blk; n/a ; Tags | |
224 | blk; n/a ; Tai_Le | |
225 | blk; n/a ; Tai_Xuan_Jing_Symbols | |
226 | blk; n/a ; Tamil | |
227 | blk; n/a ; Telugu | |
228 | blk; n/a ; Thaana | |
229 | blk; n/a ; Thai | |
230 | blk; n/a ; Tibetan | |
231 | blk; n/a ; Tifinagh | |
232 | blk; n/a ; Ugaritic | |
233 | blk; n/a ; Unified_Canadian_Aboriginal_Syllabics | |
234 | blk; n/a ; Variation_Selectors | |
235 | blk; n/a ; Variation_Selectors_Supplement | |
236 | blk; n/a ; Vertical_Forms | |
237 | blk; n/a ; Yi_Radicals | |
238 | blk; n/a ; Yi_Syllables | |
239 | blk; n/a ; Yijing_Hexagram_Symbols | |
240 | ||
241 | # Canonical_Combining_Class (ccc) | |
242 | ||
243 | ccc; 0; NR ; Not_Reordered | |
244 | ccc; 1; OV ; Overlay | |
245 | ccc; 7; NK ; Nukta | |
246 | ccc; 8; KV ; Kana_Voicing | |
247 | ccc; 9; VR ; Virama | |
248 | ccc; 200; ATBL ; Attached_Below_Left | |
249 | ccc; 202; ATB ; Attached_Below | |
250 | ccc; 216; ATAR ; Attached_Above_Right | |
251 | ccc; 218; BL ; Below_Left | |
252 | ccc; 220; B ; Below | |
253 | ccc; 222; BR ; Below_Right | |
254 | ccc; 224; L ; Left | |
255 | ccc; 226; R ; Right | |
256 | ccc; 228; AL ; Above_Left | |
257 | ccc; 230; A ; Above | |
258 | ccc; 232; AR ; Above_Right | |
259 | ccc; 233; DB ; Double_Below | |
260 | ccc; 234; DA ; Double_Above | |
261 | ccc; 240; IS ; Iota_Subscript | |
262 | ||
263 | # Decomposition_Type (dt) | |
264 | ||
265 | dt ; can ; Canonical | |
266 | dt ; com ; Compat | |
267 | dt ; enc ; Circle | |
268 | dt ; fin ; Final | |
269 | dt ; font ; Font | |
270 | dt ; fra ; Fraction | |
271 | dt ; init ; Initial | |
272 | dt ; iso ; Isolated | |
273 | dt ; med ; Medial | |
274 | dt ; nar ; Narrow | |
275 | dt ; nb ; Nobreak | |
276 | dt ; none ; None | |
277 | dt ; sml ; Small | |
278 | dt ; sqr ; Square | |
279 | dt ; sub ; Sub | |
280 | dt ; sup ; Super | |
281 | dt ; vert ; Vertical | |
282 | dt ; wide ; Wide | |
283 | ||
284 | # East_Asian_Width (ea) | |
285 | ||
286 | ea ; A ; Ambiguous | |
287 | ea ; F ; Fullwidth | |
288 | ea ; H ; Halfwidth | |
289 | ea ; N ; Neutral | |
290 | ea ; Na ; Narrow | |
291 | ea ; W ; Wide | |
292 | ||
293 | # General_Category (gc) | |
294 | ||
295 | gc ; C ; Other # Cc | Cf | Cn | Co | Cs | |
296 | gc ; Cc ; Control ; cntrl | |
297 | gc ; Cf ; Format | |
298 | gc ; Cn ; Unassigned | |
299 | gc ; Co ; Private_Use | |
300 | gc ; Cs ; Surrogate | |
301 | gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu | |
302 | gc ; LC ; Cased_Letter # Ll | Lt | Lu | |
303 | gc ; Ll ; Lowercase_Letter | |
304 | gc ; Lm ; Modifier_Letter | |
305 | gc ; Lo ; Other_Letter | |
306 | gc ; Lt ; Titlecase_Letter | |
307 | gc ; Lu ; Uppercase_Letter | |
308 | gc ; M ; Mark # Mc | Me | Mn | |
309 | gc ; Mc ; Spacing_Mark | |
310 | gc ; Me ; Enclosing_Mark | |
311 | gc ; Mn ; Nonspacing_Mark | |
312 | gc ; N ; Number # Nd | Nl | No | |
313 | gc ; Nd ; Decimal_Number ; digit | |
314 | gc ; Nl ; Letter_Number | |
315 | gc ; No ; Other_Number | |
316 | gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps | |
317 | gc ; Pc ; Connector_Punctuation | |
318 | gc ; Pd ; Dash_Punctuation | |
319 | gc ; Pe ; Close_Punctuation | |
320 | gc ; Pf ; Final_Punctuation | |
321 | gc ; Pi ; Initial_Punctuation | |
322 | gc ; Po ; Other_Punctuation | |
323 | gc ; Ps ; Open_Punctuation | |
324 | gc ; S ; Symbol # Sc | Sk | Sm | So | |
325 | gc ; Sc ; Currency_Symbol | |
326 | gc ; Sk ; Modifier_Symbol | |
327 | gc ; Sm ; Math_Symbol | |
328 | gc ; So ; Other_Symbol | |
329 | gc ; Z ; Separator # Zl | Zp | Zs | |
330 | gc ; Zl ; Line_Separator | |
331 | gc ; Zp ; Paragraph_Separator | |
332 | gc ; Zs ; Space_Separator | |
333 | ||
334 | # Grapheme_Cluster_Break (GCB) | |
335 | ||
336 | GCB; CN ; Control | |
337 | GCB; CR ; CR | |
338 | GCB; EX ; Extend | |
339 | GCB; L ; L | |
340 | GCB; LF ; LF | |
341 | GCB; LV ; LV | |
342 | GCB; LVT ; LVT | |
343 | GCB; T ; T | |
344 | GCB; V ; V | |
345 | GCB; XX ; Other | |
346 | ||
347 | # Hangul_Syllable_Type (hst) | |
348 | ||
349 | hst; L ; Leading_Jamo | |
350 | hst; LV ; LV_Syllable | |
351 | hst; LVT ; LVT_Syllable | |
352 | hst; NA ; Not_Applicable | |
353 | hst; T ; Trailing_Jamo | |
354 | hst; V ; Vowel_Jamo | |
355 | ||
356 | # Joining_Group (jg) | |
357 | ||
358 | jg ; n/a ; Ain | |
359 | jg ; n/a ; Alaph | |
360 | jg ; n/a ; Alef | |
361 | jg ; n/a ; Beh | |
362 | jg ; n/a ; Beth | |
363 | jg ; n/a ; Dal | |
364 | jg ; n/a ; Dalath_Rish | |
365 | jg ; n/a ; E | |
366 | jg ; n/a ; Fe | |
367 | jg ; n/a ; Feh | |
368 | jg ; n/a ; Final_Semkath | |
369 | jg ; n/a ; Gaf | |
370 | jg ; n/a ; Gamal | |
371 | jg ; n/a ; Hah | |
372 | jg ; n/a ; Hamza_On_Heh_Goal | |
373 | jg ; n/a ; He | |
374 | jg ; n/a ; Heh | |
375 | jg ; n/a ; Heh_Goal | |
376 | jg ; n/a ; Heth | |
377 | jg ; n/a ; Kaf | |
378 | jg ; n/a ; Kaph | |
379 | jg ; n/a ; Khaph | |
380 | jg ; n/a ; Knotted_Heh | |
381 | jg ; n/a ; Lam | |
382 | jg ; n/a ; Lamadh | |
383 | jg ; n/a ; Meem | |
384 | jg ; n/a ; Mim | |
385 | jg ; n/a ; No_Joining_Group | |
386 | jg ; n/a ; Noon | |
387 | jg ; n/a ; Nun | |
388 | jg ; n/a ; Pe | |
389 | jg ; n/a ; Qaf | |
390 | jg ; n/a ; Qaph | |
391 | jg ; n/a ; Reh | |
392 | jg ; n/a ; Reversed_Pe | |
393 | jg ; n/a ; Sad | |
394 | jg ; n/a ; Sadhe | |
395 | jg ; n/a ; Seen | |
396 | jg ; n/a ; Semkath | |
397 | jg ; n/a ; Shin | |
398 | jg ; n/a ; Swash_Kaf | |
399 | jg ; n/a ; Syriac_Waw | |
400 | jg ; n/a ; Tah | |
401 | jg ; n/a ; Taw | |
402 | jg ; n/a ; Teh_Marbuta | |
403 | jg ; n/a ; Teth | |
404 | jg ; n/a ; Waw | |
405 | jg ; n/a ; Yeh | |
406 | jg ; n/a ; Yeh_Barree | |
407 | jg ; n/a ; Yeh_With_Tail | |
408 | jg ; n/a ; Yudh | |
409 | jg ; n/a ; Yudh_He | |
410 | jg ; n/a ; Zain | |
411 | jg ; n/a ; Zhain | |
412 | ||
413 | # Joining_Type (jt) | |
414 | ||
415 | jt ; C ; Join_Causing | |
416 | jt ; D ; Dual_Joining | |
417 | jt ; L ; Left_Joining | |
418 | jt ; R ; Right_Joining | |
419 | jt ; T ; Transparent | |
420 | jt ; U ; Non_Joining | |
421 | ||
422 | # Line_Break (lb) | |
423 | ||
424 | lb ; AI ; Ambiguous | |
425 | lb ; AL ; Alphabetic | |
426 | lb ; B2 ; Break_Both | |
427 | lb ; BA ; Break_After | |
428 | lb ; BB ; Break_Before | |
429 | lb ; BK ; Mandatory_Break | |
430 | lb ; CB ; Contingent_Break | |
431 | lb ; CL ; Close_Punctuation | |
432 | lb ; CM ; Combining_Mark | |
433 | lb ; CR ; Carriage_Return | |
434 | lb ; EX ; Exclamation | |
435 | lb ; GL ; Glue | |
436 | lb ; H2 ; H2 | |
437 | lb ; H3 ; H3 | |
438 | lb ; HY ; Hyphen | |
439 | lb ; ID ; Ideographic | |
440 | lb ; IN ; Inseparable ; Inseperable | |
441 | lb ; IS ; Infix_Numeric | |
442 | lb ; JL ; JL | |
443 | lb ; JT ; JT | |
444 | lb ; JV ; JV | |
445 | lb ; LF ; Line_Feed | |
446 | lb ; NL ; Next_Line | |
447 | lb ; NS ; Nonstarter | |
448 | lb ; NU ; Numeric | |
449 | lb ; OP ; Open_Punctuation | |
450 | lb ; PO ; Postfix_Numeric | |
451 | lb ; PR ; Prefix_Numeric | |
452 | lb ; QU ; Quotation | |
453 | lb ; SA ; Complex_Context | |
454 | lb ; SG ; Surrogate | |
455 | lb ; SP ; Space | |
456 | lb ; SY ; Break_Symbols | |
457 | lb ; WJ ; Word_Joiner | |
458 | lb ; XX ; Unknown | |
459 | lb ; ZW ; ZWSpace | |
460 | ||
461 | # NFC_Quick_Check (NFC_QC) | |
462 | ||
463 | NFC_QC; M ; Maybe | |
464 | NFC_QC; N ; No | |
465 | NFC_QC; Y ; Yes | |
466 | ||
467 | # NFD_Quick_Check (NFD_QC) | |
468 | ||
469 | NFD_QC; N ; No | |
470 | NFD_QC; Y ; Yes | |
471 | ||
472 | # NFKC_Quick_Check (NFKC_QC) | |
473 | ||
474 | NFKC_QC; M ; Maybe | |
475 | NFKC_QC; N ; No | |
476 | NFKC_QC; Y ; Yes | |
477 | ||
478 | # NFKD_Quick_Check (NFKD_QC) | |
479 | ||
480 | NFKD_QC; N ; No | |
481 | NFKD_QC; Y ; Yes | |
482 | ||
483 | # Numeric_Type (nt) | |
484 | ||
485 | nt ; De ; Decimal | |
486 | nt ; Di ; Digit | |
487 | nt ; None ; None | |
488 | nt ; Nu ; Numeric | |
489 | ||
490 | # Script (sc) | |
491 | ||
492 | sc ; Arab ; Arabic | |
493 | sc ; Armn ; Armenian | |
494 | sc ; Beng ; Bengali | |
495 | sc ; Bopo ; Bopomofo | |
496 | sc ; Brai ; Braille | |
497 | sc ; Bugi ; Buginese | |
498 | sc ; Buhd ; Buhid | |
499 | sc ; Cans ; Canadian_Aboriginal | |
500 | sc ; Cher ; Cherokee | |
501 | sc ; Copt ; Coptic ; Qaac | |
502 | sc ; Cprt ; Cypriot | |
503 | sc ; Cyrl ; Cyrillic | |
504 | sc ; Deva ; Devanagari | |
505 | sc ; Dsrt ; Deseret | |
506 | sc ; Ethi ; Ethiopic | |
507 | sc ; Geor ; Georgian | |
508 | sc ; Glag ; Glagolitic | |
509 | sc ; Goth ; Gothic | |
510 | sc ; Grek ; Greek | |
511 | sc ; Gujr ; Gujarati | |
512 | sc ; Guru ; Gurmukhi | |
513 | sc ; Hang ; Hangul | |
514 | sc ; Hani ; Han | |
515 | sc ; Hano ; Hanunoo | |
516 | sc ; Hebr ; Hebrew | |
517 | sc ; Hira ; Hiragana | |
518 | sc ; Hrkt ; Katakana_Or_Hiragana | |
519 | sc ; Ital ; Old_Italic | |
520 | sc ; Kana ; Katakana | |
521 | sc ; Khar ; Kharoshthi | |
522 | sc ; Khmr ; Khmer | |
523 | sc ; Knda ; Kannada | |
524 | sc ; Laoo ; Lao | |
525 | sc ; Latn ; Latin | |
526 | sc ; Limb ; Limbu | |
527 | sc ; Linb ; Linear_B | |
528 | sc ; Mlym ; Malayalam | |
529 | sc ; Mong ; Mongolian | |
530 | sc ; Mymr ; Myanmar | |
531 | sc ; Ogam ; Ogham | |
532 | sc ; Orya ; Oriya | |
533 | sc ; Osma ; Osmanya | |
534 | sc ; Qaai ; Inherited | |
535 | sc ; Runr ; Runic | |
536 | sc ; Shaw ; Shavian | |
537 | sc ; Sinh ; Sinhala | |
538 | sc ; Sylo ; Syloti_Nagri | |
539 | sc ; Syrc ; Syriac | |
540 | sc ; Tagb ; Tagbanwa | |
541 | sc ; Tale ; Tai_Le | |
542 | sc ; Talu ; New_Tai_Lue | |
543 | sc ; Taml ; Tamil | |
544 | sc ; Telu ; Telugu | |
545 | sc ; Tfng ; Tifinagh | |
546 | sc ; Tglg ; Tagalog | |
547 | sc ; Thaa ; Thaana | |
548 | sc ; Thai ; Thai | |
549 | sc ; Tibt ; Tibetan | |
550 | sc ; Ugar ; Ugaritic | |
551 | sc ; Xpeo ; Old_Persian | |
552 | sc ; Yiii ; Yi | |
553 | sc ; Zyyy ; Common | |
554 | ||
555 | # Sentence_Break (SB) | |
556 | ||
557 | SB ; AT ; ATerm | |
558 | SB ; CL ; Close | |
559 | SB ; FO ; Format | |
560 | SB ; LE ; OLetter | |
561 | SB ; LO ; Lower | |
562 | SB ; NU ; Numeric | |
563 | SB ; SE ; Sep | |
564 | SB ; SP ; Sp | |
565 | SB ; ST ; STerm | |
566 | SB ; UP ; Upper | |
567 | SB ; XX ; Other | |
568 | ||
569 | # Word_Break (WB) | |
570 | ||
571 | WB ; EX ; ExtendNumLet | |
572 | WB ; FO ; Format | |
573 | WB ; KA ; Katakana | |
574 | WB ; LE ; ALetter | |
575 | WB ; ML ; MidLetter | |
576 | WB ; MN ; MidNum | |
577 | WB ; NU ; Numeric | |
578 | WB ; XX ; Other |