git.subgeniuskitty.com - OpenSPARC-T2-SAM/.git/blame - sam-t2/devtools/amd64/lib/perl5/5.8.8/unicore/PropValueAliases.txt

Commit	Line	Data
920dae64 AT	1	# PropertyValueAliases-4.1.0.txt
	2	# Date: 2005-03-28, 17:21:48 GMT [MD]
	3	#
	4	# Unicode Character Database
	5	# Copyright (c) 1991-2005 Unicode, Inc.
	6	# For terms of use, see http://www.unicode.org/terms_of_use.html
	7	# For documentation, see UCD.html
	8	#
	9	# This file contains aliases for property values used in the UCD.
	10	# These names can be used for XML formats of UCD data, for regular-expression
	11	# property tests, and other programmatic textual descriptions of Unicode data.
	12	# For information on which properties are normative, see UCD.html.
	13	#
	14	# The names may be translated in appropriate environments, and additional
	15	# aliases may be useful.
	16	#
	17	# FORMAT
	18	#
	19	# Each line describes a property value name.
	20	# This consists of three or more fields, separated by semicolons.
	21	#
	22	# First Field: The first field describes the property for which that
	23	# property value name is used.
	24	#
	25	# Second Field: The second field is an abbreviated name.
	26	# If there is no abbreviated name available, the field is marked with "n/a".
	27	#
	28	# Third Field: The third field is a long name.
	29	#
	30	# In the case of ccc, there are 4 fields. The second field is numeric, third
	31	# is abbreviated, and fourth is long.
	32	#
	33	# The above are the preferred aliases. Other aliases may be listed in additional fields.
	34	#
	35	# Loose matching should be applied to all property names and property values, with
	36	# the exception of String Property values. With loose matching of property names and
	37	# values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
	38	# values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
	39	#
	40	# NOTE: Property value names are NOT unique across properties. For example:
	41	#
	42	# AL means Arabic Letter for the Bidi_Class property, and
	43	# AL means Above_Left for the Canonical_Combining_Class property, and
	44	# AL means Alphabetic for the Line_Break property.
	45	#
	46	# In addition, some property names may be the same as some property value names.
	47	# For example:
	48	#
	49	# sc means the Script property, and
	50	# Sc means the General_Category property value Currency_Symbol (Sc)
	51	#
	52	# The combination of property value and property name is, however, unique.
	53	#
	54	# For more information, see UTS #18: Regular Expression Guidelines
	55	# ================================================
	56
	57
	58	# Age (age)
	59
	60	age; n/a ; 1.1
	61	age; n/a ; 2.0
	62	age; n/a ; 2.1
	63	age; n/a ; 3.0
	64	age; n/a ; 3.1
65	age; n/a ; 3.2
66	age; n/a ; 4.0
67	age; n/a ; 4.1
68	age; n/a ; unassigned
69
70	# Bidi_Class (bc)
71
72	bc ; AL ; Arabic_Letter
73	bc ; AN ; Arabic_Number
74	bc ; B ; Paragraph_Separator
75	bc ; BN ; Boundary_Neutral
76	bc ; CS ; Common_Separator
77	bc ; EN ; European_Number
78	bc ; ES ; European_Separator
79	bc ; ET ; European_Terminator
80	bc ; L ; Left_To_Right
81	bc ; LRE ; Left_To_Right_Embedding
82	bc ; LRO ; Left_To_Right_Override
83	bc ; NSM ; Nonspacing_Mark
84	bc ; ON ; Other_Neutral
85	bc ; PDF ; Pop_Directional_Format
86	bc ; R ; Right_To_Left
87	bc ; RLE ; Right_To_Left_Embedding
88	bc ; RLO ; Right_To_Left_Override
89	bc ; S ; Segment_Separator
90	bc ; WS ; White_Space
91
92	# Block (blk)
93
94	blk; n/a ; Aegean_Numbers
95	blk; n/a ; Alphabetic_Presentation_Forms
96	blk; n/a ; Ancient_Greek_Musical_Notation
97	blk; n/a ; Ancient_Greek_Numbers
98	blk; n/a ; Arabic
99	blk; n/a ; Arabic_Presentation_Forms-A
100	blk; n/a ; Arabic_Presentation_Forms-B
101	blk; n/a ; Arabic_Supplement
102	blk; n/a ; Armenian
103	blk; n/a ; Arrows
104	blk; n/a ; Basic_Latin
105	blk; n/a ; Bengali
106	blk; n/a ; Block_Elements
107	blk; n/a ; Bopomofo
108	blk; n/a ; Bopomofo_Extended
109	blk; n/a ; Box_Drawing
110	blk; n/a ; Braille_Patterns
111	blk; n/a ; Buginese
112	blk; n/a ; Buhid
113	blk; n/a ; Byzantine_Musical_Symbols
114	blk; n/a ; Cherokee
115	blk; n/a ; CJK_Compatibility
116	blk; n/a ; CJK_Compatibility_Forms
117	blk; n/a ; CJK_Compatibility_Ideographs
118	blk; n/a ; CJK_Compatibility_Ideographs_Supplement
119	blk; n/a ; CJK_Radicals_Supplement
120	blk; n/a ; CJK_Strokes
121	blk; n/a ; CJK_Symbols_and_Punctuation
122	blk; n/a ; CJK_Unified_Ideographs
123	blk; n/a ; CJK_Unified_Ideographs_Extension_A
124	blk; n/a ; CJK_Unified_Ideographs_Extension_B
125	blk; n/a ; Combining_Diacritical_Marks
126	blk; n/a ; Combining_Diacritical_Marks_for_Symbols
127	blk; n/a ; Combining_Diacritical_Marks_Supplement
128	blk; n/a ; Combining_Half_Marks
129	blk; n/a ; Control_Pictures
130	blk; n/a ; Coptic
131	blk; n/a ; Currency_Symbols
132	blk; n/a ; Cypriot_Syllabary
133	blk; n/a ; Cyrillic
134	blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
135	blk; n/a ; Deseret
136	blk; n/a ; Devanagari
137	blk; n/a ; Dingbats
138	blk; n/a ; Enclosed_Alphanumerics
139	blk; n/a ; Enclosed_CJK_Letters_and_Months
140	blk; n/a ; Ethiopic
141	blk; n/a ; Ethiopic_Extended
142	blk; n/a ; Ethiopic_Supplement
143	blk; n/a ; General_Punctuation
144	blk; n/a ; Geometric_Shapes
145	blk; n/a ; Georgian
146	blk; n/a ; Georgian_Supplement
147	blk; n/a ; Glagolitic
148	blk; n/a ; Gothic
149	blk; n/a ; Greek_and_Coptic
150	blk; n/a ; Greek_Extended
151	blk; n/a ; Gujarati
152	blk; n/a ; Gurmukhi
153	blk; n/a ; Halfwidth_and_Fullwidth_Forms
154	blk; n/a ; Hangul_Compatibility_Jamo
155	blk; n/a ; Hangul_Jamo
156	blk; n/a ; Hangul_Syllables
157	blk; n/a ; Hanunoo
158	blk; n/a ; Hebrew
159	blk; n/a ; High_Private_Use_Surrogates
160	blk; n/a ; High_Surrogates
161	blk; n/a ; Hiragana
162	blk; n/a ; Ideographic_Description_Characters
163	blk; n/a ; IPA_Extensions
164	blk; n/a ; Kanbun
165	blk; n/a ; Kangxi_Radicals
166	blk; n/a ; Kannada
167	blk; n/a ; Katakana
168	blk; n/a ; Katakana_Phonetic_Extensions
169	blk; n/a ; Kharoshthi
170	blk; n/a ; Khmer
171	blk; n/a ; Khmer_Symbols
172	blk; n/a ; Lao
173	blk; n/a ; Latin-1_Supplement
174	blk; n/a ; Latin_Extended-A
175	blk; n/a ; Latin_Extended-B
176	blk; n/a ; Latin_Extended_Additional
177	blk; n/a ; Letterlike_Symbols
178	blk; n/a ; Limbu
179	blk; n/a ; Linear_B_Ideograms
180	blk; n/a ; Linear_B_Syllabary
181	blk; n/a ; Low_Surrogates
182	blk; n/a ; Malayalam
183	blk; n/a ; Mathematical_Alphanumeric_Symbols
184	blk; n/a ; Mathematical_Operators
185	blk; n/a ; Miscellaneous_Mathematical_Symbols-A
186	blk; n/a ; Miscellaneous_Mathematical_Symbols-B
187	blk; n/a ; Miscellaneous_Symbols
188	blk; n/a ; Miscellaneous_Symbols_and_Arrows
189	blk; n/a ; Miscellaneous_Technical
190	blk; n/a ; Modifier_Tone_Letters
191	blk; n/a ; Mongolian
192	blk; n/a ; Musical_Symbols
193	blk; n/a ; Myanmar
194	blk; n/a ; New_Tai_Lue
195	blk; n/a ; No_Block
196	blk; n/a ; Number_Forms
197	blk; n/a ; Ogham
198	blk; n/a ; Old_Italic
199	blk; n/a ; Old_Persian
200	blk; n/a ; Optical_Character_Recognition
201	blk; n/a ; Oriya
202	blk; n/a ; Osmanya
203	blk; n/a ; Phonetic_Extensions
204	blk; n/a ; Phonetic_Extensions_Supplement
205	blk; n/a ; Private_Use_Area
206	blk; n/a ; Runic
207	blk; n/a ; Shavian
208	blk; n/a ; Sinhala
209	blk; n/a ; Small_Form_Variants
210	blk; n/a ; Spacing_Modifier_Letters
211	blk; n/a ; Specials
212	blk; n/a ; Superscripts_and_Subscripts
213	blk; n/a ; Supplemental_Arrows-A
214	blk; n/a ; Supplemental_Arrows-B
215	blk; n/a ; Supplemental_Mathematical_Operators
216	blk; n/a ; Supplemental_Punctuation
217	blk; n/a ; Supplementary_Private_Use_Area-A
218	blk; n/a ; Supplementary_Private_Use_Area-B
219	blk; n/a ; Syloti_Nagri
220	blk; n/a ; Syriac
221	blk; n/a ; Tagalog
222	blk; n/a ; Tagbanwa
223	blk; n/a ; Tags
224	blk; n/a ; Tai_Le
225	blk; n/a ; Tai_Xuan_Jing_Symbols
226	blk; n/a ; Tamil
227	blk; n/a ; Telugu
228	blk; n/a ; Thaana
229	blk; n/a ; Thai
230	blk; n/a ; Tibetan
231	blk; n/a ; Tifinagh
232	blk; n/a ; Ugaritic
233	blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
234	blk; n/a ; Variation_Selectors
235	blk; n/a ; Variation_Selectors_Supplement
236	blk; n/a ; Vertical_Forms
237	blk; n/a ; Yi_Radicals
238	blk; n/a ; Yi_Syllables
239	blk; n/a ; Yijing_Hexagram_Symbols
240
241	# Canonical_Combining_Class (ccc)
242
243	ccc; 0; NR ; Not_Reordered
244	ccc; 1; OV ; Overlay
245	ccc; 7; NK ; Nukta
246	ccc; 8; KV ; Kana_Voicing
247	ccc; 9; VR ; Virama
248	ccc; 200; ATBL ; Attached_Below_Left
249	ccc; 202; ATB ; Attached_Below
250	ccc; 216; ATAR ; Attached_Above_Right
251	ccc; 218; BL ; Below_Left
252	ccc; 220; B ; Below
253	ccc; 222; BR ; Below_Right
254	ccc; 224; L ; Left
255	ccc; 226; R ; Right
256	ccc; 228; AL ; Above_Left
257	ccc; 230; A ; Above
258	ccc; 232; AR ; Above_Right
259	ccc; 233; DB ; Double_Below
260	ccc; 234; DA ; Double_Above
261	ccc; 240; IS ; Iota_Subscript
262
263	# Decomposition_Type (dt)
264
265	dt ; can ; Canonical
266	dt ; com ; Compat
267	dt ; enc ; Circle
268	dt ; fin ; Final
269	dt ; font ; Font
270	dt ; fra ; Fraction
271	dt ; init ; Initial
272	dt ; iso ; Isolated
273	dt ; med ; Medial
274	dt ; nar ; Narrow
275	dt ; nb ; Nobreak
276	dt ; none ; None
277	dt ; sml ; Small
278	dt ; sqr ; Square
279	dt ; sub ; Sub
280	dt ; sup ; Super
281	dt ; vert ; Vertical
282	dt ; wide ; Wide
283
284	# East_Asian_Width (ea)
285
286	ea ; A ; Ambiguous
287	ea ; F ; Fullwidth
288	ea ; H ; Halfwidth
289	ea ; N ; Neutral
290	ea ; Na ; Narrow
291	ea ; W ; Wide
292
293	# General_Category (gc)
294
295	gc ; C ; Other # Cc | Cf | Cn | Co | Cs
296	gc ; Cc ; Control ; cntrl
297	gc ; Cf ; Format
298	gc ; Cn ; Unassigned
299	gc ; Co ; Private_Use
300	gc ; Cs ; Surrogate
301	gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
302	gc ; LC ; Cased_Letter # Ll | Lt | Lu
303	gc ; Ll ; Lowercase_Letter
304	gc ; Lm ; Modifier_Letter
305	gc ; Lo ; Other_Letter
306	gc ; Lt ; Titlecase_Letter
307	gc ; Lu ; Uppercase_Letter
308	gc ; M ; Mark # Mc | Me | Mn
309	gc ; Mc ; Spacing_Mark
310	gc ; Me ; Enclosing_Mark
311	gc ; Mn ; Nonspacing_Mark
312	gc ; N ; Number # Nd | Nl | No
313	gc ; Nd ; Decimal_Number ; digit
314	gc ; Nl ; Letter_Number
315	gc ; No ; Other_Number
316	gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
317	gc ; Pc ; Connector_Punctuation
318	gc ; Pd ; Dash_Punctuation
319	gc ; Pe ; Close_Punctuation
320	gc ; Pf ; Final_Punctuation
321	gc ; Pi ; Initial_Punctuation
322	gc ; Po ; Other_Punctuation
323	gc ; Ps ; Open_Punctuation
324	gc ; S ; Symbol # Sc | Sk | Sm | So
325	gc ; Sc ; Currency_Symbol
326	gc ; Sk ; Modifier_Symbol
327	gc ; Sm ; Math_Symbol
328	gc ; So ; Other_Symbol
329	gc ; Z ; Separator # Zl | Zp | Zs
330	gc ; Zl ; Line_Separator
331	gc ; Zp ; Paragraph_Separator
332	gc ; Zs ; Space_Separator
333
334	# Grapheme_Cluster_Break (GCB)
335
336	GCB; CN ; Control
337	GCB; CR ; CR
338	GCB; EX ; Extend
339	GCB; L ; L
340	GCB; LF ; LF
341	GCB; LV ; LV
342	GCB; LVT ; LVT
343	GCB; T ; T
344	GCB; V ; V
345	GCB; XX ; Other
346
347	# Hangul_Syllable_Type (hst)
348
349	hst; L ; Leading_Jamo
350	hst; LV ; LV_Syllable
351	hst; LVT ; LVT_Syllable
352	hst; NA ; Not_Applicable
353	hst; T ; Trailing_Jamo
354	hst; V ; Vowel_Jamo
355
356	# Joining_Group (jg)
357
358	jg ; n/a ; Ain
359	jg ; n/a ; Alaph
360	jg ; n/a ; Alef
361	jg ; n/a ; Beh
362	jg ; n/a ; Beth
363	jg ; n/a ; Dal
364	jg ; n/a ; Dalath_Rish
365	jg ; n/a ; E
366	jg ; n/a ; Fe
367	jg ; n/a ; Feh
368	jg ; n/a ; Final_Semkath
369	jg ; n/a ; Gaf
370	jg ; n/a ; Gamal
371	jg ; n/a ; Hah
372	jg ; n/a ; Hamza_On_Heh_Goal
373	jg ; n/a ; He
374	jg ; n/a ; Heh
375	jg ; n/a ; Heh_Goal
376	jg ; n/a ; Heth
377	jg ; n/a ; Kaf
378	jg ; n/a ; Kaph
379	jg ; n/a ; Khaph
380	jg ; n/a ; Knotted_Heh
381	jg ; n/a ; Lam
382	jg ; n/a ; Lamadh
383	jg ; n/a ; Meem
384	jg ; n/a ; Mim
385	jg ; n/a ; No_Joining_Group
386	jg ; n/a ; Noon
387	jg ; n/a ; Nun
388	jg ; n/a ; Pe
389	jg ; n/a ; Qaf
390	jg ; n/a ; Qaph
391	jg ; n/a ; Reh
392	jg ; n/a ; Reversed_Pe
393	jg ; n/a ; Sad
394	jg ; n/a ; Sadhe
395	jg ; n/a ; Seen
396	jg ; n/a ; Semkath
397	jg ; n/a ; Shin
398	jg ; n/a ; Swash_Kaf
399	jg ; n/a ; Syriac_Waw
400	jg ; n/a ; Tah
401	jg ; n/a ; Taw
402	jg ; n/a ; Teh_Marbuta
403	jg ; n/a ; Teth
404	jg ; n/a ; Waw
405	jg ; n/a ; Yeh
406	jg ; n/a ; Yeh_Barree
407	jg ; n/a ; Yeh_With_Tail
408	jg ; n/a ; Yudh
409	jg ; n/a ; Yudh_He
410	jg ; n/a ; Zain
411	jg ; n/a ; Zhain
412
413	# Joining_Type (jt)
414
415	jt ; C ; Join_Causing
416	jt ; D ; Dual_Joining
417	jt ; L ; Left_Joining
418	jt ; R ; Right_Joining
419	jt ; T ; Transparent
420	jt ; U ; Non_Joining
421
422	# Line_Break (lb)
423
424	lb ; AI ; Ambiguous
425	lb ; AL ; Alphabetic
426	lb ; B2 ; Break_Both
427	lb ; BA ; Break_After
428	lb ; BB ; Break_Before
429	lb ; BK ; Mandatory_Break
430	lb ; CB ; Contingent_Break
431	lb ; CL ; Close_Punctuation
432	lb ; CM ; Combining_Mark
433	lb ; CR ; Carriage_Return
434	lb ; EX ; Exclamation
435	lb ; GL ; Glue
436	lb ; H2 ; H2
437	lb ; H3 ; H3
438	lb ; HY ; Hyphen
439	lb ; ID ; Ideographic
440	lb ; IN ; Inseparable ; Inseperable
441	lb ; IS ; Infix_Numeric
442	lb ; JL ; JL
443	lb ; JT ; JT
444	lb ; JV ; JV
445	lb ; LF ; Line_Feed
446	lb ; NL ; Next_Line
447	lb ; NS ; Nonstarter
448	lb ; NU ; Numeric
449	lb ; OP ; Open_Punctuation
450	lb ; PO ; Postfix_Numeric
451	lb ; PR ; Prefix_Numeric
452	lb ; QU ; Quotation
453	lb ; SA ; Complex_Context
454	lb ; SG ; Surrogate
455	lb ; SP ; Space
456	lb ; SY ; Break_Symbols
457	lb ; WJ ; Word_Joiner
458	lb ; XX ; Unknown
459	lb ; ZW ; ZWSpace
460
461	# NFC_Quick_Check (NFC_QC)
462
463	NFC_QC; M ; Maybe
464	NFC_QC; N ; No
465	NFC_QC; Y ; Yes
466
467	# NFD_Quick_Check (NFD_QC)
468
469	NFD_QC; N ; No
470	NFD_QC; Y ; Yes
471
472	# NFKC_Quick_Check (NFKC_QC)
473
474	NFKC_QC; M ; Maybe
475	NFKC_QC; N ; No
476	NFKC_QC; Y ; Yes
477
478	# NFKD_Quick_Check (NFKD_QC)
479
480	NFKD_QC; N ; No
481	NFKD_QC; Y ; Yes
482
483	# Numeric_Type (nt)
484
485	nt ; De ; Decimal
486	nt ; Di ; Digit
487	nt ; None ; None
488	nt ; Nu ; Numeric
489
490	# Script (sc)
491
492	sc ; Arab ; Arabic
493	sc ; Armn ; Armenian
494	sc ; Beng ; Bengali
495	sc ; Bopo ; Bopomofo
496	sc ; Brai ; Braille
497	sc ; Bugi ; Buginese
498	sc ; Buhd ; Buhid
499	sc ; Cans ; Canadian_Aboriginal
500	sc ; Cher ; Cherokee
501	sc ; Copt ; Coptic ; Qaac
502	sc ; Cprt ; Cypriot
503	sc ; Cyrl ; Cyrillic
504	sc ; Deva ; Devanagari
505	sc ; Dsrt ; Deseret
506	sc ; Ethi ; Ethiopic
507	sc ; Geor ; Georgian
508	sc ; Glag ; Glagolitic
509	sc ; Goth ; Gothic
510	sc ; Grek ; Greek
511	sc ; Gujr ; Gujarati
512	sc ; Guru ; Gurmukhi
513	sc ; Hang ; Hangul
514	sc ; Hani ; Han
515	sc ; Hano ; Hanunoo
516	sc ; Hebr ; Hebrew
517	sc ; Hira ; Hiragana
518	sc ; Hrkt ; Katakana_Or_Hiragana
519	sc ; Ital ; Old_Italic
520	sc ; Kana ; Katakana
521	sc ; Khar ; Kharoshthi
522	sc ; Khmr ; Khmer
523	sc ; Knda ; Kannada
524	sc ; Laoo ; Lao
525	sc ; Latn ; Latin
526	sc ; Limb ; Limbu
527	sc ; Linb ; Linear_B
528	sc ; Mlym ; Malayalam
529	sc ; Mong ; Mongolian
530	sc ; Mymr ; Myanmar
531	sc ; Ogam ; Ogham
532	sc ; Orya ; Oriya
533	sc ; Osma ; Osmanya
534	sc ; Qaai ; Inherited
535	sc ; Runr ; Runic
536	sc ; Shaw ; Shavian
537	sc ; Sinh ; Sinhala
538	sc ; Sylo ; Syloti_Nagri
539	sc ; Syrc ; Syriac
540	sc ; Tagb ; Tagbanwa
541	sc ; Tale ; Tai_Le
542	sc ; Talu ; New_Tai_Lue
543	sc ; Taml ; Tamil
544	sc ; Telu ; Telugu
545	sc ; Tfng ; Tifinagh
546	sc ; Tglg ; Tagalog
547	sc ; Thaa ; Thaana
548	sc ; Thai ; Thai
549	sc ; Tibt ; Tibetan
550	sc ; Ugar ; Ugaritic
551	sc ; Xpeo ; Old_Persian
552	sc ; Yiii ; Yi
553	sc ; Zyyy ; Common
554
555	# Sentence_Break (SB)
556
557	SB ; AT ; ATerm
558	SB ; CL ; Close
559	SB ; FO ; Format
560	SB ; LE ; OLetter
561	SB ; LO ; Lower
562	SB ; NU ; Numeric
563	SB ; SE ; Sep
564	SB ; SP ; Sp
565	SB ; ST ; STerm
566	SB ; UP ; Upper
567	SB ; XX ; Other
568
569	# Word_Break (WB)
570
571	WB ; EX ; ExtendNumLet
572	WB ; FO ; Format
573	WB ; KA ; Katakana
574	WB ; LE ; ALetter
575	WB ; ML ; MidLetter
576	WB ; MN ; MidNum
577	WB ; NU ; Numeric
578	WB ; XX ; Other