Initial commit of OpenSPARC T2 design and verification files.
[OpenSPARC-T2-DV] / tools / perl-5.8.0 / lib / 5.8.0 / Locale / Script.pm
CommitLineData
86530b38
AT
1#
2# Locale::Script - ISO codes for script identification (ISO 15924)
3#
4# $Id: Script.pm,v 2.2 2002/07/10 16:33:28 neilb Exp $
5#
6
7package Locale::Script;
8use strict;
9require 5.002;
10
11require Exporter;
12use Carp;
13use Locale::Constants;
14
15
16#-----------------------------------------------------------------------
17# Public Global Variables
18#-----------------------------------------------------------------------
19use vars qw($VERSION @ISA @EXPORT @EXPORT_OK);
20$VERSION = sprintf("%d.%02d", q$Revision: 2.2 $ =~ /(\d+)\.(\d+)/);
21@ISA = qw(Exporter);
22@EXPORT = qw(code2script script2code
23 all_script_codes all_script_names
24 script_code2code
25 LOCALE_CODE_ALPHA_2 LOCALE_CODE_ALPHA_3 LOCALE_CODE_NUMERIC);
26
27#-----------------------------------------------------------------------
28# Private Global Variables
29#-----------------------------------------------------------------------
30my $CODES = [];
31my $COUNTRIES = [];
32
33
34#=======================================================================
35#
36# code2script ( CODE [, CODESET ] )
37#
38#=======================================================================
39sub code2script
40{
41 my $code = shift;
42 my $codeset = @_ > 0 ? shift : LOCALE_CODE_DEFAULT;
43
44
45 return undef unless defined $code;
46
47 #-------------------------------------------------------------------
48 # Make sure the code is in the right form before we use it
49 # to look up the corresponding script.
50 # We have to sprintf because the codes are given as 3-digits,
51 # with leading 0's. Eg 070 for Egyptian demotic.
52 #-------------------------------------------------------------------
53 if ($codeset == LOCALE_CODE_NUMERIC)
54 {
55 return undef if ($code =~ /\D/);
56 $code = sprintf("%.3d", $code);
57 }
58 else
59 {
60 $code = lc($code);
61 }
62
63 if (exists $CODES->[$codeset]->{$code})
64 {
65 return $CODES->[$codeset]->{$code};
66 }
67 else
68 {
69 #---------------------------------------------------------------
70 # no such script code!
71 #---------------------------------------------------------------
72 return undef;
73 }
74}
75
76
77#=======================================================================
78#
79# script2code ( SCRIPT [, CODESET ] )
80#
81#=======================================================================
82sub script2code
83{
84 my $script = shift;
85 my $codeset = @_ > 0 ? shift : LOCALE_CODE_DEFAULT;
86
87
88 return undef unless defined $script;
89 $script = lc($script);
90 if (exists $COUNTRIES->[$codeset]->{$script})
91 {
92 return $COUNTRIES->[$codeset]->{$script};
93 }
94 else
95 {
96 #---------------------------------------------------------------
97 # no such script!
98 #---------------------------------------------------------------
99 return undef;
100 }
101}
102
103
104#=======================================================================
105#
106# script_code2code ( CODE, IN-CODESET, OUT-CODESET )
107#
108#=======================================================================
109sub script_code2code
110{
111 (@_ == 3) or croak "script_code2code() takes 3 arguments!";
112
113 my $code = shift;
114 my $inset = shift;
115 my $outset = shift;
116 my $outcode;
117 my $script;
118
119
120 return undef if $inset == $outset;
121 $script = code2script($code, $inset);
122 return undef if not defined $script;
123 $outcode = script2code($script, $outset);
124 return $outcode;
125}
126
127
128#=======================================================================
129#
130# all_script_codes()
131#
132#=======================================================================
133sub all_script_codes
134{
135 my $codeset = @_ > 0 ? shift : LOCALE_CODE_DEFAULT;
136
137 return keys %{ $CODES->[$codeset] };
138}
139
140
141#=======================================================================
142#
143# all_script_names()
144#
145#=======================================================================
146sub all_script_names
147{
148 my $codeset = @_ > 0 ? shift : LOCALE_CODE_DEFAULT;
149
150 return values %{ $CODES->[$codeset] };
151}
152
153
154#=======================================================================
155#
156# initialisation code - stuff the DATA into the ALPHA2 hash
157#
158#=======================================================================
159{
160 my ($alpha2, $alpha3, $numeric);
161 my $script;
162
163
164 while (<DATA>)
165 {
166 next unless /\S/;
167 chop;
168 ($alpha2, $alpha3, $numeric, $script) = split(/:/, $_, 4);
169
170 $CODES->[LOCALE_CODE_ALPHA_2]->{$alpha2} = $script;
171 $COUNTRIES->[LOCALE_CODE_ALPHA_2]->{"\L$script"} = $alpha2;
172
173 if ($alpha3)
174 {
175 $CODES->[LOCALE_CODE_ALPHA_3]->{$alpha3} = $script;
176 $COUNTRIES->[LOCALE_CODE_ALPHA_3]->{"\L$script"} = $alpha3;
177 }
178
179 if ($numeric)
180 {
181 $CODES->[LOCALE_CODE_NUMERIC]->{$numeric} = $script;
182 $COUNTRIES->[LOCALE_CODE_NUMERIC]->{"\L$script"} = $numeric;
183 }
184
185 }
186
187 close(DATA);
188}
189
1901;
191
192__DATA__
193am:ama:130:Aramaic
194ar:ara:160:Arabic
195av:ave:151:Avestan
196bh:bhm:300:Brahmi (Ashoka)
197bi:bid:372:Buhid
198bn:ben:325:Bengali
199bo:bod:330:Tibetan
200bp:bpm:285:Bopomofo
201br:brl:570:Braille
202bt:btk:365:Batak
203bu:bug:367:Buginese (Makassar)
204by:bys:550:Blissymbols
205ca:cam:358:Cham
206ch:chu:221:Old Church Slavonic
207ci:cir:291:Cirth
208cm:cmn:402:Cypro-Minoan
209co:cop:205:Coptic
210cp:cpr:403:Cypriote syllabary
211cy:cyr:220:Cyrillic
212ds:dsr:250:Deserel (Mormon)
213dv:dvn:315:Devanagari (Nagari)
214ed:egd:070:Egyptian demotic
215eg:egy:050:Egyptian hieroglyphs
216eh:egh:060:Egyptian hieratic
217el:ell:200:Greek
218eo:eos:210:Etruscan and Oscan
219et:eth:430:Ethiopic
220gl:glg:225:Glagolitic
221gm:gmu:310:Gurmukhi
222gt:gth:206:Gothic
223gu:guj:320:Gujarati
224ha:han:500:Han ideographs
225he:heb:125:Hebrew
226hg:hgl:420:Hangul
227hm:hmo:450:Pahawh Hmong
228ho:hoo:371:Hanunoo
229hr:hrg:410:Hiragana
230hu:hun:176:Old Hungarian runic
231hv:hvn:175:Kok Turki runic
232hy:hye:230:Armenian
233iv:ivl:610:Indus Valley
234ja:jap:930:(alias for Han + Hiragana + Katakana)
235jl:jlg:445:Cherokee syllabary
236jw:jwi:360:Javanese
237ka:kam:241:Georgian (Mxedruli)
238kh:khn:931:(alias for Hangul + Han)
239kk:kkn:411:Katakana
240km:khm:354:Khmer
241kn:kan:345:Kannada
242kr:krn:357:Karenni (Kayah Li)
243ks:kst:305:Kharoshthi
244kx:kax:240:Georgian (Xucuri)
245la:lat:217:Latin
246lf:laf:215:Latin (Fraktur variant)
247lg:lag:216:Latin (Gaelic variant)
248lo:lao:356:Lao
249lp:lpc:335:Lepcha (Rong)
250md:mda:140:Mandaean
251me:mer:100:Meroitic
252mh:may:090:Mayan hieroglyphs
253ml:mlm:347:Malayalam
254mn:mon:145:Mongolian
255my:mya:350:Burmese
256na:naa:400:Linear A
257nb:nbb:401:Linear B
258og:ogm:212:Ogham
259or:ory:327:Oriya
260os:osm:260:Osmanya
261ph:phx:115:Phoenician
262ph:pah:150:Pahlavi
263pl:pld:282:Pollard Phonetic
264pq:pqd:295:Klingon plQaD
265pr:prm:227:Old Permic
266ps:pst:600:Phaistos Disk
267rn:rnr:211:Runic (Germanic)
268rr:rro:620:Rongo-rongo
269sa:sar:110:South Arabian
270si:sin:348:Sinhala
271sj:syj:137:Syriac (Jacobite variant)
272sl:slb:440:Unified Canadian Aboriginal Syllabics
273sn:syn:136:Syriac (Nestorian variant)
274sw:sww:281:Shavian (Shaw)
275sy:syr:135:Syriac (Estrangelo)
276ta:tam:346:Tamil
277tb:tbw:373:Tagbanwa
278te:tel:340:Telugu
279tf:tfn:120:Tifnagh
280tg:tag:370:Tagalog
281th:tha:352:Thai
282tn:tna:170:Thaana
283tw:twr:290:Tengwar
284va:vai:470:Vai
285vs:vsp:280:Visible Speech
286xa:xas:000:Cuneiform, Sumero-Akkadian
287xf:xfa:105:Cuneiform, Old Persian
288xk:xkn:412:(alias for Hiragana + Katakana)
289xu:xug:106:Cuneiform, Ugaritic
290yi:yii:460:Yi
291zx:zxx:997:Unwritten language
292zy:zyy:998:Undetermined script
293zz:zzz:999:Uncoded script