1# PropertyValueAliases-4.1.0.txt
2# Date: 2005-03-28, 17:21:48 GMT [MD]
3#
4# Unicode Character Database
5# Copyright (c) 1991-2005 Unicode, Inc.
6# For terms of use, see http://www.unicode.org/terms_of_use.html
7# For documentation, see UCD.html
8#
9# This file contains aliases for property values used in the UCD.
10# These names can be used for XML formats of UCD data, for regular-expression
11# property tests, and other programmatic textual descriptions of Unicode data.
12# For information on which properties are normative, see UCD.html.
13#
14# The names may be translated in appropriate environments, and additional
15# aliases may be useful.
16#
17# FORMAT
18#
19# Each line describes a property value name and
20# consists of three or more fields, separated by semicolons.
21#
22# First Field: The first field describes the property for which that
23# property value name is used.
24#
25# Second Field: The second field is an abbreviated name.
26# If there is no abbreviated name available, the field is marked with "n/a".
27#
28# Third Field: The third field is a long name.
29#
30# In the case of ccc, there are 4 fields: the second field is the numeric value,
31# the third is the abbreviated name, and the fourth is the long name.
32#
33# The above are the preferred aliases. Other aliases may be listed in additional fields.
34#
35# Loose matching should be applied to all property names and property values, with
36# the exception of String Property values. With loose matching of property names and
37# values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
38# values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
39#
40# NOTE: Property value names are NOT unique across properties. For example:
41#
42#   AL means Arabic Letter for the Bidi_Class property, and
43#   AL means Above_Left for the Canonical_Combining_Class property, and
44#   AL means Alphabetic for the Line_Break property.
45#
46# In addition, some property names may be the same as some property value names.
47# For example:
48#
49#   sc means the Script property, and
50#   Sc means the General_Category property value Currency_Symbol (Sc)
51#
52# The combination of property value and property name is, however, unique.
53#
54# For more information, see UTS #18: Unicode Regular Expressions
55# ================================================
56
57
58# Age (age)
59
60age; n/a       ; 1.1
61age; n/a       ; 2.0
62age; n/a       ; 2.1
63age; n/a       ; 3.0
64age; n/a       ; 3.1
65age; n/a       ; 3.2
66age; n/a       ; 4.0
67age; n/a       ; 4.1
68age; n/a       ; unassigned
69
70# Bidi_Class (bc)
71
72bc ; AL        ; Arabic_Letter
73bc ; AN        ; Arabic_Number
74bc ; B         ; Paragraph_Separator
75bc ; BN        ; Boundary_Neutral
76bc ; CS        ; Common_Separator
77bc ; EN        ; European_Number
78bc ; ES        ; European_Separator
79bc ; ET        ; European_Terminator
80bc ; L         ; Left_To_Right
81bc ; LRE       ; Left_To_Right_Embedding
82bc ; LRO       ; Left_To_Right_Override
83bc ; NSM       ; Nonspacing_Mark
84bc ; ON        ; Other_Neutral
85bc ; PDF       ; Pop_Directional_Format
86bc ; R         ; Right_To_Left
87bc ; RLE       ; Right_To_Left_Embedding
88bc ; RLO       ; Right_To_Left_Override
89bc ; S         ; Segment_Separator
90bc ; WS        ; White_Space
91
92# Block (blk)
93
94blk; n/a       ; Aegean_Numbers
95blk; n/a       ; Alphabetic_Presentation_Forms
96blk; n/a       ; Ancient_Greek_Musical_Notation
97blk; n/a       ; Ancient_Greek_Numbers
98blk; n/a       ; Arabic
99blk; n/a       ; Arabic_Presentation_Forms-A
100blk; n/a       ; Arabic_Presentation_Forms-B
101blk; n/a       ; Arabic_Supplement
102blk; n/a       ; Armenian
103blk; n/a       ; Arrows
104blk; n/a       ; Basic_Latin
105blk; n/a       ; Bengali
106blk; n/a       ; Block_Elements
107blk; n/a       ; Bopomofo
108blk; n/a       ; Bopomofo_Extended
109blk; n/a       ; Box_Drawing
110blk; n/a       ; Braille_Patterns
111blk; n/a       ; Buginese
112blk; n/a       ; Buhid
113blk; n/a       ; Byzantine_Musical_Symbols
114blk; n/a       ; Cherokee
115blk; n/a       ; CJK_Compatibility
116blk; n/a       ; CJK_Compatibility_Forms
117blk; n/a       ; CJK_Compatibility_Ideographs
118blk; n/a       ; CJK_Compatibility_Ideographs_Supplement
119blk; n/a       ; CJK_Radicals_Supplement
120blk; n/a       ; CJK_Strokes
121blk; n/a       ; CJK_Symbols_and_Punctuation
122blk; n/a       ; CJK_Unified_Ideographs
123blk; n/a       ; CJK_Unified_Ideographs_Extension_A
124blk; n/a       ; CJK_Unified_Ideographs_Extension_B
125blk; n/a       ; Combining_Diacritical_Marks
126blk; n/a       ; Combining_Diacritical_Marks_for_Symbols
127blk; n/a       ; Combining_Diacritical_Marks_Supplement
128blk; n/a       ; Combining_Half_Marks
129blk; n/a       ; Control_Pictures
130blk; n/a       ; Coptic
131blk; n/a       ; Currency_Symbols
132blk; n/a       ; Cypriot_Syllabary
133blk; n/a       ; Cyrillic
134blk; n/a       ; Cyrillic_Supplement              ; Cyrillic_Supplementary
135blk; n/a       ; Deseret
136blk; n/a       ; Devanagari
137blk; n/a       ; Dingbats
138blk; n/a       ; Enclosed_Alphanumerics
139blk; n/a       ; Enclosed_CJK_Letters_and_Months
140blk; n/a       ; Ethiopic
141blk; n/a       ; Ethiopic_Extended
142blk; n/a       ; Ethiopic_Supplement
143blk; n/a       ; General_Punctuation
144blk; n/a       ; Geometric_Shapes
145blk; n/a       ; Georgian
146blk; n/a       ; Georgian_Supplement
147blk; n/a       ; Glagolitic
148blk; n/a       ; Gothic
149blk; n/a       ; Greek_and_Coptic
150blk; n/a       ; Greek_Extended
151blk; n/a       ; Gujarati
152blk; n/a       ; Gurmukhi
153blk; n/a       ; Halfwidth_and_Fullwidth_Forms
154blk; n/a       ; Hangul_Compatibility_Jamo
155blk; n/a       ; Hangul_Jamo
156blk; n/a       ; Hangul_Syllables
157blk; n/a       ; Hanunoo
158blk; n/a       ; Hebrew
159blk; n/a       ; High_Private_Use_Surrogates
160blk; n/a       ; High_Surrogates
161blk; n/a       ; Hiragana
162blk; n/a       ; Ideographic_Description_Characters
163blk; n/a       ; IPA_Extensions
164blk; n/a       ; Kanbun
165blk; n/a       ; Kangxi_Radicals
166blk; n/a       ; Kannada
167blk; n/a       ; Katakana
168blk; n/a       ; Katakana_Phonetic_Extensions
169blk; n/a       ; Kharoshthi
170blk; n/a       ; Khmer
171blk; n/a       ; Khmer_Symbols
172blk; n/a       ; Lao
173blk; n/a       ; Latin-1_Supplement
174blk; n/a       ; Latin_Extended-A
175blk; n/a       ; Latin_Extended-B
176blk; n/a       ; Latin_Extended_Additional
177blk; n/a       ; Letterlike_Symbols
178blk; n/a       ; Limbu
179blk; n/a       ; Linear_B_Ideograms
180blk; n/a       ; Linear_B_Syllabary
181blk; n/a       ; Low_Surrogates
182blk; n/a       ; Malayalam
183blk; n/a       ; Mathematical_Alphanumeric_Symbols
184blk; n/a       ; Mathematical_Operators
185blk; n/a       ; Miscellaneous_Mathematical_Symbols-A
186blk; n/a       ; Miscellaneous_Mathematical_Symbols-B
187blk; n/a       ; Miscellaneous_Symbols
188blk; n/a       ; Miscellaneous_Symbols_and_Arrows
189blk; n/a       ; Miscellaneous_Technical
190blk; n/a       ; Modifier_Tone_Letters
191blk; n/a       ; Mongolian
192blk; n/a       ; Musical_Symbols
193blk; n/a       ; Myanmar
194blk; n/a       ; New_Tai_Lue
195blk; n/a       ; No_Block
196blk; n/a       ; Number_Forms
197blk; n/a       ; Ogham
198blk; n/a       ; Old_Italic
199blk; n/a       ; Old_Persian
200blk; n/a       ; Optical_Character_Recognition
201blk; n/a       ; Oriya
202blk; n/a       ; Osmanya
203blk; n/a       ; Phonetic_Extensions
204blk; n/a       ; Phonetic_Extensions_Supplement
205blk; n/a       ; Private_Use_Area
206blk; n/a       ; Runic
207blk; n/a       ; Shavian
208blk; n/a       ; Sinhala
209blk; n/a       ; Small_Form_Variants
210blk; n/a       ; Spacing_Modifier_Letters
211blk; n/a       ; Specials
212blk; n/a       ; Superscripts_and_Subscripts
213blk; n/a       ; Supplemental_Arrows-A
214blk; n/a       ; Supplemental_Arrows-B
215blk; n/a       ; Supplemental_Mathematical_Operators
216blk; n/a       ; Supplemental_Punctuation
217blk; n/a       ; Supplementary_Private_Use_Area-A
218blk; n/a       ; Supplementary_Private_Use_Area-B
219blk; n/a       ; Syloti_Nagri
220blk; n/a       ; Syriac
221blk; n/a       ; Tagalog
222blk; n/a       ; Tagbanwa
223blk; n/a       ; Tags
224blk; n/a       ; Tai_Le
225blk; n/a       ; Tai_Xuan_Jing_Symbols
226blk; n/a       ; Tamil
227blk; n/a       ; Telugu
228blk; n/a       ; Thaana
229blk; n/a       ; Thai
230blk; n/a       ; Tibetan
231blk; n/a       ; Tifinagh
232blk; n/a       ; Ugaritic
233blk; n/a       ; Unified_Canadian_Aboriginal_Syllabics
234blk; n/a       ; Variation_Selectors
235blk; n/a       ; Variation_Selectors_Supplement
236blk; n/a       ; Vertical_Forms
237blk; n/a       ; Yi_Radicals
238blk; n/a       ; Yi_Syllables
239blk; n/a       ; Yijing_Hexagram_Symbols
240
241# Canonical_Combining_Class (ccc)
242
243ccc;   0; NR   ; Not_Reordered
244ccc;   1; OV   ; Overlay
245ccc;   7; NK   ; Nukta
246ccc;   8; KV   ; Kana_Voicing
247ccc;   9; VR   ; Virama
248ccc; 200; ATBL ; Attached_Below_Left
249ccc; 202; ATB  ; Attached_Below
250ccc; 216; ATAR ; Attached_Above_Right
251ccc; 218; BL   ; Below_Left
252ccc; 220; B    ; Below
253ccc; 222; BR   ; Below_Right
254ccc; 224; L    ; Left
255ccc; 226; R    ; Right
256ccc; 228; AL   ; Above_Left
257ccc; 230; A    ; Above
258ccc; 232; AR   ; Above_Right
259ccc; 233; DB   ; Double_Below
260ccc; 234; DA   ; Double_Above
261ccc; 240; IS   ; Iota_Subscript
262
263# Decomposition_Type (dt)
264
265dt ; can       ; Canonical
266dt ; com       ; Compat
267dt ; enc       ; Circle
268dt ; fin       ; Final
269dt ; font      ; Font
270dt ; fra       ; Fraction
271dt ; init      ; Initial
272dt ; iso       ; Isolated
273dt ; med       ; Medial
274dt ; nar       ; Narrow
275dt ; nb        ; Nobreak
276dt ; none      ; None
277dt ; sml       ; Small
278dt ; sqr       ; Square
279dt ; sub       ; Sub
280dt ; sup       ; Super
281dt ; vert      ; Vertical
282dt ; wide      ; Wide
283
284# East_Asian_Width (ea)
285
286ea ; A         ; Ambiguous
287ea ; F         ; Fullwidth
288ea ; H         ; Halfwidth
289ea ; N         ; Neutral
290ea ; Na        ; Narrow
291ea ; W         ; Wide
292
293# General_Category (gc)
294
295gc ; C         ; Other                            # Cc | Cf | Cn | Co | Cs
296gc ; Cc        ; Control                          ; cntrl
297gc ; Cf        ; Format
298gc ; Cn        ; Unassigned
299gc ; Co        ; Private_Use
300gc ; Cs        ; Surrogate
301gc ; L         ; Letter                           # Ll | Lm | Lo | Lt | Lu
302gc ; LC        ; Cased_Letter                     # Ll | Lt | Lu
303gc ; Ll        ; Lowercase_Letter
304gc ; Lm        ; Modifier_Letter
305gc ; Lo        ; Other_Letter
306gc ; Lt        ; Titlecase_Letter
307gc ; Lu        ; Uppercase_Letter
308gc ; M         ; Mark                             # Mc | Me | Mn
309gc ; Mc        ; Spacing_Mark
310gc ; Me        ; Enclosing_Mark
311gc ; Mn        ; Nonspacing_Mark
312gc ; N         ; Number                           # Nd | Nl | No
313gc ; Nd        ; Decimal_Number                   ; digit
314gc ; Nl        ; Letter_Number
315gc ; No        ; Other_Number
316gc ; P         ; Punctuation                      ; punct                            # Pc | Pd | Pe | Pf | Pi | Po | Ps
317gc ; Pc        ; Connector_Punctuation
318gc ; Pd        ; Dash_Punctuation
319gc ; Pe        ; Close_Punctuation
320gc ; Pf        ; Final_Punctuation
321gc ; Pi        ; Initial_Punctuation
322gc ; Po        ; Other_Punctuation
323gc ; Ps        ; Open_Punctuation
324gc ; S         ; Symbol                           # Sc | Sk | Sm | So
325gc ; Sc        ; Currency_Symbol
326gc ; Sk        ; Modifier_Symbol
327gc ; Sm        ; Math_Symbol
328gc ; So        ; Other_Symbol
329gc ; Z         ; Separator                        # Zl | Zp | Zs
330gc ; Zl        ; Line_Separator
331gc ; Zp        ; Paragraph_Separator
332gc ; Zs        ; Space_Separator
333
334# Grapheme_Cluster_Break (GCB)
335
336GCB; CN        ; Control
337GCB; CR        ; CR
338GCB; EX        ; Extend
339GCB; L         ; L
340GCB; LF        ; LF
341GCB; LV        ; LV
342GCB; LVT       ; LVT
343GCB; T         ; T
344GCB; V         ; V
345GCB; XX        ; Other
346
347# Hangul_Syllable_Type (hst)
348
349hst; L         ; Leading_Jamo
350hst; LV        ; LV_Syllable
351hst; LVT       ; LVT_Syllable
352hst; NA        ; Not_Applicable
353hst; T         ; Trailing_Jamo
354hst; V         ; Vowel_Jamo
355
356# Joining_Group (jg)
357
358jg ; n/a       ; Ain
359jg ; n/a       ; Alaph
360jg ; n/a       ; Alef
361jg ; n/a       ; Beh
362jg ; n/a       ; Beth
363jg ; n/a       ; Dal
364jg ; n/a       ; Dalath_Rish
365jg ; n/a       ; E
366jg ; n/a       ; Fe
367jg ; n/a       ; Feh
368jg ; n/a       ; Final_Semkath
369jg ; n/a       ; Gaf
370jg ; n/a       ; Gamal
371jg ; n/a       ; Hah
372jg ; n/a       ; Hamza_On_Heh_Goal
373jg ; n/a       ; He
374jg ; n/a       ; Heh
375jg ; n/a       ; Heh_Goal
376jg ; n/a       ; Heth
377jg ; n/a       ; Kaf
378jg ; n/a       ; Kaph
379jg ; n/a       ; Khaph
380jg ; n/a       ; Knotted_Heh
381jg ; n/a       ; Lam
382jg ; n/a       ; Lamadh
383jg ; n/a       ; Meem
384jg ; n/a       ; Mim
385jg ; n/a       ; No_Joining_Group
386jg ; n/a       ; Noon
387jg ; n/a       ; Nun
388jg ; n/a       ; Pe
389jg ; n/a       ; Qaf
390jg ; n/a       ; Qaph
391jg ; n/a       ; Reh
392jg ; n/a       ; Reversed_Pe
393jg ; n/a       ; Sad
394jg ; n/a       ; Sadhe
395jg ; n/a       ; Seen
396jg ; n/a       ; Semkath
397jg ; n/a       ; Shin
398jg ; n/a       ; Swash_Kaf
399jg ; n/a       ; Syriac_Waw
400jg ; n/a       ; Tah
401jg ; n/a       ; Taw
402jg ; n/a       ; Teh_Marbuta
403jg ; n/a       ; Teth
404jg ; n/a       ; Waw
405jg ; n/a       ; Yeh
406jg ; n/a       ; Yeh_Barree
407jg ; n/a       ; Yeh_With_Tail
408jg ; n/a       ; Yudh
409jg ; n/a       ; Yudh_He
410jg ; n/a       ; Zain
411jg ; n/a       ; Zhain
412
413# Joining_Type (jt)
414
415jt ; C         ; Join_Causing
416jt ; D         ; Dual_Joining
417jt ; L         ; Left_Joining
418jt ; R         ; Right_Joining
419jt ; T         ; Transparent
420jt ; U         ; Non_Joining
421
422# Line_Break (lb)
423
424lb ; AI        ; Ambiguous
425lb ; AL        ; Alphabetic
426lb ; B2        ; Break_Both
427lb ; BA        ; Break_After
428lb ; BB        ; Break_Before
429lb ; BK        ; Mandatory_Break
430lb ; CB        ; Contingent_Break
431lb ; CL        ; Close_Punctuation
432lb ; CM        ; Combining_Mark
433lb ; CR        ; Carriage_Return
434lb ; EX        ; Exclamation
435lb ; GL        ; Glue
436lb ; H2        ; H2
437lb ; H3        ; H3
438lb ; HY        ; Hyphen
439lb ; ID        ; Ideographic
440lb ; IN        ; Inseparable                      ; Inseperable
441lb ; IS        ; Infix_Numeric
442lb ; JL        ; JL
443lb ; JT        ; JT
444lb ; JV        ; JV
445lb ; LF        ; Line_Feed
446lb ; NL        ; Next_Line
447lb ; NS        ; Nonstarter
448lb ; NU        ; Numeric
449lb ; OP        ; Open_Punctuation
450lb ; PO        ; Postfix_Numeric
451lb ; PR        ; Prefix_Numeric
452lb ; QU        ; Quotation
453lb ; SA        ; Complex_Context
454lb ; SG        ; Surrogate
455lb ; SP        ; Space
456lb ; SY        ; Break_Symbols
457lb ; WJ        ; Word_Joiner
458lb ; XX        ; Unknown
459lb ; ZW        ; ZWSpace
460
461# NFC_Quick_Check (NFC_QC)
462
463NFC_QC; M      ; Maybe
464NFC_QC; N      ; No
465NFC_QC; Y      ; Yes
466
467# NFD_Quick_Check (NFD_QC)
468
469NFD_QC; N      ; No
470NFD_QC; Y      ; Yes
471
472# NFKC_Quick_Check (NFKC_QC)
473
474NFKC_QC; M     ; Maybe
475NFKC_QC; N     ; No
476NFKC_QC; Y     ; Yes
477
478# NFKD_Quick_Check (NFKD_QC)
479
480NFKD_QC; N     ; No
481NFKD_QC; Y     ; Yes
482
483# Numeric_Type (nt)
484
485nt ; De        ; Decimal
486nt ; Di        ; Digit
487nt ; None      ; None
488nt ; Nu        ; Numeric
489
490# Script (sc)
491
492sc ; Arab      ; Arabic
493sc ; Armn      ; Armenian
494sc ; Beng      ; Bengali
495sc ; Bopo      ; Bopomofo
496sc ; Brai      ; Braille
497sc ; Bugi      ; Buginese
498sc ; Buhd      ; Buhid
499sc ; Cans      ; Canadian_Aboriginal
500sc ; Cher      ; Cherokee
501sc ; Copt      ; Coptic                           ; Qaac
502sc ; Cprt      ; Cypriot
503sc ; Cyrl      ; Cyrillic
504sc ; Deva      ; Devanagari
505sc ; Dsrt      ; Deseret
506sc ; Ethi      ; Ethiopic
507sc ; Geor      ; Georgian
508sc ; Glag      ; Glagolitic
509sc ; Goth      ; Gothic
510sc ; Grek      ; Greek
511sc ; Gujr      ; Gujarati
512sc ; Guru      ; Gurmukhi
513sc ; Hang      ; Hangul
514sc ; Hani      ; Han
515sc ; Hano      ; Hanunoo
516sc ; Hebr      ; Hebrew
517sc ; Hira      ; Hiragana
518sc ; Hrkt      ; Katakana_Or_Hiragana
519sc ; Ital      ; Old_Italic
520sc ; Kana      ; Katakana
521sc ; Khar      ; Kharoshthi
522sc ; Khmr      ; Khmer
523sc ; Knda      ; Kannada
524sc ; Laoo      ; Lao
525sc ; Latn      ; Latin
526sc ; Limb      ; Limbu
527sc ; Linb      ; Linear_B
528sc ; Mlym      ; Malayalam
529sc ; Mong      ; Mongolian
530sc ; Mymr      ; Myanmar
531sc ; Ogam      ; Ogham
532sc ; Orya      ; Oriya
533sc ; Osma      ; Osmanya
534sc ; Qaai      ; Inherited
535sc ; Runr      ; Runic
536sc ; Shaw      ; Shavian
537sc ; Sinh      ; Sinhala
538sc ; Sylo      ; Syloti_Nagri
539sc ; Syrc      ; Syriac
540sc ; Tagb      ; Tagbanwa
541sc ; Tale      ; Tai_Le
542sc ; Talu      ; New_Tai_Lue
543sc ; Taml      ; Tamil
544sc ; Telu      ; Telugu
545sc ; Tfng      ; Tifinagh
546sc ; Tglg      ; Tagalog
547sc ; Thaa      ; Thaana
548sc ; Thai      ; Thai
549sc ; Tibt      ; Tibetan
550sc ; Ugar      ; Ugaritic
551sc ; Xpeo      ; Old_Persian
552sc ; Yiii      ; Yi
553sc ; Zyyy      ; Common
554
555# Sentence_Break (SB)
556
557SB ; AT        ; ATerm
558SB ; CL        ; Close
559SB ; FO        ; Format
560SB ; LE        ; OLetter
561SB ; LO        ; Lower
562SB ; NU        ; Numeric
563SB ; SE        ; Sep
564SB ; SP        ; Sp
565SB ; ST        ; STerm
566SB ; UP        ; Upper
567SB ; XX        ; Other
568
569# Word_Break (WB)
570
571WB ; EX        ; ExtendNumLet
572WB ; FO        ; Format
573WB ; KA        ; Katakana
574WB ; LE        ; ALetter
575WB ; ML        ; MidLetter
576WB ; MN        ; MidNum
577WB ; NU        ; Numeric
578WB ; XX        ; Other
579