4 % This file is part of the GNU C Library and contains locale data.
5 % The Free Software Foundation does not claim any copyright interest
6 % in the locale data contained in this file. The foregoing does not
7 % affect the license of the GNU C Library as a whole. It does not
8 % exempt you from the conditions of the license if your use would
9 % otherwise be governed by that license.
11 % Uzbek (latin) language locale for Uzbekistan
12 % Source: Bobir Ismailov
13 % Contact: Bobir Ismailov, Pablo Saratxaga, Mashrab Kuvatov
14 % Email: bobir_is@yahoo.com, pablo@mandrakesoft.com, kmashrab@uni-bremen.de
24 % 2002-09-09 Mashrab Kuvatov <kmashrab@uni-bremen.de>
25 % LC_TIME-day: Changed the first letter of all day names to upper case.
26 % LC_TIME-mon: Changed the first letter of all month names to upper case.
27 % Fixed a typo. September is not Senyabr, but Sentyabr.
28 % LC_TIME-abmon: Corrected "Yav" (Yanvar) to "Yan".
30 % 2003-02-24 Mashrab Kuvatov <kmashrab@uni-bremen.de>
31 % Changed charset to UTF-8
33 % ?????????? Pablo Saratxaga <pablo@mandrakesoft.com>
34 % LC_CTYPE: Added transliteration from cyrillic to latin.
35 % LC_COLLATE: Added reodering definition.
38 title "Uzbek (latin) locale for Uzbekistan"
39 source "Bobir Ismailov"
41 contact "Bobir Ismailov, Pablo Saratxaga, Mashrab Kuvatov"
42 email "bobir_is@yahoo.com, pablo@mandrakesoft.com, kmashrab@uni-bremen.de"
46 territory "Uzbekistan"
50 category "i18n:2012";LC_IDENTIFICATION
51 category "i18n:2012";LC_CTYPE
52 category "i18n:2012";LC_COLLATE
53 category "i18n:2012";LC_TIME
54 category "i18n:2012";LC_NUMERIC
55 category "i18n:2012";LC_MONETARY
56 category "i18n:2012";LC_MESSAGES
57 category "i18n:2012";LC_PAPER
58 category "i18n:2012";LC_NAME
59 category "i18n:2012";LC_ADDRESS
60 category "i18n:2012";LC_TELEPHONE
61 category "i18n:2012";LC_MEASUREMENT
68 include "translit_combining";""
73 <U0430> "<U0061>" % a= -> a
74 <U0431> "<U0062>" % b= -> b
75 <U0432> "<U0076>" % v= -> v
76 <U0433> "<U0067>" % g= -> g
77 <U0434> "<U0064>" % d= -> d
78 <U0435> "<U0065>" % e= -> e (ye also, but context dependent)
79 <U0451> "<U0079><U006F>" % io -> yo
80 <U0436> "<U006A>" % z% -> j
81 <U0437> "<U007A>" % z= -> z
82 <U0438> "<U0069>" % i= -> i
83 <U0439> "<U0079>" % j= -> y
84 <U043A> "<U006B>" % k= -> k
85 <U043B> "<U006C>" % l= -> l
86 <U043C> "<U006D>" % m= -> m
87 <U043D> "<U006E>" % n= -> n
88 <U043E> "<U006F>" % o= -> o
89 <U043F> "<U0070>" % p= -> p
90 <U0440> "<U0072>" % r= -> r
91 <U0441> "<U0073>" % s= -> s
92 <U0442> "<U0074>" % t= -> t
93 <U0443> "<U0075>" % u= -> u
94 <U0444> "<U0066>" % f= -> f
95 <U0445> "<U0078>" % h= -> x
96 <U0446> "<U0074><U0073>" % c= -> ts
97 <U0447> "<U0063><U0068>" % c% -> ch
98 <U0448> "<U0073><U0068>" % s% -> sh
99 <U0449> "<U0073><U0068>" % shcha -> sh
100 <U044A> "<U0027>" % hard sign= -> '
101 <U044B> "<U0069>" % yeru -> 1
102 <U044C> "" % soft sign omitted. not in latin-uzbek alphabet. stupid, but it is a fact.
103 <U044D> "<U0065>" % je= -> e
104 <U044E> "<U0079><U0075>" % ju -> yu
105 <U044F> "<U0079><U0061>" % ja -> ya
106 <U045E> "<U006F><U0027>" % v% -> o'
107 <U049B> "<U0071>" % k,= -> q
108 <U0493> "<U0067><U0027>" % g-= -> g'
109 <U04B3> "<U0068>" % h,= -> h
113 <U0410> "<U0041>" % a= -> a
114 <U0411> "<U0042>" % b= -> b
115 <U0412> "<U0056>" % v= -> v
116 <U0413> "<U0047>" % g= -> g
117 <U0414> "<U0044>" % d= -> d
118 <U0415> "<U0045>" % e= -> e (ye also, but context dependent)
119 <U0401> "<U0059><U006F>" % io -> yo
120 <U0416> "<U004A>" % z% -> j
121 <U0417> "<U005A>" % z= -> z
122 <U0418> "<U0049>" % i= -> i
123 <U0419> "<U0059>" % j= -> y
124 <U041A> "<U004B>" % k= -> k
125 <U041B> "<U004C>" % l= -> l
126 <U041C> "<U004D>" % m= -> m
127 <U041D> "<U004E>" % n= -> n
128 <U041E> "<U004F>" % o= -> o
129 <U041F> "<U0050>" % p= -> p
130 <U0420> "<U0052>" % r= -> r
131 <U0421> "<U0053>" % s= -> s
132 <U0422> "<U0054>" % t= -> t
133 <U0423> "<U0055>" % u= -> u
134 <U0424> "<U0046>" % f= -> f
135 <U0425> "<U0058>" % h= -> x
136 <U0426> "<U0054><U0073>" % c= -> ts
137 <U0427> "<U0043><U0068>" % c% -> ch
138 <U0428> "<U0053><U0068>" % s% -> sh
139 <U0429> "<U0053><U0068>" % shcha -> sh
140 <U042A> "<U0027>" % hard sign= -> '
141 <U042B> "<U0049>" % yeru -> i
142 <U042C> "" % soft sign omitted. not in latin-uzbek alphabet. stupid, but it is a fact.
143 <U042D> "<U0045>" % je -> e
144 <U042E> "<U0059><U0075>" % ju -> yu
145 <U042F> "<U0059><U0061>" % ja -> ya
146 <U040E> "<U004F><U0027>" % v% -> o'
147 <U049A> "<U0051>" % k,= -> q
148 <U0492> "<U0047><U0027>" % g-= -> g'
149 <U04B2> "<U0048>" % h,= -> h
151 % various punctuation
152 <U02BB> "<U0027>" % ‘ -> '
158 % CLDR collation rules for Uzbek:
159 % (see: https://unicode.org/cldr/trac/browser/trunk/common/collation/uz.xml)
162 % <collation type="standard"><cr><![CDATA[
163 % # The following letters sort after z, see
164 % # https://en.wikipedia.org/wiki/Uzbek_alphabet#Alphabetical_order
165 % # Native speaker+linguists say that
166 % # the digraph ⟨ng⟩ and the symbol ⟨ʼ⟩ are not considered separate letters.
168 % # Reset between the last z-like letter and ezh.
170 % # U+02BB ʻ MODIFIER LETTER TURNED COMMA is hard to type, so make
171 % # equivalent contractions with U+2018 ‘ LEFT SINGLE QUOTATION MARK
172 % # and U+0027 APOSTROPHE.
173 % # (https://en.wikipedia.org/wiki/Uzbek_alphabet#Distinct_characters)
174 % # Remember that a pair of apostrophes encodes just one of them.
175 % &[before 1]ʒ<oʻ=o‘=o''<<<Oʻ=O‘=O''
176 % <gʻ=g‘=g''<<<Gʻ=G‘=G''
179 % ]]></cr></collation>
182 % And CLDR also lists the following
184 % (see: https://unicode.org/cldr/trac/browser/trunk/common/main/uz.xml)
186 % <exemplarCharacters type="index">[A B D E F G H I J K L M N O P Q R S T U V X Y Z {Oʻ} {Gʻ} {Sh} {Ch}]</exemplarCharacters>
189 collating-symbol <g'-digraph>
190 collating-symbol <o'-digraph>
191 collating-element <g-turned-comma> from "g<U02BB>"
192 collating-element <G-turned-comma> from "G<U02BB>"
193 collating-element <o-turned-comma> from "o<U02BB>"
194 collating-element <O-turned-comma> from "O<U02BB>"
195 % Unfortunately we cannot use “left single quotation mark” because
196 % it fails when creating the uz_UZ.iso88591 locale. In UTF-8 it works
197 % but in ISO-8859-1 one gets error messages that it uses the same
198 % encoding as “turned comma”
199 % collating-element <g-left-single-quotation-mark> from "g<U2018>"
200 % collating-element <G-left-single-quotation-mark> from "G<U2018>"
201 % collating-element <o-left-single-quotation-mark> from "o<U2018>"
202 % collating-element <O-left-single-quotation-mark> from "O<U2018>"
203 collating-element <g-double-apostrophe> from "g''"
204 collating-element <G-double-apostrophe> from "G''"
205 collating-element <o-double-apostrophe> from "o''"
206 collating-element <O-double-apostrophe> from "O''"
207 collating-symbol <sh-digraph>
208 collating-element <sh> from "sh"
209 collating-element <sH> from "sH"
210 collating-element <Sh> from "Sh"
211 collating-element <SH> from "SH"
212 collating-symbol <ch-digraph>
213 collating-element <ch> from "ch"
214 collating-element <cH> from "cH"
215 collating-element <Ch> from "Ch"
216 collating-element <CH> from "CH"
218 reorder-after <AFTER-Z>
224 <o-turned-comma> <o'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT1>
225 <O-turned-comma> <o'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT1>
226 % <o-left-single-quotation-mark> <o'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT2>
227 % <O-left-single-quotation-mark> <o'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT2>
228 <o-double-apostrophe> <o'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT3>
229 <O-double-apostrophe> <o'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT3>
230 <g-turned-comma> <g'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT1>
231 <G-turned-comma> <g'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT1>
232 % <g-left-single-quotation-mark> <g'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT2>
233 % <G-left-single-quotation-mark> <g'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT2>
234 <g-double-apostrophe> <g'-digraph>;"<BASE><BASE>";"<MIN><MIN>";<VRNT3>
235 <G-double-apostrophe> <g'-digraph>;"<BASE><BASE>";"<CAP><MIN>";<VRNT3>
236 <sh> <sh-digraph>;"<BASE><BASE>";"<MIN><MIN>";IGNORE
237 <sH> <sh-digraph>;"<BASE><BASE>";"<MIN><CAP>";IGNORE
238 <Sh> <sh-digraph>;"<BASE><BASE>";"<CAP><MIN>";IGNORE
239 <SH> <sh-digraph>;"<BASE><BASE>";"<CAP><CAP>";IGNORE
240 <ch> <ch-digraph>;"<BASE><BASE>";"<MIN><MIN>";IGNORE
241 <cH> <ch-digraph>;"<BASE><BASE>";"<MIN><CAP>";IGNORE
242 <Ch> <ch-digraph>;"<BASE><BASE>";"<CAP><MIN>";IGNORE
243 <CH> <ch-digraph>;"<BASE><BASE>";"<CAP><CAP>";IGNORE
250 int_curr_symbol "UZS "
251 currency_symbol "so<U02BB>m"
252 mon_decimal_point "."
253 mon_thousands_sep ","
303 d_t_fmt "%T, %d %B, %Y yil, %A"
308 date_fmt "%d %B, %Y yil, %A"
314 % Note: "No" is "yo‘q" which conflicts with English "yes".
315 % This is why "jo‘q" & "jJ" is also accepted as "no".
316 yesexpr "^[+1hH<U04B2><U04B3>]"
317 noexpr "^[-0nNyYjJ<U0419><U0439>]"
328 tel_int_fmt "+%c %a %l"
338 name_fmt "%d%t%f%t%g%t%m"
342 % FIXME: what is miss ?
344 % FIXME: what is ms ?
349 % format: %C%N%S%N%T%N%s %h%N%f%N%b%N%d%N%e %r%N%a%N%z
350 % but %S seems not recognized yet ? so %C%N%T%N%s %h%N%f%N%b%N%d%N%e %r%N%a%N%z
352 postal_fmt "%C%N%T%N%s %h%N%f%N%b%N%d%N%e %r%N%a%N%z"
353 country_name "O<U02BB>zbekiston"
354 country_post "UZ" % ??
358 % FIXME: ISBN number?
361 lang_name "o<U2018>zbek"