Update copyright year to 2014 by running admin/update-copyright.
[emacs.git] / lisp / language / ind-util.el
blobf5c29a0db1a0f4d9868cfcead020850d06bbdcdc
1 ;;; ind-util.el --- Transliteration and Misc. Tools for Indian Languages -*- coding: utf-8-emacs; -*-
3 ;; Copyright (C) 2001-2014 Free Software Foundation, Inc.
5 ;; Maintainer: KAWABATA, Taichi <kawabata@m17n.org>
6 ;; Keywords: multilingual, Indian, Devanagari
8 ;; This file is part of GNU Emacs.
10 ;; GNU Emacs is free software: you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation, either version 3 of the License, or
13 ;; (at your option) any later version.
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
23 ;;; Commentary:
25 ;; This file provides conversion between UCS and various
26 ;; transliteration schemes, such as ITRANS, kyoto-harvard and aiba
27 ;; methods. It also provides conversion between IS 13194 and UCS.
28 ;; Finally, this program provides the compatibility support with
29 ;; old implementation of Devanagari script.
31 ;;; Code:
33 ;;; Transliteration
35 ;; The followings provide the various transliteration schemes (such as
36 ;; ITRANS, kyoto-harvard, and Aiba) of Indian scripts. They are also
37 ;; used in quail/indian.el for typing Indian script in Emacs.
39 (eval-and-compile
41 (defun indian-regexp-of-hashtbl-keys (hashtbl)
42 "Returns the regular expression of hashtable keys."
43 (let (keys)
44 (maphash (lambda (key val) (push key keys)) hashtbl)
45 (regexp-opt keys)))
47 (defvar indian-dev-base-table
49 (;; VOWELS (18)
50 (?अ nil) (?आ ?ा) (?इ ?ि) (?ई ?ी) (?उ ?ु) (?ऊ ?ू)
51 (?ऋ ?ृ) (?ऌ ?ॢ) (?ऍ ?ॅ) (?ऎ ?ॆ) (?ए ?े) (?ऐ ?ै)
52 (?ऑ ?ॉ) (?ऒ ?ॊ) (?ओ ?ो) (?औ ?ौ) (?ॠ ?ॄ) (?ॡ ?ॣ))
53 (;; CONSONANTS (currently 42, including special cases)
54 ?क ?ख ?ग ?घ ?ङ ;; GUTTRULS
55 ?च ?छ ?ज ?झ ?ञ ;; PALATALS
56 ?ट ?ठ ?ड ?ढ ?ण ;; CEREBRALS
57 ?त ?थ ?द ?ध ?न ?ऩ ;; DENTALS
58 ?प ?फ ?ब ?भ ?म ;; LABIALS
59 ?य ?र ?ऱ ?ल ?ळ ?ऴ ?व ;; SEMIVOWELS
60 ?श ?ष ?स ?ह ;; SIBILANTS
61 ?क़ ?ख़ ?ग़ ?ज़ ?ड़ ?ढ़ ?फ़ ?य़ ;; NUKTAS
62 "ज्ञ" "क्ष")
63 (;; Misc Symbols (7)
64 ?ँ ?ं ?ः ?ऽ ?् ?ॐ ?।)
65 (;; Digits (10)
66 ?० ?१ ?२ ?३ ?४ ?५ ?६ ?७ ?८ ?९)
67 (;; Inscript-extra (4) (#, $, ^, *, ])
68 "्र" "र्" "त्र" "श्र" "़")))
70 ;; Punjabi is also known as Gurmukhi.
71 (defvar indian-pnj-base-table
73 (;; VOWELS
74 (?ਅ nil) (?ਆ ?ਾ) (?ਇ ?ਿ) (?ਈ ?ੀ) (?ਉ ?ੁ) (?ਊ ?ੂ)
75 nil nil nil nil (?ਏ ?ੇ) (?ਐ ?ੈ)
76 nil nil (?ਓ ?ੋ) (?ਔ ?ੌ) nil nil)
77 (;; CONSONANTS
78 ?ਕ ?ਖ ?ਗ ?ਘ ?ਙ ;; GUTTRULS
79 ?ਚ ?ਛ ?ਜ ?ਝ ?ਞ ;; PALATALS
80 ?ਟ ?ਠ ?ਡ ?ਢ ?ਣ ;; CEREBRALS
81 ?ਤ ?ਥ ?ਦ ?ਧ ?ਨ nil ;; DENTALS
82 ?ਪ ?ਫ ?ਬ ?ਭ ?ਮ ;; LABIALS
83 ?ਯ ?ਰ nil ?ਲ ?ਲ਼ nil ?ਵ ;; SEMIVOWELS
84 ?ਸ਼ nil ?ਸ ?ਹ ;; SIBILANTS
85 nil ?ਖ਼ ?ਗ਼ ?ਜ਼ ?ੜ nil ?ਫ਼ nil ;; NUKTAS
86 "ਜ੍ਞ" nil)
87 (;; Misc Symbols (7)
88 nil ?ਂ nil nil ?੍ nil nil) ;; ek onkar, etc.
89 (;; Digits
90 ?੦ ?੧ ?੨ ?੩ ?੪ ?੫ ?੬ ?੭ ?੮ ?੯)
91 (;; Inscript-extra (4) (#, $, ^, *, ])
92 "੍ਰ" "ਰ੍" "ਤ੍ਰ" "ਸ਼੍ਰ" "਼")))
94 (defvar indian-gjr-base-table
96 (;; VOWELS
97 (?અ nil) (?આ ?ા) (?ઇ ?િ) (?ઈ ?ી) (?ઉ ?ુ) (?ઊ ?ૂ)
98 (?ઋ ?ૃ) nil (?ઍ ?ૅ) nil (?એ ?ે) (?ઐ ?ૈ)
99 (?ઑ ?ૉ) nil (?ઓ ?ો) (?ઔ ?ૌ) (?ૠ ?ૄ) nil)
100 (;; CONSONANTS
101 ?ક ?ખ ?ગ ?ઘ ?ઙ ;; GUTTRULS
102 ?ચ ?છ ?જ ?ઝ ?ઞ ;; PALATALS
103 ?ટ ?ઠ ?ડ ?ઢ ?ણ ;; CEREBRALS
104 ?ત ?થ ?દ ?ધ ?ન nil ;; DENTALS
105 ?પ ?ફ ?બ ?ભ ?મ ;; LABIALS
106 ?ય ?ર nil ?લ ?ળ nil ?વ ;; SEMIVOWELS
107 ?શ ?ષ ?સ ?હ ;; SIBILANTS
108 nil nil nil nil nil nil nil nil ;; NUKTAS
109 "જ્ઞ" "ક્ષ")
110 (;; Misc Symbols (7)
111 ?ઁ ?ં ?ઃ ?ઽ ?્ ?ૐ nil)
112 (;; Digits
113 ?૦ ?૧ ?૨ ?૩ ?૪ ?૫ ?૬ ?૭ ?૮ ?૯)
114 (;; Inscript-extra (4) (#, $, ^, *, ])
115 "્ર" "ર્" "ત્ર" "શ્ર" "઼")))
117 (defvar indian-ori-base-table
119 (;; VOWELS
120 (?ଅ nil) (?ଆ ?ା) (?ଇ ?ି) (?ଈ ?ୀ) (?ଉ ?ୁ) (?ଊ ?ୂ)
121 (?ଋ ?ୃ) (?ଌ nil) nil nil (?ଏ ?େ) (?ଐ ?ୈ)
122 nil nil (?ଓ ?ୋ) (?ଔ ?ୌ) (?ୠ nil) (?ୡ nil))
123 (;; CONSONANTS
124 ?କ ?ଖ ?ଗ ?ଘ ?ଙ ;; GUTTRULS
125 ?ଚ ?ଛ ?ଜ ?ଝ ?ଞ ;; PALATALS
126 ?ଟ ?ଠ ?ଡ ?ଢ ?ଣ ;; CEREBRALS
127 ?ତ ?ଥ ?ଦ ?ଧ ?ନ nil ;; DENTALS
128 ?ପ ?ଫ ?ବ ?ଭ ?ମ ;; LABIALS
129 ?ଯ ?ର nil ?ଲ ?ଳ nil nil ;; SEMIVOWELS
130 ?ଶ ?ଷ ?ସ ?ହ ;; SIBILANTS
131 nil nil nil nil ?ଡ଼ ?ଢ଼ nil ?ୟ ;; NUKTAS
132 "ଜ୍ଞ" "କ୍ଷ")
133 (;; Misc Symbols
134 ?ଁ ?ଂ ?ଃ ?ଽ ?୍ nil nil)
135 (;; Digits
136 ?୦ ?୧ ?୨ ?୩ ?୪ ?୫ ?୬ ?୭ ?୮ ?୯)
137 (;; Inscript-extra (4) (#, $, ^, *, ])
138 "୍ର" "ର୍" "ତ୍ର" "ଶ୍ର" "଼")))
140 (defvar indian-bng-base-table
142 (;; VOWELS
143 (?অ nil) (?আ ?া) (?ই ?ি) (?ঈ ?ী) (?উ ?ু) (?ঊ ?ূ)
144 (?ঋ ?ৃ) (?ঌ ?ৢ) nil nil (?এ ?ে) (?ঐ ?ৈ)
145 nil nil (?ও ?ো) (?ঔ ?ৌ) (?ৠ ?ৄ) (?ৡ ?ৣ))
146 (;; CONSONANTS
147 ?ক ?খ ?গ ?ঘ ?ঙ ;; GUTTRULS
148 ?চ ?ছ ?জ ?ঝ ?ঞ ;; PALATALS
149 ?ট ?ঠ ?ড ?ঢ ?ণ ;; CEREBRALS
150 ?ত ?থ ?দ ?ধ ?ন nil ;; DENTALS
151 ?প ?ফ ?ব ?ভ ?ম ;; LABIALS
152 ?য ?র nil ?ল nil nil nil ;; SEMIVOWELS
153 ?শ ?ষ ?স ?হ ;; SIBILANTS
154 nil nil nil nil ?ড় ?ঢ় nil ?য় ;; NUKTAS
155 "জ্ঞ" "ক্ষ")
156 (;; Misc Symbols
157 ?ঁ ?ং ?ঃ nil ?্ nil nil)
158 (;; Digits
159 ?০ ?১ ?২ ?৩ ?৪ ?৫ ?৬ ?৭ ?৮ ?৯)
160 (;; Inscript-extra (4) (#, $, ^, *, ])
161 "্র" "র্" "ত্র" "শ্র" "়")))
163 (defvar indian-asm-base-table
165 (;; VOWELS
166 (?অ nil) (?আ ?া) (?ই ?ি) (?ঈ ?ী) (?উ ?ু) (?ঊ ?ূ)
167 (?ঋ ?ৃ) (?ঌ ?ৢ) nil nil (?এ ?ে) (?ঐ ?ৈ)
168 nil nil (?ও ?ো) (?ঔ ?ৌ) (?ৠ ?ৄ) (?ৡ ?ৣ))
169 (;; CONSONANTS
170 ?ক ?খ ?গ ?ঘ ?ঙ ;; GUTTRULS
171 ?চ ?ছ ?জ ?ঝ ?ঞ ;; PALATALS
172 ?ট ?ঠ ?ড ?ঢ ?ণ ;; CEREBRALS
173 ?ত ?থ ?দ ?ধ ?ন nil ;; DENTALS
174 ?প ?ফ ?ব ?ভ ?ম ;; LABIALS
175 ?য ?ৰ nil ?ল nil nil ?ৱ ;; SEMIVOWELS
176 ?শ ?ষ ?স ?হ ;; SIBILANTS
177 nil nil nil nil ?ড় ?ঢ় nil ?য় ;; NUKTAS
178 "জ্ঞ" "ক্ষ")
179 (;; Misc Symbols
180 ?ঁ ?ং ?ঃ nil ?্ nil nil)
181 (;; Digits
182 ?০ ?১ ?২ ?৩ ?৪ ?৫ ?৬ ?৭ ?৮ ?৯)
183 (;; Inscript-extra (4) (#, $, ^, *, ])
184 "্ৰ" "ৰ্" "ত্ৰ" "শ্ৰ" "়")))
186 (defvar indian-tlg-base-table
188 (;; VOWELS
189 (?అ nil) (?ఆ ?ా) (?ఇ ?ి) (?ఈ ?ీ) (?ఉ ?ు) (?ఊ ?ూ)
190 (?ఋ ?ృ) (?ఌ nil) nil (?ఏ ?ే) (?ఎ ?ె) (?ఐ ?ై)
191 nil (?ఓ ?ో) (?ఒ ?ొ) (?ఔ ?ౌ) (?ౠ ?ౄ) (?ౡ nil))
192 (;; CONSONANTS
193 ?క ?ఖ ?గ ?ఘ ?ఙ ;; GUTTRULS
194 ?చ ?ఛ ?జ ?ఝ ?ఞ ;; PALATALS
195 ?ట ?ఠ ?డ ?ఢ ?ణ ;; CEREBRALS
196 ?త ?థ ?ద ?ధ ?న nil ;; DENTALS
197 ?ప ?ఫ ?బ ?భ ?మ ;; LABIALS
198 ?య ?ర ?ఱ ?ల ?ళ nil ?వ ;; SEMIVOWELS
199 ?శ ?ష ?స ?హ ;; SIBILANTS
200 nil nil nil nil nil nil nil nil ;; NUKTAS
201 "జ్ఞ" "క్ష")
202 (;; Misc Symbols
203 ?ఁ ?ం ?ః nil ?్ nil nil)
204 (;; Digits
205 ?౦ ?౧ ?౨ ?౩ ?౪ ?౫ ?౬ ?౭ ?౮ ?౯)
206 (;; Inscript-extra (4) (#, $, ^, *, ])
207 "్ర" "ర్" "త్ర" "శ్ర" nil)))
209 (defvar indian-knd-base-table
211 (;; VOWELS
212 (?ಅ nil) (?ಆ ?ಾ) (?ಇ ?ಿ) (?ಈ ?ೀ) (?ಉ ?ು) (?ಊ ?ೂ)
213 (?ಋ ?ೃ) (?ಌ nil) nil (?ಏ ?ೇ) (?ಎ ?ೆ) (?ಐ ?ೈ)
214 nil (?ಓ ?ೋ) (?ಒ ?ೊ) (?ಔ ?ೌ) (?ೠ ?ೄ) (?ೡ nil))
215 (;; CONSONANTS
216 ?ಕ ?ಖ ?ಗ ?ಘ ?ಙ ;; GUTTRULS
217 ?ಚ ?ಛ ?ಜ ?ಝ ?ಞ ;; PALATALS
218 ?ಟ ?ಠ ?ಡ ?ಢ ?ಣ ;; CEREBRALS
219 ?ತ ?ಥ ?ದ ?ಧ ?ನ nil ;; DENTALS
220 ?ಪ ?ಫ ?ಬ ?ಭ ?ಮ ;; LABIALS
221 ?ಯ ?ರ ?ಱ ?ಲ ?ಳ nil ?ವ ;; SEMIVOWELS
222 ?ಶ ?ಷ ?ಸ ?ಹ ;; SIBILANTS
223 nil nil nil nil nil nil ?ೞ nil ;; NUKTAS
224 "ಜ್ಞ" "ಕ್ಷ")
225 (;; Misc Symbols
226 nil ?ಂ ?ಃ nil ?್ nil nil)
227 (;; Digits
228 ?೦ ?೧ ?೨ ?೩ ?೪ ?೫ ?೬ ?೭ ?೮ ?೯)
229 (;; Inscript-extra (4) (#, $, ^, *, ])
230 "್ರ" "ರ್" "ತ್ರ" "ಶ್ರ" nil)))
232 (defvar indian-mlm-base-table
234 (;; VOWELS
235 (?അ nil) (?ആ ?ാ) (?ഇ ?ി) (?ഈ ?ീ) (?ഉ ?ു) (?ഊ ?ൂ)
236 (?ഋ ?ൃ) (?ഌ nil) nil (?ഏ ?േ) (?എ ?െ) (?ഐ ?ൈ)
237 nil (?ഓ ?ോ) (?ഒ ?ൊ) (?ഔ ?ൌ) nil nil)
238 (;; CONSONANTS
239 ?ക ?ഖ ?ഗ ?ഘ ?ങ ;; GUTTRULS
240 ?ച ?ഛ ?ജ ?ഝ ?ഞ ;; PALATALS
241 ?ട ?ഠ ?ഡ ?ഢ ?ണ ;; CEREBRALS
242 ?ത ?ഥ ?ദ ?ധ ?ന nil ;; DENTALS
243 ?പ ?ഫ ?ബ ?ഭ ?മ ;; LABIALS
244 ?യ ?ര ?റ ?ല ?ള ?ഴ ?വ ;; SEMIVOWELS
245 ?ശ ?ഷ ?സ ?ഹ ;; SIBILANTS
246 nil nil nil nil nil nil nil nil ;; NUKTAS
247 "ജ്ഞ" "ക്ഷ")
248 (;; Misc Symbols
249 nil ?ം ?ഃ nil ?് nil nil)
250 (;; Digits
251 ?൦ ?൧ ?൨ ?൩ ?൪ ?൫ ?൬ ?൭ ?൮ ?൯)
252 (;; Inscript-extra (4) (#, $, ^, *, ])
253 "്ര" "ര്" "ത്ര" "ശ്ര" nil)))
255 (defvar indian-tml-base-table
257 (;; VOWELS
258 (?அ nil) (?ஆ ?ா) (?இ ?ி) (?ஈ ?ீ) (?உ ?ு) (?ஊ ?ூ)
259 nil nil nil (?ஏ ?ே) (?எ ?ெ) (?ஐ ?ை)
260 nil (?ஓ ?ோ) (?ஒ ?ொ) (?ஔ ?ௌ) nil nil)
261 (;; CONSONANTS
262 ?க nil nil nil ?ங ;; GUTTRULS
263 ?ச nil ?ஜ nil ?ஞ ;; PALATALS
264 ?ட nil nil nil ?ண ;; CEREBRALS
265 ?த nil nil nil ?ந ?ன ;; DENTALS
266 ?ப nil nil nil ?ம ;; LABIALS
267 ?ய ?ர ?ற ?ல ?ள ?ழ ?வ ;; SEMIVOWELS
268 nil ?ஷ ?ஸ ?ஹ ;; SIBILANTS
269 nil nil nil nil nil nil nil nil ;; NUKTAS
270 "ஜ்ஞ" "க்ஷ")
271 (;; Misc Symbols
272 nil ?ஂ ?ஃ nil ?் nil nil)
273 (;; Digits
274 ?௦ ?௧ ?௨ ?௩ ?௪ ?௫ ?௬ ?௭ ?௮ ?௯)
275 (;; Inscript-extra (4) (#, $, ^, *, ])
276 "்ர" "ர்" "த்ர" nil nil)))
278 (defvar indian-base-table-to-language-alist
279 '((indian-dev-base-table . "Devanagari")
280 (indian-pnj-base-table . "Punjabi")
281 (indian-ori-base-table . "Oriya")
282 (indian-bng-base-table . "Bengali")
283 (indian-asm-base-table . "Assamese")
284 (indian-tlg-base-table . "Telugu")
285 (indian-knd-base-table . "Kannada")
286 (indian-mlm-base-table . "Malayalam")
287 (indian-tml-base-table . "Tamil")))
289 (defvar indian-itrans-v5-table
290 '(;; for encode/decode
291 (;; vowels -- 18
292 "a" ("aa" "A") "i" ("ii" "I") "u" ("uu" "U")
293 ("RRi" "R^i") ("LLi" "L^i") (".c" "e.c") "E" "e" "ai"
294 "o.c" "O" "o" "au" ("RRI" "R^I") ("LLI" "L^I"))
295 (;; consonants -- 40
296 "k" "kh" "g" "gh" ("~N" "N^")
297 "ch" ("Ch" "chh") "j" "jh" ("~n" "JN")
298 "T" "Th" "D" "Dh" "N"
299 "t" "th" "d" "dh" "n" "nh"
300 "p" "ph" "b" "bh" "m"
301 "y" "r" "rh" "l" ("L" "ld") nil ("v" "w")
302 "sh" ("Sh" "shh") "s" "h"
303 "q" "K" "G" ("J" "z") ".D" ".Dh" "f" ("Y" "yh")
304 ("GY" "dny") "x")
305 (;; misc -- 7
306 ".N" (".n" "M") "H" ".a" ".h" ("AUM" "OM") "..")))
308 (defvar indian-itrans-v5-table-for-tamil
309 '(;; for encode/decode
310 (;; vowels -- 18
311 "a" ("aa" "A") "i" ("ii" "I") "u" ("uu" "U")
312 ("RRi" "R^i") ("LLi" "L^i") (".c" "e.c") "E" "e" "ai"
313 "o.c" "O" "o" "au" ("RRI" "R^I") ("LLI" "L^I"))
314 (;; consonants -- 40
315 "k" "kh" "g" "gh" ("~N" "N^")
316 "ch" ("Ch" "chh") "j" "jh" ("~n" "JN")
317 "T" "Th" "D" "Dh" "N"
318 "t" "th" "d" "dh" "n" "nh"
319 "p" "ph" "b" "bh" "m"
320 "y" "r" "rh" "l" ("L" "ld") ("J" "z") ("v" "w")
321 "sh" ("Sh" "shh") "s" "h"
322 "q" "K" "G" nil ".D" ".Dh" "f" ("Y" "yh")
323 ("GY" "dny") "x")
324 (;; misc -- 7
325 ".N" (".n" "M") "H" ".a" ".h" ("AUM" "OM") "..")))
327 (defvar indian-kyoto-harvard-table
328 '(;; for encode/decode
329 (;; vowel
330 "a" ("A" "aa") "i" ("I" "ii") "u" ("U" "uu")
331 "R" ("L" "lR") nil nil "e" "ai"
332 nil nil "o" "au" ("q" "RR" "Q") ("E" "LL" "lRR"))
333 (;; consonant
334 "k" "kh" "g" "gh" "G"
335 "c" "ch" "j" "jh" "J"
336 "T" "Th" "D" "Dh" "N"
337 "t" "th" "d" "dh" "n" nil
338 "p" "ph" "b" "bh" "m"
339 "y" "r" nil "l" "L" nil "v"
340 ("z" "Z") "S" "s" "h"
341 nil nil nil nil nil nil nil nil
342 nil nil)
343 (;; misc
344 nil "M" "H" "'" nil "." nil)))
346 (defvar indian-harvard-table
347 '(;; for encode/decode
348 (;; vowel
349 "a" ("A" "aa") "i" ("I" "ii") "u" ("U" "uu")
350 "R" ("L" "lR") nil nil "e" "ai"
351 nil nil "o" "au" ("RR" "q" "Q") ("LL" "E" "lRR"))
352 (;; consonant
353 "k" "kh" "g" "gh" "G"
354 "c" "ch" "j" "jh" "J"
355 "T" "Th" "D" "Dh" "N"
356 "t" "th" "d" "dh" "n" nil
357 "p" "ph" "b" "bh" "m"
358 "y" "r" nil "l" "L" nil "v"
359 ("z" "Z") "S" "s" "h"
360 nil nil nil nil nil nil nil nil
361 nil nil)
362 (;; misc
363 nil "M" "H" "'" nil "." nil)))
365 (defvar indian-tokyo-table
366 '(;; for encode/decode
367 (;; vowel
368 "a" ("A" "aa") "i" ("I" "ii") "u" ("U" "uu")
369 "R" ("L" "lR") nil nil "e" "ai"
370 nil nil "o" "au" ("Q" "RR" "q") ("E" "LL" "lRR"))
371 (;; consonant
372 "k" "kh" "g" "gh" "G"
373 "c" "ch" "j" "jh" "J"
374 "T" "Th" "D" "Dh" "N"
375 "t" "th" "d" "dh" "n" nil
376 "p" "ph" "b" "bh" "m"
377 "y" "r" nil "l" "L" nil "v"
378 ("Z" "z") "S" "s" "h"
379 nil nil nil nil nil nil nil nil
380 nil nil)
381 (;; misc
382 nil "M" "H" "'" nil "." nil)))
384 (defvar indian-aiba-table
385 '(;; for encode/decode
386 (;; vowel
387 "a" "aa" "i" "ii" "u" "uu"
388 ".r" ".l" nil nil "e" "ai"
389 nil nil "o" "au" "~r" "~l")
390 (;; consonant
391 "k" "kh" "g" "gh" "^n"
392 "c" "ch" "j" "jh" "~n"
393 ".t" ".th" ".d" ".dh" ".n"
394 "t" "th" "d" "dh" "n" nil
395 "p" "ph" "b" "bh" "m"
396 "y" "r" nil "l" nil nil "v"
397 "^s" ".s" "s" "h"
398 nil nil nil nil nil nil nil nil
399 nil nil)
400 (;; misc
401 nil ".m" ".h" "'" nil "." nil)))
403 (defun combinatorial (head &rest tail)
404 (if tail
405 (apply 'append
406 (mapcar (lambda (y) (mapcar (lambda (x) (cons x y)) head))
407 (apply 'combinatorial tail)))
408 (mapcar 'list head)))
410 (defun indian--puthash-char (char trans-char hashtbls)
411 (let ((encode-hash (car hashtbls)) ;; char -> trans
412 (decode-hash (cdr hashtbls)) ;; trans -> char
414 ;; char -- nil / char / string (/ list of vowel & matra)
415 ;; trans-char -- nil / string / list of strings
416 (when (and char trans-char)
417 (if (stringp trans-char) (setq trans-char (list trans-char)))
418 (if (characterp char) (setq char (char-to-string char)))
419 (puthash char (car trans-char) encode-hash)
420 (dolist (trans trans-char)
421 (puthash trans char decode-hash)))))
423 (defun indian--map (f l1 l2)
424 (while l1
425 (funcall f (pop l1) (pop l2))))
427 (defun indian--puthash-v (v trans-v hashtbls)
428 (indian--map
429 (lambda (v trans-v)
430 (indian--puthash-char (car v) trans-v hashtbls))
431 v trans-v))
433 (defun indian--puthash-c (c trans-c halant hashtbls)
434 (indian--map
435 (lambda (c trans-c)
436 (if (characterp c) (setq c (char-to-string c)))
437 (indian--puthash-char (concat c halant) trans-c hashtbls))
438 c trans-c))
440 (defun indian--puthash-m (m trans-m hashtbls)
441 (indian--map
442 (lambda (m trans-m)
443 (indian--puthash-char m trans-m hashtbls))
444 m trans-m))
446 (defun indian--puthash-cv (c trans-c v trans-v hashtbls)
447 (indian--map
448 (lambda (c trans-c)
449 (indian--map
450 (lambda (v trans-v)
451 (when (and c trans-c v trans-v)
452 (if (characterp c) (setq c (char-to-string c)))
453 (setq v (if (characterp (cadr v)) (char-to-string (cadr v)) ""))
454 (if (stringp trans-c) (setq trans-c (list trans-c)))
455 (if (stringp trans-v) (setq trans-v (list trans-v)))
456 (indian--puthash-char
457 (concat c v)
458 (mapcar (lambda (x) (apply 'concat x))
459 (combinatorial trans-c trans-v))
460 hashtbls)))
461 v trans-v))
462 c trans-c))
464 (defun indian-make-hash (table trans-table)
465 "Indian Transliteration Hash for decode/encode"
466 (let* ((encode-hash (make-hash-table :test 'equal))
467 (decode-hash (make-hash-table :test 'equal))
468 (hashtbls (cons encode-hash decode-hash))
469 (vowels (elt table 0))
470 (consonants (elt table 1))
471 (misc (elt table 2))
472 (digits (elt table 3))
473 (halant (char-to-string (elt misc 4)))
474 (trans-vowels (elt trans-table 0))
475 (trans-consonants (elt trans-table 1))
476 (trans-misc (elt trans-table 2))
477 (trans-digits '("0" "1" "2" "3" "4" "5" "6" "7" "8" "9")))
478 (indian--puthash-v vowels trans-vowels hashtbls)
479 (indian--puthash-c consonants trans-consonants halant hashtbls)
480 (indian--puthash-cv consonants trans-consonants
481 vowels trans-vowels hashtbls)
482 (indian--puthash-m misc trans-misc hashtbls)
483 (indian--puthash-m digits trans-digits hashtbls)
484 hashtbls))
486 (defvar indian-dev-itrans-v5-hash
487 (indian-make-hash indian-dev-base-table
488 indian-itrans-v5-table))
489 (defvar indian-dev-kyoto-harvard-hash
490 (indian-make-hash indian-dev-base-table
491 indian-kyoto-harvard-table))
492 (defvar indian-dev-aiba-hash
493 (indian-make-hash indian-dev-base-table
494 indian-aiba-table))
496 (defvar indian-pnj-itrans-v5-hash
497 (indian-make-hash indian-pnj-base-table
498 indian-itrans-v5-table))
500 (defvar indian-gjr-itrans-v5-hash
501 (indian-make-hash indian-gjr-base-table
502 indian-itrans-v5-table))
504 (defvar indian-ori-itrans-v5-hash
505 (indian-make-hash indian-ori-base-table
506 indian-itrans-v5-table))
508 (defvar indian-bng-itrans-v5-hash
509 (indian-make-hash indian-bng-base-table
510 indian-itrans-v5-table))
512 (defvar indian-asm-itrans-v5-hash
513 (indian-make-hash indian-asm-base-table
514 indian-itrans-v5-table))
516 (defvar indian-tlg-itrans-v5-hash
517 (indian-make-hash indian-tlg-base-table
518 indian-itrans-v5-table))
520 (defvar indian-knd-itrans-v5-hash
521 (indian-make-hash indian-knd-base-table
522 indian-itrans-v5-table))
524 (defvar indian-mlm-itrans-v5-hash
525 (indian-make-hash indian-mlm-base-table
526 indian-itrans-v5-table))
528 (defvar indian-tml-itrans-v5-hash
529 (indian-make-hash indian-tml-base-table
530 indian-itrans-v5-table-for-tamil))
533 (defmacro indian-translate-region (from to hashtable encode-p)
534 `(save-excursion
535 (save-restriction
536 (let ((regexp ,(indian-regexp-of-hashtbl-keys
537 (if encode-p (car (eval hashtable))
538 (cdr (eval hashtable))))))
539 (narrow-to-region from to)
540 (goto-char (point-min))
541 (while (re-search-forward regexp nil t)
542 (let ((matchstr (gethash (match-string 0)
543 (if ,encode-p
544 (car ,hashtable)
545 (cdr ,hashtable)))))
546 (if matchstr (replace-match matchstr))))))))
550 (defun indian-dev-itrans-v5-encode-region (from to)
551 (interactive "r")
552 (indian-translate-region
553 from to indian-dev-itrans-v5-hash t))
555 (defun indian-dev-itrans-v5-decode-region (from to)
556 (interactive "r")
557 (indian-translate-region
558 from to indian-dev-itrans-v5-hash nil))
560 (defun indian-dev-kyoto-harvard-encode-region (from to)
561 (interactive "r")
562 (indian-translate-region
563 from to indian-dev-kyoto-harvard-hash t))
565 (defun indian-dev-kyoto-harvard-decode-region (from to)
566 (interactive "r")
567 (indian-translate-region
568 from to indian-dev-kyoto-harvard-hash nil))
570 (defun indian-dev-aiba-encode-region (from to)
571 (interactive "r")
572 (indian-translate-region
573 from to indian-dev-aiba-hash t))
575 (defun indian-dev-aiba-decode-region (from to)
576 (interactive "r")
577 (indian-translate-region
578 from to indian-dev-aiba-hash nil))
583 ;;; IS 13194 utilities
585 ;; The followings provide conversion between IS 13194 (ISCII) and UCS.
587 (let
588 ;;Unicode vs IS13194 ;; only Devanagari is supported now.
589 ((ucs-devanagari-to-is13194-alist
590 '((?\x0900 . "[U+0900]")
591 (?\x0901 . "")
592 (?\x0902 . "")
593 (?\x0903 . "")
594 (?\x0904 . "[U+0904]")
595 (?\x0905 . "")
596 (?\x0906 . "")
597 (?\x0907 . "")
598 (?\x0908 . "")
599 (?\x0909 . "")
600 (?\x090a . "")
601 (?\x090b . "")
602 (?\x090c . "")
603 (?\x090d . "")
604 (?\x090e . "")
605 (?\x090f . "")
606 (?\x0910 . "")
607 (?\x0911 . "")
608 (?\x0912 . "")
609 (?\x0913 . "")
610 (?\x0914 . "")
611 (?\x0915 . "")
612 (?\x0916 . "")
613 (?\x0917 . "")
614 (?\x0918 . "")
615 (?\x0919 . "")
616 (?\x091a . "")
617 (?\x091b . "")
618 (?\x091c . "")
619 (?\x091d . "")
620 (?\x091e . "")
621 (?\x091f . "")
622 (?\x0920 . "")
623 (?\x0921 . "")
624 (?\x0922 . "")
625 (?\x0923 . "")
626 (?\x0924 . "")
627 (?\x0925 . "")
628 (?\x0926 . "")
629 (?\x0927 . "")
630 (?\x0928 . "")
631 (?\x0929 . "")
632 (?\x092a . "")
633 (?\x092b . "")
634 (?\x092c . "")
635 (?\x092d . "")
636 (?\x092e . "")
637 (?\x092f . "")
638 (?\x0930 . "")
639 (?\x0931 . "")
640 (?\x0932 . "")
641 (?\x0933 . "")
642 (?\x0934 . "")
643 (?\x0935 . "")
644 (?\x0936 . "")
645 (?\x0937 . "")
646 (?\x0938 . "")
647 (?\x0939 . "")
648 (?\x093a . "[U+093a]")
649 (?\x093b . "[U+093b]")
650 (?\x093c . "")
651 (?\x093d . "")
652 (?\x093e . "")
653 (?\x093f . "")
654 (?\x0940 . "")
655 (?\x0941 . "")
656 (?\x0942 . "")
657 (?\x0943 . "")
658 (?\x0944 . "")
659 (?\x0945 . "")
660 (?\x0946 . "")
661 (?\x0947 . "")
662 (?\x0948 . "")
663 (?\x0949 . "")
664 (?\x094a . "")
665 (?\x094b . "")
666 (?\x094c . "")
667 (?\x094d . "")
668 (?\x094e . "[U+094e]")
669 (?\x094f . "[U+094f]")
670 (?\x0950 . "")
671 (?\x0951 . "")
672 (?\x0952 . "")
673 (?\x0953 . "[DEVANAGARI GRAVE ACCENT]")
674 (?\x0954 . "[DEVANAGARI ACUTE ACCENT]")
675 (?\x0955 . "[U+0955]")
676 (?\x0956 . "[U+0956]")
677 (?\x0957 . "[U+0957]")
678 (?\x0958 . "")
679 (?\x0959 . "")
680 (?\x095a . "")
681 (?\x095b . "")
682 (?\x095c . "")
683 (?\x095d . "")
684 (?\x095e . "")
685 (?\x095f . "")
686 (?\x0960 . "")
687 (?\x0961 . "")
688 (?\x0962 . "")
689 (?\x0963 . "")
690 (?\x0964 . "")
691 (?\x0965 . "")
692 (?\x0966 . "")
693 (?\x0967 . "")
694 (?\x0968 . "")
695 (?\x0969 . "")
696 (?\x096a . "")
697 (?\x096b . "")
698 (?\x096c . "")
699 (?\x096d . "")
700 (?\x096e . "")
701 (?\x096f . "")
702 (?\x0970 . "[U+0970]")
703 (?\x0971 . "[U+0971]")
704 (?\x0972 . "[U+0972]")
705 (?\x0973 . "[U+0973]")
706 (?\x0974 . "[U+0974]")
707 (?\x0975 . "[U+0975]")
708 (?\x0976 . "[U+0976]")
709 (?\x0977 . "[U+0977]")
710 (?\x0978 . "[U+0978]")
711 (?\x0979 . "[U+0979]")
712 (?\x097a . "[U+097a]")
713 (?\x097b . "[U+097b]")
714 (?\x097c . "[U+097c]")
715 (?\x097d . "[U+097d]")
716 (?\x097e . "[U+097e]")
717 (?\x097f . "[U+097f]")))
718 (ucs-bengali-to-is13194-alist nil)
719 (ucs-assamese-to-is13194-alist nil)
720 (ucs-gurmukhi-to-is13194-alist nil)
721 (ucs-gujarati-to-is13194-alist nil)
722 (ucs-oriya-to-is13194-alist nil)
723 (ucs-tamil-to-is13194-alist nil)
724 (ucs-telugu-to-is13194-alist nil)
725 (ucs-malayalam-to-is13194-alist nil)
726 (ucs-kannada-to-is13194-alist nil))
727 (dolist (script '(devanagari bengali assamese gurmukhi gujarati
728 oriya tamil telugu malayalam kannada))
729 (let ((hashtable (intern (concat "is13194-to-ucs-"
730 (symbol-name script) "-hashtbl" )))
731 (regexp (intern (concat "is13194-to-ucs-"
732 (symbol-name script) "-regexp"))))
733 (set hashtable (make-hash-table :test 'equal :size 128))
734 (dolist (x (eval (intern (concat "ucs-" (symbol-name script)
735 "-to-is13194-alist"))))
736 (put-char-code-property (car x) 'script script)
737 (put-char-code-property (car x) 'iscii (cdr x))
738 (puthash (cdr x) (char-to-string (car x)) (eval hashtable)))
739 (set regexp (indian-regexp-of-hashtbl-keys (eval hashtable))))))
741 (defvar is13194-default-repertory 'devanagari)
743 (defvar is13194-repertory-to-ucs-script
744 `((DEF ?\x40 ,is13194-default-repertory)
745 (RMN ?\x41 ,is13194-default-repertory)
746 (DEV ?\x42 devanagari)
747 (BNG ?\x43 bengali)
748 (TML ?\x44 tamil)
749 (TLG ?\x45 telugu)
750 (ASM ?\x46 bengali)
751 (ORI ?\x47 oriya)
752 (KND ?\x48 kannada)
753 (MLM ?\x49 malayalam)
754 (GJR ?\x4a gujarati)
755 (PNJ ?\x4b gurmukhi)))
757 ;; for guiding find-variable function.
758 (defvar is13194-to-ucs-devanagari-hashtbl nil)
759 (defvar is13194-to-ucs-devanagari-regexp nil)
760 (defvar is13194-to-ucs-bengali-hashtbl nil)
761 (defvar is13194-to-ucs-bengali-regexp nil)
762 (defvar is13194-to-ucs-assamese-hashtbl nil)
763 (defvar is13194-to-ucs-assamese-regexp nil)
764 (defvar is13194-to-ucs-gurmukhi-hashtbl nil)
765 (defvar is13194-to-ucs-gurmukhi-regexp nil)
766 (defvar is13194-to-ucs-gujarati-hashtbl nil)
767 (defvar is13194-to-ucs-gujarati-regexp nil)
768 (defvar is13194-to-ucs-oriya-hashtbl nil)
769 (defvar is13194-to-ucs-oriya-regexp nil)
770 (defvar is13194-to-ucs-tamil-hashtbl nil)
771 (defvar is13194-to-ucs-tamil-regexp nil)
772 (defvar is13194-to-ucs-telugu-hashtbl nil)
773 (defvar is13194-to-ucs-telugu-regexp nil)
774 (defvar is13194-to-ucs-malayalam-hashtbl nil)
775 (defvar is13194-to-ucs-malayalam-regexp nil)
776 (defvar is13194-to-ucs-kannada-hashtbl nil)
777 (defvar is13194-to-ucs-kannada-regexp nil)
779 (defvar ucs-to-is13194-regexp
780 ;; only Devanagari is supported now.
781 (concat "[" (char-to-string #x0900)
782 "-" (char-to-string #x097f) "]")
783 "Regexp that matches to conversion")
785 (defun ucs-to-iscii-region (from to)
786 "Converts the indian UCS characters in the region to ISCII.
787 Returns new end position."
788 (interactive "r")
789 ;; only Devanagari is supported now.
790 (save-excursion
791 (save-restriction
792 (narrow-to-region from to)
793 (goto-char (point-min))
794 (let* ((current-repertory is13194-default-repertory))
795 (while (re-search-forward ucs-to-is13194-regexp nil t)
796 (replace-match
797 (get-char-code-property (string-to-char (match-string 0))
798 'iscii))))
799 (point-max))))
801 (defun iscii-to-ucs-region (from to)
802 "Converts the ISCII characters in the region to UCS.
803 Returns new end position."
804 (interactive "r")
805 ;; only Devanagari is supported now.
806 (save-excursion
807 (save-restriction
808 (narrow-to-region from to)
809 (goto-char (point-min))
810 (let* ((current-repertory is13194-default-repertory)
811 (current-hashtable
812 (intern (concat "is13194-to-ucs-"
813 (symbol-name current-repertory) "-hashtbl")))
814 (current-regexp
815 (intern (concat "is13194-to-ucs-"
816 (symbol-name current-repertory) "-regexp")))
817 (re (eval current-regexp))
818 (hash (eval current-hashtable)))
819 (while (re-search-forward re nil t)
820 (replace-match (gethash (match-string 0) hash ""))))
821 (point-max))))
823 ;;;###autoload
824 (defun indian-compose-region (from to)
825 "Compose the region according to `composition-function-table'."
826 (interactive "r")
827 (save-excursion
828 (save-restriction
829 (let ((pos from) newpos func (max to))
830 (narrow-to-region from to)
831 (while (< pos max)
832 (setq func (aref composition-function-table (char-after pos)))
833 (if (fboundp func)
834 (setq newpos (funcall func pos nil)
835 pos (if (and (integerp newpos) (> newpos pos))
836 newpos (1+ pos)))
837 (setq pos (1+ pos))))))))
839 ;;;###autoload
840 (defun indian-compose-string (string)
841 (with-temp-buffer
842 (insert string)
843 (indian-compose-region (point-min) (point-max))
844 (buffer-string)))
846 ;;;###autoload
847 (defun in-is13194-post-read-conversion (len)
848 (let ((pos (point)) endpos)
849 (setq endpos (iscii-to-ucs-region pos (+ pos len)))
850 (- endpos pos)))
852 ;;;###autoload
853 (defun in-is13194-pre-write-conversion (from to)
854 (let ((buf (current-buffer)))
855 (set-buffer (generate-new-buffer " *temp*"))
856 (if (stringp from)
857 (insert from)
858 (insert-buffer-substring buf from to))
859 (ucs-to-iscii-region (point-min) (point-max))
860 nil))
865 ;;; Backward Compatibility support programs
867 ;; The following provides the conversion from old-implementation of
868 ;; Emacs Devanagari script to UCS.
870 (defconst indian-2-colum-to-ucs
872 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
873 ;;2120
874 ("" . "ँ")
875 ("" . "ं")
876 ("" . "ः")
877 ("" . "अ")
878 ("" . "आ")
879 ("" . "इ")
880 ("" . "ई")
881 ("" . "उ")
882 ("" . "ऊ")
883 ("" . "ऋ")
884 ("" . "रृ")
885 ("" . "ऎ")
886 ("" . "ए")
887 ("" . "ऐ")
888 ("" . "ऍ")
889 ("" . "ऒ")
890 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
891 ;;2130
892 ("" . "ओ")
893 ("" . "औ")
894 ("" . "ऑ")
895 ("" . "क")
896 ("" . "ख")
897 ("" . "ग")
898 ("" . "घ")
899 ("" . "ङ")
900 ("" . "च")
901 ("" . "छ")
902 ("" . "ज")
903 ("" . "झ")
904 ("" . "ञ")
905 ("" . "ट")
906 ("" . "ठ")
907 ("" . "ड")
908 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
909 ;;2140
910 ("" . "ढ")
911 ("" . "ण")
912 ("" . "त")
913 ("" . "थ")
914 ("" . "द")
915 ("" . "ध")
916 ("" . "न")
917 ("" . "ऩ")
918 ("" . "प")
919 ("" . "फ")
920 ("" . "ब")
921 ("" . "भ")
922 ("" . "म")
923 ("" . "य")
924 ("" . "य़")
925 ("" . "र")
926 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
927 ;;2150
928 ("" . "ऱ")
929 ("" . "ल")
930 ("" . "ळ")
931 ("" . "ऴ")
932 ("" . "व")
933 ("" . "श")
934 ("" . "ष")
935 ("" . "स")
936 ("" . "ह")
937 ("" . "ा")
938 ("" . "ि")
939 ("" . "ी")
940 ("" . "ु")
941 ("" . "ू")
942 ("" . "ृ")
943 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
944 ;;2160
945 ("" . "ॆ")
946 ("" . "े")
947 ("" . "ै")
948 ("" . "ॅ")
949 ("" . "ॊ")
950 ("" . "ो")
951 ("" . "ौ")
952 ("" . "ॉ")
953 ("" . "्")
954 ("" . "़")
955 ("" . "।")
956 ("" . "॥")
957 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
958 ;;2170
959 ("" . "०")
960 ("" . "१")
961 ("" . "२")
962 ("" . "३")
963 ("" . "४")
964 ("" . "५")
965 ("" . "६")
966 ("" . "७")
967 ("" . "८")
968 ("" . "९")
969 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
970 ;;2220
971 ("" . "ज़्र")
972 ("" . "फ़्र")
973 ("" . "क्र")
974 ("" . "ग्र")
975 ("" . "त्र")
976 ("" . "प्र")
977 ("" . "फ्र")
978 ("" . "श्र")
979 ("" . "रु")
980 ("" . "रू")
981 ("" . "ऱु")
982 ("" . "ऱू")
983 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
984 ;;2230
985 ("" . "क्")
986 ("" . "ख्")
987 ("" . "ग्")
988 ("" . "घ्")
989 ("" . "च्")
990 ("" . "च्र्")
991 ("" . "ज्")
992 ("" . "झ्")
993 ("" . "ञ्")
994 ("" . "ञ्")
995 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
996 ;;2240
997 ("" . "ण्")
998 ("" . "त्")
999 ("" . "थ्")
1000 ("" . "ध्")
1001 ("" . "न्")
1002 ("" . "ऩ्")
1003 ("" . "प्")
1004 ("" . "फ्")
1005 ("" . "ब्")
1006 ("" . "ब्")
1007 ("" . "भ्")
1008 ("" . "म्")
1009 ("" . "य्")
1010 ("" . "य़्")
1011 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1012 ;;2250
1013 ("" . "ल्")
1014 ("" . "ळ्")
1015 ("" . "ऴ्")
1016 ("" . "व्")
1017 ("" . "श्")
1018 ("" . "ष्")
1019 ("" . "स्")
1020 ("" . "्य")
1021 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1022 ;;2260
1023 ("" . "ग्र्")
1024 ("" . "घ्न्")
1025 ("" . "त्त्")
1026 ("" . "त्र्")
1027 ("" . "ध्न्")
1028 ("" . "ध्र्")
1029 ("" . "प्त्")
1030 ("" . "श्च्")
1031 ("" . "श्र्")
1032 ("" . "श्व्")
1033 ("" . "न्न्")
1034 ("" . "क्ष्")
1035 ("" . "ज्ञ्")
1036 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1037 ;;2270
1038 ("" . "र्")
1039 ("" . "्र")
1040 ("" . "्र")
1041 ("" . "क़्")
1042 ("" . "ख़्")
1043 ("" . "ग़्")
1044 ("" . "फ़्")
1045 ("" . "ज़्")
1046 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1047 ;;2320
1048 ("" . "ॐ")
1049 ("" . "ऌ")
1050 ("" . "रॄ")
1051 ("" . "ॡ")
1052 ("" . "रॣ")
1053 ("" . "ॠ")
1054 ("" . "रॢ")
1055 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1056 ;;2330
1057 ("" . "क़")
1058 ("" . "ख़")
1059 ("" . "ग़")
1060 ("" . "ज़")
1061 ("" . "ड़")
1062 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1063 ;;2340
1064 ("" . "ढ़")
1065 ("" . "फ़")
1066 ("" . "ऽ")
1067 ("" . "ॄ")
1068 ("" . "ॢ")
1069 ("" . "ॣ")
1070 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1071 ;;2350
1072 ("" . "म्न")
1073 ("" . "म्ल")
1074 ("" . "हृ")
1075 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1076 ;;2360
1077 ("" . "ल्ल")
1078 ("" . "व्न")
1079 ("" . "व्व")
1080 ("" . "श्च")
1081 ("" . "श्न")
1082 ("" . "श्ब")
1083 ("" . "श्ल")
1084 ("" . "श्व")
1085 ("" . "ष्ट्र्य")
1086 ("" . "ष्ट्य")
1087 ("" . "ष्ट्व")
1088 ("" . "ष्ट")
1089 ("" . "ष्ठ")
1090 ("" . "स्न")
1091 ("" . "स्र")
1092 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1093 ;;2370
1094 ("" . "ह्ण")
1095 ("" . "ह्न")
1096 ("" . "ह्म")
1097 ("" . "ह्य")
1098 ("" . "ह्र")
1099 ("" . "ह्ल")
1100 ("" . "ह्व")
1101 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1102 ;;2420
1103 ("" . "क्त्र्य")
1104 ("" . "क्त्व")
1105 ("" . "क्त्य")
1106 ("" . "क्न्य")
1107 ("" . "क्र्य")
1108 ("" . "क्व्य")
1109 ("" . "क्क")
1110 ("" . "क्त")
1111 ("" . "क्न")
1112 ("" . "क्म")
1113 ("" . "क्य")
1114 ("" . "क्ल")
1115 ("" . "क्व")
1116 ("" . "क्ष")
1117 ("" . "घ्न")
1118 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1119 ;;2430
1120 ("" . "ङ्क्त्य")
1121 ("" . "ङ्क्ष्व")
1122 ("" . "ङ्क्त")
1123 ("" . "ङ्क्ष")
1124 ("" . "ङ्घ्र")
1125 ("" . "ङ्क्य")
1126 ("" . "ङ्ख्य")
1127 ("" . "ङ्ग्य")
1128 ("" . "ङ्घ्य")
1129 ("" . "ङ्क")
1130 ("" . "ङ्ख")
1131 ("" . "ङ्ग")
1132 ("" . "ङ्घ")
1133 ("" . "ङ्ङ")
1134 ("" . "ङ्न")
1135 ("" . "ङ्म")
1136 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1137 ;;2440
1138 ("" . "ङ्य")
1139 ("" . "च्च")
1140 ("" . "च्ञ")
1141 ("" . "छ्य")
1142 ("" . "ज्र")
1143 ("" . "ज्ञ")
1144 ("" . "ञ्च")
1145 ("" . "ञ्ज")
1146 ("" . "ट्क")
1147 ("" . "ट्ट")
1148 ("" . "ट्ठ")
1149 ("" . "ट्य")
1150 ("" . "ठ्य")
1151 ("" . "ड्ग्य")
1152 ("" . "ड्घ्र")
1153 ("" . "ड्र्य")
1154 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1155 ;;2450
1156 ("" . "ड्ग")
1157 ("" . "ड्घ")
1158 ("" . "ड्ड")
1159 ("" . "ड्म")
1160 ("" . "ड्य")
1161 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1162 ;;2460
1163 ("" . "ढ्य")
1164 ("" . "त्त")
1165 ("" . "त्न")
1166 ("" . "द्द्य")
1167 ("" . "द्ध्य")
1168 ("" . "द्भ्य")
1169 ("" . "द्र्य")
1170 ("" . "द्व्य")
1171 ("" . "द्ग्र")
1172 ("" . "द्घ्र")
1173 ("" . "द्द्व")
1174 ("" . "द्ध्व")
1175 ("" . "द्ग")
1176 ("" . "द्घ")
1177 ("" . "द्द")
1178 ("" . "द्ध")
1179 ;; 0 1 2 3 4 5 6 7 8 9 a b c d e f
1180 ;;2470
1181 ("" . "द्न")
1182 ("" . "द्ब")
1183 ("" . "द्भ")
1184 ("" . "द्म")
1185 ("" . "द्य")
1186 ("" . "द्व")
1187 ("" . "ध्न")
1188 ("" . "न्न")
1189 ("" . "प्त")
1190 ("" . "प्न")
1191 ("" . "प्ल")
1192 ("" . "ब्न")
1193 ("" . "ब्ब")
1194 ("" . "ब्व")
1195 ("" . "भ्न")))
1197 (defconst indian-2-column-to-ucs-regexp
1198 "\\|\\|[]\\|[-]")
1200 (put 'indian-2-column-to-ucs-chartable 'char-table-extra-slots 1)
1201 (defconst indian-2-column-to-ucs-chartable
1202 (let ((table (make-char-table 'indian-2-column-to-ucs-chartable))
1203 (alist nil))
1204 (dolist (elt indian-2-colum-to-ucs)
1205 (if (= (length (car elt)) 1)
1206 (aset table (aref (car elt) 0) (cdr elt))
1207 (setq alist (cons elt alist))))
1208 (set-char-table-extra-slot table 0 alist)
1209 table))
1211 ;;;###autoload
1212 (defun indian-2-column-to-ucs-region (from to)
1213 "Convert old Emacs Devanagari characters to UCS."
1214 (interactive "r")
1215 (save-excursion
1216 (save-restriction
1217 (let ((pos from)
1218 (alist (char-table-extra-slot indian-2-column-to-ucs-chartable 0)))
1219 (narrow-to-region from to)
1220 (decompose-region from to)
1221 (goto-char (point-min))
1222 (while (re-search-forward indian-2-column-to-ucs-regexp nil t)
1223 (let ((len (- (match-end 0) (match-beginning 0)))
1224 subst)
1225 (if (= len 1)
1226 (setq subst (aref indian-2-column-to-ucs-chartable
1227 (char-after (match-beginning 0))))
1228 (setq subst (cdr (assoc (match-string 0) alist))))
1229 (replace-match (if subst subst "?"))))
1230 (indian-compose-region (point-min) (point-max))))))
1232 (provide 'ind-util)
1234 ;;; ind-util.el ends here