(latexenc-find-file-coding-system): Don't inherit the EOL part of the
[emacs.git] / lisp / term / internal.el
blob87a78d2e9a259a803f328e9cd94f5da5ee4f39e2
1 ;;; internal.el --- support for PC internal terminal -*- coding: raw-text; no-byte-compile: t -*-
3 ;; Copyright (C) 1993, 1994, 1998, 1999, 2001 Free Software Foundation, Inc.
5 ;; Author: Morten Welinder <terra@diku.dk>
7 ;; This file is part of GNU Emacs.
9 ;; GNU Emacs is free software; you can redistribute it and/or modify
10 ;; it under the terms of the GNU General Public License as published by
11 ;; the Free Software Foundation; either version 2, or (at your option)
12 ;; any later version.
14 ;; GNU Emacs is distributed in the hope that it will be useful,
15 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
16 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 ;; GNU General Public License for more details.
19 ;; You should have received a copy of the GNU General Public License
20 ;; along with GNU Emacs; see the file COPYING. If not, write to the
21 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
22 ;; Boston, MA 02111-1307, USA.
24 ;;; Commentary:
26 ;;; Code:
28 ;; ---------------------------------------------------------------------------
29 ;; keyboard setup -- that's simple!
30 (set-input-mode nil nil 0)
31 (define-key function-key-map [backspace] "\177") ; Normal behaviour for BS
32 (define-key function-key-map [delete] "\C-d") ; ... and Delete
33 (define-key function-key-map [tab] [?\t])
34 (define-key function-key-map [linefeed] [?\n])
35 (define-key function-key-map [clear] [11])
36 (define-key function-key-map [return] [13])
37 (define-key function-key-map [escape] [?\e])
38 (define-key function-key-map [M-backspace] [?\M-\d])
39 (define-key function-key-map [M-delete] [?\M-d])
40 (define-key function-key-map [M-tab] [?\M-\t])
41 (define-key function-key-map [M-linefeed] [?\M-\n])
42 (define-key function-key-map [M-clear] [?\M-\013])
43 (define-key function-key-map [M-return] [?\M-\015])
44 (define-key function-key-map [M-escape] [?\M-\e])
45 (put 'backspace 'ascii-character 127)
46 (put 'delete 'ascii-character 127)
47 (put 'tab 'ascii-character ?\t)
48 (put 'linefeed 'ascii-character ?\n)
49 (put 'clear 'ascii-character 12)
50 (put 'return 'ascii-character 13)
51 (put 'escape 'ascii-character ?\e)
53 ;; ----------------------------------------------------------------------
54 ;; DOS display setup
55 ;; =================
57 ;; DOS can only support a single font. On most systems (with the
58 ;; possible exception of Far Eastern DOS versions), this means that
59 ;; two character sets are available at any given time: the ASCII
60 ;; charset, and a single national charset, usually mapped to codes
61 ;; above 128 (i.e., with 8th bit set). Which national charset is
62 ;; supported depends on the codepage loaded by the system when it
63 ;; boots; usually, this codepage cannot be changed without
64 ;; rebooting.
66 ;; Since each codepage can usually display character of a single
67 ;; MULE charset, Emacs can display a single MULE charset with the
68 ;; glyphs of the current codepage. The mapping from DOS codepages
69 ;; to MULE charsets is established by the charset property of the
70 ;; cpNNN-decode-table variables in codepage.el, which also
71 ;; defines translation tables for each such pair, and a bunch of
72 ;; functions to generate coding systems that use those translation
73 ;; tables to convert codepage-encoded text to the appropriate MULE
74 ;; charset and back. When Emacs starts on DOS, it automatically
75 ;; sets its default coding systems for file I/O and terminal output
76 ;; according to the currend DOS codepage, given by the
77 ;; `dos-codepage' variable.
79 ;; This leaves us with the problem of displaying character sets
80 ;; other than the one which maps directly into the current codepage.
81 ;; The following functions and variables handle this nuisance by
82 ;; defining a display table where each character that doesn't have a
83 ;; glyph in some codepage is mapped to a string which represents it.
84 ;; For example, a small c with cedilla is mapped to the string
85 ;; "{,c}" (the braces serve as a sign that this is a single
86 ;; character). A nice feature of the display tables is that Emacs
87 ;; knows that the string represents a single character, and thus
88 ;; cursor motion works as you'd expect: a single `C-f' moves past
89 ;; the entire string which represents a single character.
90 ;; ----------------------------------------------------------------------
92 (defvar IT-character-translations
94 (latin-iso8859-1
95 . [255 "!I" "|c" "Pd" "$$" "Ye" "|" "SE" "\"" "(c)"
96 "_a" "<<" "~" "--" "(R)" "'-" "^o" "+-" "^2" "^3"
97 "'" "u" ".P" "^." "'," "^1" "_o" ">>" "1/4" "1/2"
98 "3/4" "?I" "`A" "A'" "A^" "~A" "\"A" "Ao" "AE" ",C"
99 "`E" "E'" "E^" "\"E" "`I" "I'" "I^" "\"I" "-D" "~N"
100 "`O" "O'" "O^" "~O" "\"O" "*x" "/O" "`U" "U'" "U^"
101 "\"U" "Y'" "-P" "ss" "`a" "a'" "a^" "~a" "\"a" "ao"
102 "ae" ",c" "`e" "e'" "e^" "\"e" "`i" "i'" "i^" "\"i"
103 "-d" "~n" "`o" "o'" "o^" "~o" "\"o" "-:" "/o" "`u"
104 "u'" "u^" "\"u" "y'" "-p" "\"y"]
106 (latin-iso8859-2
107 . [255 "A;" "'(" "/L" "$$" "L<" "S'" "SE" "\"" "S<"
108 ",S" "T<" "Z'" "--" "Z<" "Z^." "^o" "a;" "';" "/l"
109 "'" "l<" "s'" "'<" "'," "s<" ",s" "t<" "z'" "'"
110 "z<" "z^." "R'" "A'" "A^" "A(" "\"A" "L'" "C'" ",C"
111 "C<" "E'" "E;" "E:" "E<" "I'" "I^" "D<" "/D" "N'"
112 "N<" "O'" "O^" "O''" "\"O" "*x" "R<" "U^0" "U'" "U''"
113 "\"U" "Y'" ",T" "ss" "r'" "a'" "a^" "a(" "\"a" "l'"
114 "c'" ",c" "c<" "e'" "e;" "\"e" "e<" "i'" "i^" "d<"
115 "/d" "n'" "n<" "o'" "o^" "o''" "\"o" "-:" "r<" "u^0"
116 "u'" "u''" "\"u" "y'" ",t" "'."]
118 (latin-iso8859-3
119 . [255 "/H" "'(" "Pd" "$$" " " "H^" "SE" "\"" "I^."
120 ",S" "G(" "J^" "--" " " "Z^." "^o" "/h" "^2" "^3"
121 "'" "u" "h^" "." "'," "i^." ",s" "g(" "j^" "1/2"
122 " " "z^." "`A" "A'" "A^" " " "\"A" "C^." "C^" ",C"
123 "`E" "E'" "E^" "\"E" "`I" "I'" "I^" "\"I" " " "~N"
124 "`O" "O'" "O^" "G^." "\"O" "*x" "G^" "`U" "U'" "U^"
125 "\"U" "U(" "S^" "ss" "`a" "a'" "a^" " " "\"a" "c^."
126 "c^" ",c" "`e" "e'" "e^" "\"e" "`i" "i'" "i^" "\"i"
127 " " "~n" "`o" "o'" "o^" "g^." "\"o" "-:" "g^" "`u"
128 "u'" "u^" "\"u" "u(" "s^" "^."]
130 (latin-iso8859-4
131 . [255 "A;" "kk" ",R" "$$" "?I" ",L" "SE" "\"" "S<"
132 "E-" ",G" "/T" "--" "Z<" "'-" "^o" "a;" "';" ",r"
133 "'" "~i" ",l" "'<" "'," "s<" "e-" ",g" "/t" "NG"
134 "z<" "ng" "A-" "A'" "A^" "~A" "\"A" "Ao" "AE" "I;"
135 "C<" "E'" "E;" "\"E" "E^." "I'" "I^" "I-" "/D" ",N"
136 "O-" ",K" "O^" "~O" "\"O" "*x" "/O" "U;" "U'" "U^"
137 "\"U" "~U" "U-" "ss" "a-" "a'" "a^" "~a" "\"a" "ao"
138 "ae" "i;" "c<" "e'" "e;" "\"e" "e^." "i'" "i^" "i-"
139 "/d" ",n" "o-" ",k" "o^" "~o" "\"o" "-:" "/o" "u;"
140 "u'" "u^" "\"u" "~u" "u-" "^."]
142 (cyrillic-iso8859-5
143 . [255 "\"E" "Dj" "Gj" "IE" "Dz" "Ii" "Ji" "JE" "Lj"
144 "Nj" "Ts" "Kj" 240 "V%" "Dzh" 65 "B=" 66 226
145 68 69 "Z%" 51 85 "J=" 75 "L=" 77 72
146 79 "P=" 80 67 84 89 232 88 "C=" "C%"
147 "S%" "Sc" "=\"" "Y=" "%\"" "Ee" "Yu" "Ya" 97 98
148 "v=" "g=" 103 101 "z%" "z=" 117 "j=" 107 "l="
149 "m=" "n=" 111 110 112 99 "t=" 121 "f=" 120
150 "c=" "c%" "s%" "sc" "='" "y=" "%'" "ee" "yu" "ya"
151 "N0" "\"e" "dj" "gj" "ie" "dz" "ii" "ji" "je" "lj"
152 "nj" "ts" "kj" 21 "v%" "dzh"]
154 (arabic-iso8859-6
155 . [255 nil nil nil "$$" nil nil nil nil nil
156 nil nil ",+" "--" nil nil nil nil nil nil
157 nil nil nil nil nil nil nil ";+" nil nil
158 nil "?+" nil "H'" "aM" "aH" "wH" "ah" "yH"
159 "a+" "b+" "tm" "t+" "tk" "g+" "hk" "x+" "d+" "dk"
160 "r+" "z+" "s+" "sn" "c+" "dd" "tj" "zH" "e+" "i+"
161 nil nil nil nil nil "++" "f+" "q+" "k+" "l+"
162 "m+" "n+" "h+" "w+" "j+" "y+" ":+" "\"+" "=+" "/+"
163 "'+" "1+" "3+" "0+" nil nil nil nil nil nil
164 nil nil nil nil nil nil nil]
166 (greek-iso8859-7
167 . [255 "9'" "'9" "Pd" nil nil "|" "SE" "\"" "(c)"
168 nil "<<" "~" "--" nil "-M" "^o" "+-" "^2" "^3"
169 "'" "'%" "'A" "^." "'E" "'H" "'I" ">>" "'O" "1/2"
170 "'Y" "W%" "i3" 65 66 "G*" "D*" 69 90 72
171 "TH" 73 74 "L*" 77 78 "C*" 79 "P*" 80
172 nil "S*" 84 89 "F*" 88 "Q*" "W*" "\"I" "\"Y"
173 "a%" "e%" "y%" "i%" "u3" "a*" "b*" "g*" "d*" "e*"
174 "z*" "y*" "h*" "i*" 107 "l*" "m*" "n*" "c*" 111
175 "p*" "r*" "*s" "s*" "t*" 117 "f*" "x*" "q*" "w*"
176 "\"i" "\"u" "'o" "'u" "'w" nil]
178 ;; Note: some of the characters undefined according to ISO 8859-8
179 ;; in the ranges 190..220 and 250..255 are replaced with SI 1311-1
180 ;; points (Niqud) and bidi formatting characters
181 (hebrew-iso8859-8
182 . [255 nil "|c" "Pd" "$$" "Ye" "|" "SE" "\"" "(c)"
183 "*x" "<<" "~" "--" "(R)" "'-" "^o" "+-" "^2" "^3"
184 "'" "u" ".P" "^." "'," "^1" "-:" ">>" "1/4" "1/2"
185 "3/4" nil ":'" "v:" "-:" "-':" ".'" ".." "v'" "-'"
186 "-," "`." nil "\\." "(.)" "|'" "`-" "`=" "||" nil
187 nil "::" nil nil nil nil nil nil nil "LRO"
188 "RLO" "PDF" nil "=2" "A+" "B+" "G+" "D+" "H+" "W+"
189 "Z+" "X+" "Tj" "J+" "K%" "K+" "L+" "M%" "M+" "N%"
190 "N+" "S+" "E+" "P%" "P+" "Zj" "ZJ" "Q+" "R+" "Sh"
191 "T+" "LRE" "RLE" "LRM" "RLM" nil]
193 (latin-iso8859-9
194 . [255 "!I" "|c" "Pd" "$$" "Ye" "|" "SE" "\"" "(c)"
195 "_a" "<<" "~" "--" "(R)" "'-" "^o" "+-" "^2" "^3"
196 "'" "u" ".P" "^." "'," "^1" "_o" ">>" "1/4" "1/2"
197 "3/4" "?I" "`A" "A'" "A^" "~A" "\"A" "Ao" "AE" ",C"
198 "`E" "E'" "E^" "\"E" "`I" "I'" "I^" "\"I" "G(" "~N"
199 "`O" "O'" "O^" "~O" "\"O" "*x" "/O" "`U" "U'" "U^"
200 "\"U" "I^." ",S" "ss" "`a" "a'" "a^" "~a" "\"a" "ao"
201 "ae" ",c" "`e" "e'" "e<" "\"e" "e^." "i'" "i^" "i-"
202 "g(" "~n" "`o" "o'" "o^" "~o" "\"o" "-:" "/o" "`u"
203 "u'" "u^" "\"u" "i." ",s" "\"y"]
205 (latin-iso8859-14
206 . [255 "B`" "b`" "Pd" "C`" "c`" "D`" "SE" "`W" "(c)"
207 "W'" "d`" "`Y" "--" "(R)" "\"Y" "F`" "f`" "G`" "g`"
208 "M`" "m`" ".P" "P`" "`w" "p`" "w'" "S`" "`y" "\"W"
209 "\"w" "s`" "`A" "A'" "A^" "~A" "\"A" "Ao" "AE" ",C"
210 "`E" "E'" "E^" "\"E" "`I" "I'" "I^" "\"I" "W^" "~N"
211 "`O" "O'" "O^" "~O" "\"O" "T`" "/O" "`U" "U'" "U^"
212 "\"U" "Y'" "Y^" "ss" "`a" "a'" "a^" "~a" "\"a" "ao"
213 "ae" ",c" "`e" "e'" "e^" "\"e" "`i" "i'" "i^" "\"i"
214 "w^" "~n" "`o" "o'" "o^" "~o" "\"o" "t`" "/o" "`u"
215 "u'" "u^" "\"u" "y'" "y^" "\"y"]
217 (latin-iso8859-15
218 . [255 "!I" "|c" "Pd" "E=" "Ye" "S<" "SE" "s<" "(c)"
219 "_a" "<<" "~" "--" "(R)" "'-" "^o" "+-" "^2" "^3"
220 "Z<" "u" ".P" "^." "z<" "^1" "_o" ">>" "OE" "oe"
221 "\"Y" "?I" "`A" "A'" "A^" "~A" "\"A" "Ao" "AE" ",C"
222 "`E" "E'" "E^" "\"E" "`I" "I'" "I^" "\"I" "-D" "~N"
223 "`O" "O'" "O^" "~O" "\"O" "*x" "/O" "`U" "U'" "U^"
224 "\"U" "Y'" "|P" "ss" "`a" "a'" "a^" "~a" "\"a" "ao"
225 "ae" ",c" "`e" "e'" "e^" "\"e" "`i" "i'" "i^" "\"i"
226 "-d" "~n" "`o" "o'" "o^" "~o" "\"o" "-:" "/o" "`u"
227 "u'" "u^" "\"u" "y'" "|p" "\"y"]
230 "An alist of MULE ISO-8859 character sets and the strings that
231 should be used to represent the characters from each set on a DOS
232 terminal which does not have corresponding glyphs built into the
233 installed codepage.")
235 (defun IT-display-table-setup (codepage &optional table)
236 "Set up display table TABLE for a DOS terminal which supports
237 glyphs built into the codepage CODEPAGE.
239 If TABLE is nil or omitted, `standard-display-table' is used."
240 (let* ((surrogates IT-character-translations)
241 (disp-tab (or table standard-display-table))
242 (built-in-set (cp-charset-for-codepage codepage))
243 (offset (cp-offset-for-codepage codepage))
244 (cp-decoder
245 (symbol-value (intern-soft (format "%s-decode-table" codepage))))
246 (cp-decoder-len (length cp-decoder))
247 (c offset)
248 association chset)
249 ;; Undo the effects of previous call (where they may have used
250 ;; a different codepage) by reverting the display table for the
251 ;; built-in charset to its pristine shape.
252 (while (< c 256)
253 (aset disp-tab (make-char built-in-set c) nil)
254 (setq c (1+ c)))
255 (while surrogates
256 (setq association (car surrogates))
257 (setq chset (car association))
258 (let* ((vector (cdr association))
259 (veclen (length vector))
260 (i 0)
261 glyph)
262 (while (< i veclen)
263 (setq glyph (aref vector i))
264 (or glyph (setq glyph dos-unsupported-char-glyph))
265 (if (or (not (equal chset built-in-set))
266 (>= i cp-decoder-len)
267 (null (aref cp-decoder i)))
268 (aset disp-tab (make-char chset (+ i (logand offset 127)))
269 (vconcat
270 (if (numberp glyph)
271 (char-to-string glyph)
272 (if (> (length glyph) 1) (concat "{" glyph "}")
273 glyph)))))
274 (setq i (1+ i))))
275 (setq surrogates (cdr surrogates)))))
277 (defvar IT-unicode-translations
279 (mule-unicode-0100-24ff ; charset
280 256 ; base
281 256 563 ; first, last
282 [ "A-" "a-" "A(" "a(" "A;" "a;" "C'" "c'" "C>" "c>" ; Latin Extended-A
283 "C." "c." "C<" "c<" "D<" "d<" "D/" "d/" "E-" "e-"
284 "E(" "e(" "E." "e." "E;" "e;" "E<" "e<" "G>" "g>"
285 "G(" "g(" "G." "g." "G," "g," "H>" "h>" "H/" "h/"
286 "I~" "i~" "I-" "i-" "I(" "i(" "I;" "i;" "I." "i."
287 "IJ" "ij" "J>" "j>" "K," "k," "kk" "L'" "l'" "L,"
288 "l," "L<" "l<" "L." "l." "L/" "l/" "N'" "n'" "N,"
289 "n," "N<" "n<" "'n" "NG" "ng" "O-" "o-" "O(" "o("
290 "O\"" "o\"" "OE" "oe" "R'" "r'" "R," "r," "R<" "r<"
291 "S'" "s'" "S>" "s>" "S," "s," "S<" "s<" "T," "t,"
292 "T<" "t<" "T/" "t/" "U~" "u~" "U-" "u-" "U(" "u("
293 "U0" "u0" "U\"" "u\"" "U;" "u;" "W>" "w>" "Y>" "y>"
294 "Y:" "Z'" "z'" "Z." "z." "Z<" "z<" "s1" ; 017f
295 "b/" "B2" "=B" "=b" "B6" "b6" "!C" "C2" "c2" "-D" ;Lat. Extended-B
296 "D2" "=D" "=d" "!d" "!E" "-E" "Eps" "F2" "f2" "G2"
297 "V0" "hv" "io" "-I" "K2" "k2" "-l" "la-" "!M" "2N"
298 "n_" "-O" "O9" "o9" "OI" "oi" "P2" "p2" "'R" "!S"
299 "!s" "Esh" "!esh" "t~" "T2" "t2" "T~" "U9" "u9" "Ups"
300 "V2" "Y2" "y2" "Z/" "z/" "ED" "!ED" "!ed" "ed;" "2/"
301 "5-" "_5-" "ts" "wn" "|_" "||" "|=" "!_" "DZ<" "Dz<"
302 "dz<" "LJ3" "Lj3" "lj3" "NJ3" "Nj3" "nj3" "A<" "a<" "I<"
303 "i<" "O<" "o<" "U<" "u<" "U:-" "u:-" "U:'" "u:'" "U:<"
304 "u:<" "U:!" "u:!" "e1" "A:-" "a:-" "A.-" "a.-" "AE-" "ae-"
305 "G/" "g/" "G<" "g<" "K<" "k<" "O;" "o;" "O1" "o1"
306 "EZ" "ez" "j<" "DZ3" "Dz3" "dz3" "G'" "g'" "Hv" "Wn"
307 "N`" "n`" "AA'" "aa'" "AE'" "ae'" "O/'" "o/'" "A!!" "a!!"
308 "A)" "a)" "E!!" "e!!" "E)" "e)" "I!!" "i!!" "I)" "i)"
309 "O!!" "o!!" "O)" "o)" "R!!" "r!!" "R)" "r)" "U!!" "u!!"
310 "U)" "u)" ",S" ",s" ",T" ",t" "'3" "'3_" "H<" "h<"
311 nil nil "8" "8_" "Z2" "z2" "A." "a." "E," "e,"
312 "O:-" "o:-" "O~-" "o~-" "O." "o." "O.-" "o.-" "Y-" "y-"] ; 0x233
316 (mule-unicode-0100-24ff ; charset
317 256 ; base
318 884 1123 ; first, last
319 [ "'" "," nil nil nil nil "j3" nil nil nil ; Greek
320 "?;" nil nil nil nil nil "'*" "'%" "A%" ".*"
321 "E%" "Y%" "I%" nil "O%" nil "U%" "W%" "i3" "A*"
322 "B*" "G*" "D*" "E*" "Z*" "H*" "Th*" "I*" "K*" "L*"
323 "M*" "N*" "C*" "O*" "P*" "R*" nil "S*" "T*" "U*"
324 "F*" "X*" "Q*" "W*" "J*" "V*" "a%" "e%" "y%" "i%"
325 "u3" "a*" "b*" "g*" "d*" "e*" "z*" "h*" "th*" "i*"
326 "k*" "l*" "m*" "n*" "c*" "o*" "p*" "r*" "*s" "s*"
327 "t*" "u*" "f*" "x*" "q*" "w*" "j*" "v*" "o%" "u%"
328 "w%" nil "b3" "th%" "U2*" "'U2*" "U:2*" "ph*" "pi*" "ka*"
329 nil nil "Sti" "sti" "Dig" "dig" "Kop" "kop" "Sam" "sam"
330 "She" "she" "Fei" "fei" "Khe" "khe" "Hor" "hor" "Gan" "gan"
331 "Shi" "shi" "Dei" "dei" "ka*" "rh*" "ls*" "yo*" nil nil
332 nil nil nil nil nil nil nil nil nil nil
333 "IE'" "E:" "D%" "G%" "IE" "DS" "II" "YI" "J%" "LJ" ; Cyrillic
334 "NJ" "Ts" "KJ" "`I=" "V%" "DZ" 65 "B=" 66 "G="
335 68 69 "Z%" 51 85 "J=" 75 "L=" 77 72
336 79 "P=" 80 67 84 89 "F=" 88 "C=" "C%"
337 "S%" "Sc" "=\"" "Y=" "%\"" "Ee" "JU" "JA" 97 "b="
338 98 "g=" 103 101 "z%" "z=" 117 "j=" 107 "l="
339 109 "n=" 111 "p=" 112 99 "t=" 121 "f=" 120
340 "c=" "c%" "s%" "sc" "='" "y=" "%'" "ee" "ju" "ja"
341 "ie'" "e:" "d%" "g%" "ie" "ds" "ii" "yi" "j%" "lj"
342 "nj" "ts" "kj" "v%" "`i=" "dz" "OM=" "om=" "Y3" "y3"] ; 0x463
345 (mule-unicode-0100-24ff ; charset
346 256 ; base
347 1454 1645 ; first, last
348 [ nil nil ":'" "v:" "-:" "-':" ".'" ".." "v'" "-'"
349 "-," "`." nil "\\." "(.)" "|'" "`-" nil "||" nil
350 nil "::" nil nil nil nil nil nil nil nil
351 nil nil nil nil
352 "A+" "B+" "G+" "D+" "H+" "W+" "Z+" "X+" "Tj" "J+" ; Hebrew
353 "K%" "K+" "L+" "M%" "M+" "N%" "N+" "S+" "E+" "P%"
354 "P+" "Zj" "ZJ" "Q+" "R+" "Sh" "T+" nil nil nil
355 nil nil "WW+" "WJ+" "JJ+" "'+" "\"+" nil nil nil
356 nil nil nil nil nil nil nil nil nil nil
357 nil nil nil nil nil nil nil nil nil nil
358 ",+" nil nil nil nil nil nil nil nil nil ; Arabic
359 nil nil nil nil nil ";+" nil nil nil "?+"
360 nil "H'" "aM" "aH" "wH" "ah" "yH" "a+" "b+" "tm"
361 "t+" "tk" "g+" "hk" "x+" "d+" "dk" "r+" "z+" "s+"
362 "sn" "c+" "dd" "tj" "zH" "e+" "i+" nil nil nil
363 nil nil "++" "f+" "q+" "k+" "l+" "m+" "n+" "h+"
364 "w+" "j+" "y+" ":+" "\"+" "=+" "/+" "'+" "1+" "3+"
365 "0+" nil nil nil nil nil nil nil nil nil
366 nil nil nil nil "0a" "1a" "2a" "3a" "4a" "5a"
367 "6a" "7a" "8a" "9a" "a%" "a." "a," "a*" ]
370 (mule-unicode-0100-24ff ; charset
371 256 ; base
372 7680 9450 ; first, last
373 [ "A-0" "a-0" "B." "b." "B-." "b-." "B_" "b_" "C,'" "c,'" ; Lat Ext Add
374 "D." "d." "D-." "d-." "D_" "d_" "D," "d," "D->" "d->"
375 "E-!" "e-!" "E-'" "e-'" "E->" "e->" "E-?" "e-?" "E,(" "e,("
376 "F." "f." "G-" "g-" "H." "h." "H-." "h-." "H:" "h:"
377 "H," "h," "H-(" "h-(" "I-?" "i-?" "I:'" "i:'" "K'" "k'"
378 "K-." "k-." "K_" "k_" "L-." "l-." "_L-." "_l-." "L_" "l_"
379 "L->" "l->" "M'" "m'" "M." "m." "M-." "m-." "N." "n."
380 "N-." "n-." "N_" "n_" "N->" "n->" "O?'" "o?'" "O?:" "o?:"
381 "O-!" "o-!" "O-'" "o-'" "P'" "p'" "P." "p." "R." "r."
382 "R-." "r-." "_R-." "_r-." "R_" "r_" "S." "s." "S-." "s-."
383 "S'." "s'." "S<." "s<." ".S-." ".s-." "T." "t." "T-." "t-."
384 "T_" "t_" "T->" "t->" "U_:" "u_:" "U-?" "u-?" "U->" "u->"
385 "U?'" "u?'" "U-:" "u-:" "V?" "v?" "V-." "v-." "W!" "w!"
386 "W'" "w'" "W:" "w:" "W." "w." "W-." "w-." "X." "x."
387 "X:" "x:" "Y." "y." "Z>" "z>" "Z-." "z-." "Z_" "z_"
388 "h_" "t:" "w0" "y0" "a))" "s1." nil nil nil nil
389 "A-." "a-." "A2" "a2" "A>'" "a>'" "A>!" "a>!" "A>2" "a>2"
390 "A>~" "a>~" ".A>" ".a>" "A('" "a('" "A(!" "a(!" "A(2" "a(2"
391 "A(~" "a(~" ".A(" ".a(" "E-." "e-." "E2" "e2" "E~" "e~"
392 "E>'" "e>'" "E>!" "e>!" "E>2" "e>2" "E>~" "e>~" ".E>" ".e>"
393 "I2" "i2" "I-." "i-." "O-." "o-." "O2" "o2" "O>'" "o>'"
394 "O>!" "o>!" "O>2" "o>2" "O>~" "o>~" ".O>" ".o>" "O9'" "o9'"
395 "O9!" "o9!" "O92" "o92" "O9~" "o9~" ".O9" ".o9" "U-." "u-."
396 "U2" "u2" "U9'" "u9'" "U9!" "u9!" "U92" "u92" "U9~" "u9~"
397 ".U9" ".u9" "Y!" "y!" "Y-." "y-." "Y2" "y2" "Y~" "y~"
398 nil nil nil nil nil nil "a*," "a*;" nil nil ; Greek Ext (0x1f00)
399 nil nil nil nil "A*," "A*;" nil nil nil nil
400 nil nil "e*," "e*;" nil nil nil nil nil nil
401 "E*," "E*;" nil nil nil nil nil nil "y*," "y*;"
402 nil nil nil nil nil nil "Y*," "Y*;" nil nil
403 nil nil nil nil "i*," "i*;" nil nil nil nil
404 nil nil "I*," "I*;" nil nil nil nil nil nil
405 "o*," "o*;" nil nil nil nil nil nil "O*," "O*;"
406 nil nil nil nil nil nil "u*," "u*;" nil nil
407 nil nil nil nil nil "U*;" nil nil nil nil
408 nil nil "w*," "w*;" nil nil nil nil nil nil
409 "W*," "W*;" nil nil nil nil nil nil "a*!" "a*'"
410 "e*!" "e*'" "y*!" "y*'" "i*!" "i*'" "o*!" "o*'" "u*!" "u*'"
411 "w*!" "w*'" nil nil nil nil nil nil nil nil
412 nil nil nil nil nil nil nil nil nil nil
413 nil nil nil nil nil nil nil nil nil nil
414 nil nil nil nil nil nil nil nil nil nil
415 nil nil nil nil nil nil nil nil nil nil
416 nil nil "a*(" "a*-" nil "a*j" nil nil "a*~" nil
417 "A*(" "A*-" "A*!" "A*'" "A*J" ")*" "J3" ",," "?*" "?:"
418 nil "y*j" nil nil "y*?" nil "E*!" "E*'" "Y*!" "Y*'"
419 "Y*J" ",!" ",'" "?," "i*(" "i*-" nil nil nil nil
420 "i*?" nil "I*(" "I*-" "I*!" "I*'" nil ";!" ";'" "?;"
421 "u*(" "u*-" nil nil "r*," "r*;" "u*?" nil "U*(" "U*-"
422 "U*!" "U*'" "R*;" "!:" ":'" "!*" nil nil nil "w*j"
423 nil nil "w*?" nil "O*!" "O*'" "W*!" "W*'" "W*J" "/*"
424 ";;" nil nil nil "1N" "1M" "3M" "4M" "6M" nil ; Gen Punct
425 nil "1T" "1H" nil nil nil "LRM" "RLM" "-1" nil
426 nil "--" "---" "===" "!2" "=2" "6`" "'9" ".9" "9'"
427 "``" "''" ":9" "9``" "/-" "/=" "sb" "3b" nil ".."
428 "..." ".-" "LSep" "PSep" "LR[" "RL[" "PDF" "LRO" "RLO" 255
429 "%o" "%oo" "'" "''" "\"'" "`" "``" "```" ".^" "<,"
430 ",>" ":X" "!!" "?!" "'-" nil nil nil nil "-b"
431 "/f" nil nil nil nil nil nil nil nil nil
432 nil nil nil nil nil nil nil nil nil nil
433 nil nil nil nil nil nil nil nil nil nil
434 nil nil nil nil nil nil nil nil nil nil
435 nil nil nil nil "^0" nil nil nil "^4" "^5"
436 "^6" "^7" "^8" "^9" "^+" "^-" "^=" "^(" "^)" "^n"
437 "_0" "_1" "_2" "_3" "_4" "_5" "_6" "_7" "_8" "_9"
438 "_+" "_-" "_=" "_(" "_)" nil nil nil nil nil
439 nil nil nil nil nil nil nil nil nil nil
440 nil nil nil nil nil "Ff" "Li" nil nil "Pt"
441 nil "W=" "NIS" nil "E=" nil nil nil nil nil
442 nil nil nil nil nil nil nil nil nil nil
443 nil nil nil nil nil nil nil nil nil nil
444 nil nil nil nil nil nil nil nil nil nil
445 nil nil nil nil nil nil nil nil nil nil
446 nil nil nil nil nil nil nil nil nil nil
447 nil nil nil nil nil nil nil nil nil nil
448 nil nil nil nil nil nil nil nil nil nil
449 nil nil nil nil nil nil nil nil "a/c" "a/s"
450 nil "oC" nil "c/o" "c/u" "=e" nil "oF" nil nil
451 nil nil "-h" "=h" nil nil nil nil nil nil
452 "N0" "PO" nil nil nil nil "Re" nil "Rx" nil
453 "SM" "TEL" "TM" nil nil nil "Om" nil nil nil
454 "oK" "AO" nil nil "Est" nil nil nil nil nil
455 nil "Aleph" "Bet" "Gimel" "Dalet" "=i=" nil nil nil nil
456 nil nil nil nil nil nil nil nil nil nil
457 nil nil nil nil nil nil nil nil nil nil
458 nil "1/3" "2/3" "1/5" "2/5" "3/5" "4/5" "1/6" "5/6" "1/8"
459 "3/8" "5/8" "7/8" "1/" ".I" "II" "III" "IV" ".V" "VI"
460 "VII" "VIII" "IX" "X" "XI" "XII" ".L" ".C" ".D" ".M"
461 ".i" "ii" "iii" "iv" ".v" "vi" "vii" "viii" "ix" ".x"
462 "xi" ".l" ".c" ".d" ".m" "CD" "DD" "CoD" "CI" nil
463 nil nil nil nil nil nil nil nil nil nil
464 nil "<-" "|^" "->" "|v" "<->" "v|^" "^\\" "/^" "\\v"
465 "v/" "<-/" "/->" "<~" "~>" "<<-" "|^^" "->>" "|vv" "<-<"
466 ">->" "<-|" "_|^" "|->" "-|v" "_v|^" "<-?" "?->" "<-o" "o->"
467 "<~>" "<-/>" nil nil nil nil nil nil nil nil
468 nil nil nil nil nil nil nil nil nil nil
469 nil nil nil nil nil nil nil nil nil nil
470 nil nil nil "<=/" "<=/>" "/=>" "<=" "||^" "=>" "||v"
471 "<=>" "v||^" "^\\\\" "//^" "\\\\v" "v//" "<-=" "=->" nil nil
472 nil nil "<.." ":^" "..>" ":v" nil nil "<::" "::^"
473 "::>" "::v" nil nil nil nil nil nil nil nil
474 nil nil nil nil nil nil nil nil nil nil
475 nil nil nil nil "FA" "C." "dP" "TE" "~TE" "/0"
476 "DE" "NB" "(-" "~(-" "e-" "-)" "~-)" "-e" "QED" "*P"
477 nil "+Z" "--" "-+" ".+" "./" ".\\" "*-" "Ob" "Sb"
478 "SQR" "CBR" nil "0(" "00" "-L" "-V" nil nil ".|"
479 "~.|" "||" "/||" "AND" "OR" "(U" ")U" "In" "DI" nil
480 "Io" nil nil nil nil nil ".:" ":." ":R" "::"
481 ".-." "-:" ":-:" ":~:" "?~" "~?" "??" nil nil "/~"
482 "-~" "~-" "/~-" "~=" "~/=" "/~=" "~~" "/~~" nil nil
483 "=?" ")(" "v^" "^_" ".=" "=;" ".=." nil ":=" "=:"
484 nil "=o" "=)" "=^" "=v" "*=" "=<>" "=df" nil "?="
485 "!=" "-=" "!-=" "==" "=<" ">=" nil nil nil nil
486 "<<" ">>" "()" "/)(" "!<" "!>" nil nil nil nil
487 nil nil nil nil nil nil "<'" "`>" "=<'" "`>="
488 "~<'" "`>~" "/<'" "/`>" "(C" ")C" "/(C" "/)C" "(_" ")_"
489 "/(_" "/)_" nil nil nil nil nil nil nil nil
490 nil nil nil "0+" "0-" "0x" "0/" "0." "0o" "0*"
491 "0=" "0_" nil nil nil nil "|T" "T|" "-T" "_T"
492 nil nil nil nil nil nil nil nil nil nil
493 nil nil nil nil nil nil nil nil nil "-,-"
494 nil "XOR" "NAND" "NOR" nil nil nil nil nil nil
495 nil nil nil nil nil nil nil nil nil nil
496 nil nil nil nil nil nil nil nil "<." ".>"
497 "<<<" ">>>" nil nil nil nil nil nil nil nil
498 nil nil nil nil nil nil nil nil nil nil
499 nil nil ":3" "..." nil nil nil nil nil nil
500 nil nil nil nil nil nil nil nil nil nil
501 nil nil "Eh" nil nil nil nil nil "<7" ">7"
502 "7<" "7>" nil nil nil nil "~I" nil "(A" nil
503 nil "TR" nil "=||" "88" nil nil nil nil nil
504 nil nil "Iu" "Il" nil nil "-^-" "-`-" "D->" nil
505 nil "</" "/>" "<-D" nil nil nil nil nil nil
506 nil nil nil nil nil nil nil nil nil nil
507 nil nil nil nil nil nil nil nil nil nil
508 nil nil nil nil nil nil nil nil nil nil
509 nil nil nil nil nil nil nil nil nil nil
510 nil nil nil nil nil nil nil nil nil nil
511 nil nil nil nil nil nil nil nil nil nil
512 nil nil nil nil nil nil nil nil nil nil
513 nil nil nil nil nil nil nil nil nil nil
514 nil nil nil nil nil nil nil nil nil nil
515 nil nil nil nil nil nil nil nil nil nil
516 nil nil nil nil nil nil nil nil nil nil
517 nil nil nil nil nil nil nil nil nil nil
518 nil nil nil nil nil nil nil nil nil nil
519 nil nil nil nil nil nil nil nil nil nil
520 nil nil nil nil nil nil nil nil nil nil
521 nil nil nil nil nil nil nil nil nil nil
522 nil nil nil nil nil nil nil nil nil nil
523 nil nil nil nil nil nil nil nil nil nil
524 nil nil nil nil nil nil nil nil nil nil
525 nil nil nil nil nil nil nil nil nil nil
526 nil nil nil nil nil nil "NUL" "SOH" "STX" "ETX"
527 "EOT" "ENQ" "ACK" "BEL" "BS" "HT" "LF" "VT" "FF" "CR"
528 "SS" "SI" "DLE" "DC1" "DC2" "DC3" "DC4" "NAK" "SYN" "ETB"
529 "CAN" "EM" "SUB" "ESC" "FS" "GS" "RS" "US" "SP" "DEL"
530 "b/" ",_," "NL" nil "?^" nil nil nil nil nil
531 nil nil nil nil nil nil nil nil nil nil
532 nil nil nil nil nil nil nil nil nil nil
533 nil nil nil nil nil nil nil nil nil nil
534 nil nil nil nil nil nil nil nil nil nil
535 nil nil nil nil nil nil nil nil nil nil
536 nil nil "1-o" "2-o" "3-o" "4-o" "5-o" "6-o" "7-o" "8-o"
537 "9-o" "10-o" "11-o" "12-o" "13-o" "14-o" "15-o" "16-o" "17-o" "18-o"
538 "19-o" "20-o" "(1)" "(2)" "(3)" "(4)" "(5)" "(6)" "(7)" "(8)"
539 "(9)" "(10)" "(11)" "(12)" "(13)" "(14)" "(15)" "(16)" "(17)" "(18)"
540 "(19)" "(20)" "1." "2." "3." "4." "5." "6." "7." "8."
541 "9." "10." "11." "12." "13." "14." "15." "16." "17." "18."
542 "19." "20." "(a)" "(b)" "(c)" "(d)" "(e)" "(f)" "(g)" "(h)"
543 "(i)" "(j)" "(k)" "(l)" "(m)" "(n)" "(o)" "(p)" "(q)" "(r)"
544 "(s)" "(t)" "(u)" "(v)" "(w)" "(x)" "(y)" "(z)" "A-o" "B-o"
545 "C-o" "D-o" "E-o" "F-o" "G-o" "H-o" "I-o" "J-o" "K-o" "L-o"
546 "M-o" "N-o" "O-o" "P-o" "Q-o" "R-o" "S-o" "T-o" "U-o" "V-o"
547 "W-o" "X-o" "Y-o" "Z-o" "a-o" "b-o" "c-o" "d-o" "e-o" "f-o"
548 "g-o" "h-o" "i-o" "j-o" "k-o" "l-o" "m-o" "n-o" "o-o" "p-o"
549 "q-o" "r-o" "s-o" "t-o" "u-o" "v-o" "w-o" "x-o" "y-o" "z-o"
550 "0-o" ]
554 "A list of mule-unicode-* character sets and the strings that
555 should be used to represent the characters from each set on a DOS
556 terminal which does not have corresponding glyphs built into the
557 installed codepage.")
559 (defun IT-setup-unicode-display (&optional table)
560 "Set up display table TABLE for displaying mule-unicode-* characters
561 on a DOS terminal. If TABLE is nil or omitted, `standard-display-table'
562 is used."
563 (interactive)
564 (let ((disp-tab (or table standard-display-table))
565 (tail IT-unicode-translations)
566 translation)
567 (while tail
568 (setq translation (car tail) tail (cdr tail))
569 (let* ((chset (car translation))
570 (base (nth 1 translation))
571 (first (nth 2 translation))
572 (last (nth 3 translation))
573 (table (nth 4 translation))
574 (i 0)
575 (this (- first base))
576 glyph)
577 (while (<= i (- last first))
578 (setq glyph (aref table i))
579 (or glyph (setq glyph dos-unsupported-char-glyph))
580 (aset disp-tab (make-char chset
581 (+ (/ this 96) 32)
582 (+ (% this 96) 32))
583 (vconcat
584 (if (numberp glyph)
585 (char-to-string glyph)
586 (if (> (length glyph) 1) (concat "{" glyph "}")
587 glyph))))
588 (setq i (1+ i) this (1+ this)))))))
590 (defun dos-cpNNN-setup (codepage)
591 "Set up the MULE environment using the DOS codepage CODEPAGE.
593 This function creates the coding system cpNNN (where NNN is the value
594 of the argument CODEPAGE), and then uses this coding system to set up
595 display tables, and the language environment options as appropriate."
596 (let* ((cp (format "cp%s" codepage))
597 (charset (cp-charset-for-codepage cp))
598 (offset (cp-offset-for-codepage cp)))
599 (cp-make-coding-systems-for-codepage cp charset offset)
600 ;; This is done by set-language-environment.
601 ;;(setq nonascii-translation-table
602 ;; (symbol-value (intern (concat cp "-nonascii-translation-table"))))
603 (set-language-environment (cp-language-for-codepage cp))
604 (set-default-coding-systems (intern (concat cp "-dos")))
605 (set-selection-coding-system (intern (concat cp "-dos")))
606 (set-terminal-coding-system
607 (setq default-terminal-coding-system (intern (concat cp
608 "-unix"))))
609 (IT-display-table-setup cp)
610 ;; It's time: too many input methods in leim/quail produce
611 ;; Unicode characters. Let the user see them.
612 (IT-setup-unicode-display)
613 (prefer-coding-system (intern (concat cp "-dos")))
614 (if default-enable-multibyte-characters
615 ;; We want this in multibyte version only, since unibyte version
616 ;; should not convert non-ASCII characters at all.
617 (setq unibyte-display-via-language-environment t)
618 ;; Let the unibyte version behave as Emacs 19 did. In particular,
619 ;; let it use and display native codepage-specific glyphs for
620 ;; non-ASCII characters. For this to work correctly, we need to
621 ;; establish the correspondence between lower-case letters and their
622 ;; upper-case brethren, as appropriate for the codepage in use. The
623 ;; code below makes this happen.
624 ;; (In the multibyte mode, the appropriate tables are prepared
625 ;; elsewhere, since multibyte Emacs uses normal MULE character sets,
626 ;; which are supported on all platforms.)
627 (let* ((i 128)
628 (modify (function
629 (lambda (ch sy)
630 (modify-syntax-entry ch sy text-mode-syntax-table)
631 (if (boundp 'tex-mode-syntax-table)
632 (modify-syntax-entry ch sy tex-mode-syntax-table))
633 (modify-syntax-entry ch sy (standard-syntax-table))
635 (table (standard-case-table))
636 ;; The following are strings of letters, first lower then
637 ;; upper case. This will look funny on terminals which
638 ;; display other code pages. In particular, what is
639 ;; displayed as blanks or triangles are not what they
640 ;; look like at all! (Use `C-x =' to see what they
641 ;; really are.)
642 (chars
643 (cond
644 ((= codepage 850)
645 "‡€�š‚�ƒ¶„Ž…·†�ÆÇ µˆÒ‰ÓŠÔ‹ØŒ×�Þ¡Ö‘’“â”™•ã¢à›�–ê£é—ë˜Yìí¡I£é¤¥ÐÑçè")
646 ((= codepage 865)
647 "‡€�š‚�ƒA„Ž…A†�ˆE‰EŠE‹IŒI�I‘’“O”™•O–U£U˜Y›� A¡I¢O£U¤¥")
648 ;; default is 437
649 (t "‡€�š‚�ƒA„Ž…A†�ˆE‰EŠE‹IŒI�I‘’“O”™•O–U£U˜Y A¡I¢O£U¤¥"))))
651 (while (< i 256)
652 (funcall modify i "_")
653 (setq i (1+ i)))
655 (setq i 0)
656 (while (< i (length chars))
657 (let ((ch1 (aref chars i))
658 (ch2 (aref chars (1+ i))))
659 (if (> ch2 127)
660 (set-case-syntax-pair ch2 ch1 table))
661 (setq i (+ i 2))))
662 (save-excursion
663 (mapcar (lambda (b) (set-buffer b) (set-case-table table))
664 (buffer-list)))
665 (set-standard-case-table table)))
666 ;; Some codepages have sporadic support for Latin-1, Greek, and
667 ;; symbol glyphs, which don't belong to their native character
668 ;; set. It's a nuisance to have all those glyphs here, for all
669 ;; the codepages (for starters, I don't even have references for
670 ;; all the codepages). So I provide a hook for those who want to
671 ;; squeeze every bit of support out of their terminal/font.
672 (run-hooks 'dos-codepage-setup-hook)
675 (defvar cjk-codepages-alist
676 '((932 "Japanese" japanese-shift-jis)
677 (950 "Chinese-BIG5" cn-big5)
678 (936 "Chinese-GB" cn-gb-2312)
679 (949 "Korean" euc-kr))
680 "An alist of Far-Eastern codepages and the names of the associated
681 language and supported coding system.")
683 (defun dos-codepage-setup ()
684 "Set up the MULE environment as appropriate for the installed DOS codepage.
686 This function sets coding systems, display tables, and the language
687 environment options as appropriate for the current value of `dos-codepage'.
689 This function is automatically run at startup via the `term-setup-hook'
690 list. You can (and should) also run it whenever the value of
691 `dos-codepage' changes."
692 (interactive)
693 (let* ((desc (cdr (assq dos-codepage cjk-codepages-alist)))
694 (lang (car desc))
695 (coding (car (cdr desc)))
696 coding-dos coding-unix)
697 (if (null desc)
698 (dos-cpNNN-setup dos-codepage)
699 ;; We've got one of the Far-Eastern codepages which support
700 ;; MULE native coding systems directly.
701 (setq coding-dos (intern (format "%s-dos" coding))
702 coding-unix (intern (format "%s-unix" coding)))
703 (set-language-environment lang)
704 (set-selection-coding-system coding-dos)
705 (setq file-name-coding-system coding-unix)
706 (set-terminal-coding-system
707 (setq default-terminal-coding-system coding-unix))
708 ;; Assume they support non-ASCII Latin characters like the IBM
709 ;; codepage 437 does.
710 (IT-display-table-setup "cp437")
711 ;; It's time: too many input methods in leim/quail produce
712 ;; Unicode characters. Let the user see them.
713 (IT-setup-unicode-display)
714 (prefer-coding-system coding-dos)
715 (if default-enable-multibyte-characters
716 (setq unibyte-display-via-language-environment t))
719 ;; We want to delay the terminal and other codepage-related setup
720 ;; until after the terminal is set and user's .emacs is processed,
721 ;; because people might define their `dos-codepage-setup-hook' there.
722 (add-hook 'term-setup-hook 'dos-codepage-setup)
724 ;; In multibyte mode, we want unibyte buffers to be displayed using
725 ;; the terminal coding system, so that they display correctly on the
726 ;; DOS terminal; in unibyte mode we want to see all 8-bit characters
727 ;; verbatim. In both cases, we want the entire range of 8-bit
728 ;; characters to arrive at our display code verbatim.
729 (standard-display-8bit 127 255)
731 ;;; arch-tag: eea04c06-7311-4b5a-b531-3c1be1b070af
732 ;;; internal.el ends here