1 ;;; japanese.el --- support for Japanese -*- coding: iso-2022-7bit; no-byte-compile: t -*-
3 ;; Copyright (C) 1997, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008
4 ;; Free Software Foundation, Inc.
5 ;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
6 ;; 2005, 2006, 2007, 2008
7 ;; National Institute of Advanced Industrial Science and Technology (AIST)
8 ;; Registration Number H14PRO021
10 ;; National Institute of Advanced Industrial Science and Technology (AIST)
11 ;; Registration Number H13PRO009
13 ;; Keywords: multilingual, Japanese
15 ;; This file is part of GNU Emacs.
17 ;; GNU Emacs is free software: you can redistribute it and/or modify
18 ;; it under the terms of the GNU General Public License as published by
19 ;; the Free Software Foundation, either version 3 of the License, or
20 ;; (at your option) any later version.
22 ;; GNU Emacs is distributed in the hope that it will be useful,
23 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
24 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
25 ;; GNU General Public License for more details.
27 ;; You should have received a copy of the GNU General Public License
28 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
32 ;; For Japanese, character sets JISX0201, JISX0208, JISX0212 are
37 ;;; Load translation tables for CP932.
38 (load "international/cp51932")
39 (load "international/eucjp-ms")
41 (define-coding-system 'iso-2022-jp
42 "ISO 2022 based 7bit encoding for Japanese (MIME:ISO-2022-JP)."
43 :coding-type
'iso-2022
45 :designation
[(ascii japanese-jisx0208-1978 japanese-jisx0208
48 :flags
'(short ascii-at-eol ascii-at-cntl
7-bit designation
)
49 :charset-list
'(ascii japanese-jisx0208
50 japanese-jisx0208-1978 latin-jisx0201
)
51 :mime-charset
'iso-2022-jp
52 :suitable-for-keyboard t
)
54 (define-coding-system-alias 'junet
'iso-2022-jp
)
56 (define-coding-system 'iso-2022-jp-2
57 "ISO 2022 based 7bit encoding for CJK, Latin-1, Greek (MIME:ISO-2022-JP-2)."
58 :coding-type
'iso-2022
60 :designation
[(ascii japanese-jisx0208-1978 japanese-jisx0208
61 latin-jisx0201 japanese-jisx0212
62 chinese-gb2312 korean-ksc5601
)
64 (nil latin-iso8859-1 greek-iso8859-7
)
66 :flags
'(short ascii-at-eol ascii-at-cntl
7-bit designation single-shift
68 :charset-list
'(ascii japanese-jisx0208 japanese-jisx0212
69 latin-jisx0201 japanese-jisx0208-1978
70 chinese-gb2312 korean-ksc5601
71 latin-iso8859-1 greek-iso8859-7
)
72 :mime-charset
'iso-2022-jp-2
73 :suitable-for-keyboard t
)
75 (let ((map ; JIS vs CP932
76 '((#x301C .
#xFF5E
) ; WAVE DASH FULLWIDTH TILDE
77 (#x2014 .
#x2015
) ; EM DASH HORIZONTAL BAR
78 (#x2016 .
#x2225
) ; DOUBLE VERTICAL LINE PARALLEL TO
79 (#x2212 .
#xFF0D
) ; MINUS SIGN FULLWIDTH HYPHEN-MINUS
80 (#x00A2 .
#xFFE0
) ; CENT SIGN FULLWIDTH CENT SIGN
81 (#x00A3 .
#xFFE1
) ; POUND SIGN FULLWIDTH POUND SIGN
82 (#x00AC .
#xFFE2
) ; NOT SIGN FULLWIDTH NOT SIGN
83 (#x00A6 .
#xFFE4
) ; BROKEN LINE FULLWIDTH BROKEN LINE
85 (define-translation-table 'japanese-ucs-jis-to-cp932-map map
)
86 (mapc #'(lambda (x) (let ((tmp (car x
)))
87 (setcar x
(cdr x
)) (setcdr x tmp
)))
89 (define-translation-table 'japanese-ucs-cp932-to-jis-map map
))
91 ;; U+2014 (EM DASH) vs U+2015 (HORIZONTAL BAR)
92 (define-translation-table 'japanese-ucs-glibc-to-jis-map
'((#x2015 .
#x2014
)))
93 (define-translation-table 'japanese-ucs-jis-to-glibc-map
'((#x2014 .
#x2015
)))
95 (define-coding-system 'japanese-shift-jis
96 "Shift-JIS 8-bit encoding for Japanese (MIME:SHIFT_JIS)"
97 :coding-type
'shift-jis
99 :charset-list
'(ascii katakana-jisx0201 japanese-jisx0208
)
100 :mime-charset
'shift_jis
)
102 (define-coding-system-alias 'shift_jis
'japanese-shift-jis
)
103 (define-coding-system-alias 'sjis
'japanese-shift-jis
)
104 (define-coding-system-alias 'cp932
'japanese-shift-jis
)
106 (define-coding-system 'japanese-cp932
107 "CP932 (Microsoft shift-jis)"
108 :coding-type
'charset
110 :charset-list
'(ascii katakana-sjis cp932-2-byte
))
112 (define-coding-system-alias 'cp932
'japanese-cp932
)
114 (define-coding-system 'japanese-iso-7bit-1978-irv
115 "ISO 2022 based 7-bit encoding for Japanese JISX0208-1978 and JISX0201-Roman."
116 :coding-type
'iso-2022
118 :designation
[(latin-jisx0201 japanese-jisx0208-1978 japanese-jisx0208
119 japanese-jisx0212 katakana-jisx0201
)
121 :flags
'(short ascii-at-eol ascii-at-cntl
7-bit designation
122 use-roman use-oldjis
)
123 :charset-list
'(ascii latin-jisx0201 japanese-jisx0208-1978 japanese-jisx0208
126 (define-coding-system-alias 'iso-2022-jp-1978-irv
'japanese-iso-7bit-1978-irv
)
127 (define-coding-system-alias 'old-jis
'japanese-iso-7bit-1978-irv
)
129 (define-coding-system 'japanese-iso-8bit
130 "ISO 2022 based EUC encoding for Japanese (MIME:EUC-JP)."
131 :coding-type
'iso-2022
133 :designation
[ascii japanese-jisx0208 katakana-jisx0201 japanese-jisx0212
]
134 :flags
'(short ascii-at-eol ascii-at-cntl single-shift
)
135 :charset-list
'(ascii latin-jisx0201 japanese-jisx0208
136 katakana-jisx0201 japanese-jisx0212
137 japanese-jisx0208-1978
)
138 :mime-charset
'euc-jp
)
140 (define-coding-system-alias 'euc-japan-1990
'japanese-iso-8bit
)
141 (define-coding-system-alias 'euc-japan
'japanese-iso-8bit
)
142 (define-coding-system-alias 'euc-jp
'japanese-iso-8bit
)
144 (define-coding-system 'eucjp-ms
145 "eucJP-ms (like EUC-JP but with CP932 extension).
146 eucJP-ms is defined in <http://www.opengroup.or.jp/jvc/cde/appendix.html>."
147 :coding-type
'iso-2022
149 :designation
[ascii japanese-jisx0208 katakana-jisx0201 japanese-jisx0212
]
150 :flags
'(short ascii-at-eol ascii-at-cntl single-shift
)
151 :charset-list
'(ascii latin-jisx0201 japanese-jisx0208
152 katakana-jisx0201 japanese-jisx0212
)
153 :decode-translation-table
'eucjp-ms-decode
154 :encode-translation-table
'eucjp-ms-encode
)
156 (define-coding-system 'iso-2022-jp-2004
157 "ISO 2022 based 7bit encoding for JIS X 0213:2004 (MIME:ISO-2022-JP-2004)."
158 :coding-type
'iso-2022
160 :designation
[(ascii japanese-jisx0208 japanese-jisx0213.2004-
1
161 japanese-jisx0213-1 japanese-jisx0213-2
)
163 :flags
'(short ascii-at-eol ascii-at-cntl
7-bit designation
)
165 :charset-list
'(ascii japanese-jisx0208 japanese-jisx0213.2004-
1
166 japanese-jisx0213-1 japanese-jisx0213-2
)
167 :mime-charset
'iso-2022-jp-2004
168 :suitable-for-keyboard t
)
170 (define-coding-system-alias 'iso-2022-jp-3
'iso-2022-jp-2004
)
172 (define-coding-system 'euc-jis-2004
173 "ISO 2022 based EUC encoding for JIS X 0213 (MIME:EUC-JIS-2004)."
174 :coding-type
'iso-2022
176 :designation
[ascii japanese-jisx0213.2004-
1 katakana-jisx0201
178 :flags
'(short ascii-at-eol ascii-at-cntl single-shift
)
179 :charset-list
'(ascii latin-jisx0201 japanese-jisx0213.2004-
1
180 japanese-jisx0213-1 katakana-jisx0201
182 :mime-charset
'euc-jis-2004
)
184 (define-coding-system-alias 'euc-jisx0213
'euc-jis-2004
)
186 (define-coding-system 'japanese-shift-jis-2004
187 "Shift_JIS 8-bit encodinf for Japanese (MIME:SHIFT_JIS-2004)"
188 :coding-type
'shift-jis
190 :charset-list
'(ascii katakana-jisx0201
191 japanese-jisx0213.2004-
1 japanese-jisx0213-2
))
193 (define-coding-system-alias 'shift_jis-2004
'japanese-shift-jis-2004
)
195 (set-language-info-alist
196 "Japanese" '((setup-function . setup-japanese-environment-internal
)
197 (exit-function . use-default-char-width-table
)
198 (iso639-language . ja
)
199 (tutorial .
"TUTORIAL.ja")
200 (charset japanese-jisx0208
201 japanese-jisx0212 latin-jisx0201 katakana-jisx0201
202 japanese-jisx0213.2004-
1 japanese-jisx0213-1
203 japanese-jisx0213-2 japanese-jisx0208-1978
)
204 (coding-system iso-2022-jp japanese-iso-8bit
205 japanese-shift-jis japanese-iso-7bit-1978-irv
206 iso-2022-jp-2004 japanese-shift-jis-2004
208 (coding-priority iso-2022-jp japanese-iso-8bit
210 iso-2022-jp-2004 euc-jis-2004
211 japanese-shift-jis-2004
213 (input-method .
"japanese")
214 (features japan-util
)
215 (sample-text .
"Japanese (\e$BF|K\8l\e(B) \e$B$3$s$K$A$O\e(B, \e(I:]FAJ\e(B")
216 (documentation . t
)))
219 ;; JISX0213-1 vs Unicode
220 '((#x2477 .
[#x304B
#x309A
])
221 (#x2478 .
[#x304D
#x309A
])
222 (#x2479 .
[#x304F
#x309A
])
223 (#x247a .
[#x3051
#x309A
])
224 (#x247b .
[#x3053
#x309A
])
225 (#x2577 .
[#x30AB
#x309A
])
226 (#x2578 .
[#x30AD
#x309A
])
227 (#x2579 .
[#x30AF
#x309A
])
228 (#x257a .
[#x30B1
#x309A
])
229 (#x257b .
[#x30B3
#x309A
])
230 (#x257c .
[#x30BB
#x309A
])
231 (#x257d .
[#x30C4
#x309A
])
232 (#x257e .
[#x30C8
#x309A
])
233 (#x2678 .
[#x31F7
#x309A
])
234 (#x2b44 .
[#x00E6
#x0300
])
235 (#x2b48 .
[#x0254
#x0300
])
236 (#x2b49 .
[#x0254
#x0301
])
237 (#x2b4a .
[#x028C
#x0300
])
238 (#x2b4b .
[#x028C
#x0301
])
239 (#x2b4c .
[#x0259
#x0300
])
240 (#x2b4d .
[#x0259
#x0301
])
241 (#x2b4e .
[#x025A
#x0300
])
242 (#x2b4f .
[#x025A
#x0301
])
243 (#x2b65 .
[#x02E9
#x02E5
])
244 (#x2b66 .
[#x02E5
#x02E9
])))
247 (setcar elt
(decode-char 'japanese-jisx0213-1
(car elt
))))
248 (setq table
(make-translation-table-from-alist map
))
249 (define-translation-table 'jisx0213-to-unicode table
)
250 (define-translation-table 'unicode-to-jisx0213
251 (char-table-extra-slot table
0)))
255 ;; arch-tag: 450f5537-9d53-4d5e-b731-4cf116d8cbc9
256 ;;; japanese.el ends here