]> code.delx.au - gnu-emacs/blob - lisp/language/chinese.el
Split XEmacs/Emacs definitions and sample setup code into separate files
[gnu-emacs] / lisp / language / chinese.el
1 ;;; chinese.el --- support for Chinese -*- coding: iso-2022-7bit; -*-
2
3 ;; Copyright (C) 2001, 2002, 2003, 2004, 2005, 2006
4 ;; Free Software Foundation, Inc.
5 ;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
6 ;; 2005, 2006
7 ;; National Institute of Advanced Industrial Science and Technology (AIST)
8 ;; Registration Number H14PRO021
9 ;; Copyright (C) 2003
10 ;; National Institute of Advanced Industrial Science and Technology (AIST)
11 ;; Registration Number H13PRO009
12
13 ;; Keywords: multilingual, Chinese
14
15 ;; This file is part of GNU Emacs.
16
17 ;; GNU Emacs is free software; you can redistribute it and/or modify
18 ;; it under the terms of the GNU General Public License as published by
19 ;; the Free Software Foundation; either version 2, or (at your option)
20 ;; any later version.
21
22 ;; GNU Emacs is distributed in the hope that it will be useful,
23 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
24 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
25 ;; GNU General Public License for more details.
26
27 ;; You should have received a copy of the GNU General Public License
28 ;; along with GNU Emacs; see the file COPYING. If not, write to the
29 ;; Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
30 ;; Boston, MA 02110-1301, USA.
31
32 ;;; Commentary:
33
34 ;; For Chinese, three character sets GB2312, BIG5, and CNS11643 are
35 ;; supported.
36
37 ;;; Code:
38
39 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
40 ;;; Chinese (general)
41 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
42
43
44 (define-coding-system 'iso-2022-cn
45 "ISO 2022 based 7bit encoding for Chinese GB and CNS (MIME:ISO-2022-CN)."
46 :coding-type 'iso-2022
47 :mnemonic ?C
48 :charset-list '(ascii chinese-gb2312 chinese-cns11643-1 chinese-cns11643-2)
49 :designation [ascii
50 (nil chinese-gb2312 chinese-cns11643-1)
51 (nil chinese-cns11643-2)
52 nil]
53 :flags '(ascii-at-eol ascii-at-cntl 7-bit
54 designation locking-shift single-shift init-at-bol)
55 :mime-charset 'iso-2022-cn
56 :suitable-for-keyboard t)
57
58 (define-coding-system-alias 'chinese-iso-7bit 'iso-2022-cn)
59
60 (define-coding-system 'iso-2022-cn-ext
61 "ISO 2022 based 7bit encoding for Chinese GB and CNS (MIME:ISO-2022-CN-EXT)."
62 :coding-type 'iso-2022
63 :mnemonic ?C
64 :charset-list '(ascii
65 chinese-gb2312 chinese-cns11643-1
66 chinese-cns11643-2 chinese-cns11643-3 chinese-cns11643-4
67 chinese-cns11643-5 chinese-cns11643-6 chinese-cns11643-7)
68 :designation '[ascii
69 (nil chinese-gb2312 chinese-cns11643-1)
70 (nil chinese-cns11643-2)
71 (nil chinese-cns11643-3 chinese-cns11643-4 chinese-cns11643-5
72 chinese-cns11643-6 chinese-cns11643-7)]
73 :flags '(ascii-at-eol ascii-at-cntl 7-bit
74 designation locking-shift single-shift init-at-bol)
75 :mime-charset 'iso-2022-cn-ext
76 :suitable-for-keyboard t)
77
78 \f
79 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
80 ;;; Chinese GB2312 (simplified)
81 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
82
83 (define-coding-system 'chinese-iso-8bit
84 "ISO 2022 based EUC encoding for Chinese GB2312 (MIME:GB2312)."
85 :coding-type 'iso-2022
86 :mnemonic ?c
87 :charset-list '(ascii chinese-gb2312)
88 :designation [ascii chinese-gb2312 nil nil]
89 :mime-charset 'gb2312)
90
91 (define-coding-system-alias 'cn-gb-2312 'chinese-iso-8bit)
92 (define-coding-system-alias 'euc-china 'chinese-iso-8bit)
93 (define-coding-system-alias 'euc-cn 'chinese-iso-8bit)
94 (define-coding-system-alias 'cn-gb 'chinese-iso-8bit)
95 (define-coding-system-alias 'gb2312 'chinese-iso-8bit)
96 (define-coding-system-alias 'cp936 'chinese-iso-8bit)
97
98 (define-coding-system 'chinese-hz
99 "Hz/ZW 7-bit encoding for Chinese GB2312 (MIME:HZ-GB-2312)."
100 :coding-type 'utf-8
101 :mnemonic ?z
102 :charset-list '(ascii chinese-gb2312)
103 :mime-charset 'hz-gb-2312
104 :post-read-conversion 'post-read-decode-hz
105 :pre-write-conversion 'pre-write-encode-hz)
106
107 (define-coding-system-alias 'hz-gb-2312 'chinese-hz)
108 (define-coding-system-alias 'hz 'chinese-hz)
109
110 (set-language-info-alist
111 "Chinese-GB" '((charset chinese-gb2312 chinese-sisheng)
112 (coding-system chinese-iso-8bit iso-2022-cn chinese-hz)
113 (coding-priority chinese-iso-8bit chinese-big5 iso-2022-cn)
114 (input-method . "chinese-py-punct")
115 (features china-util)
116 (sample-text . "Chinese (\e$AVPND\e(B,\e$AFUM(;0\e(B,\e$A::So\e(B) \e$ADc:C\e(B")
117 (documentation . "Support for Chinese GB2312 character set.")
118 (tutorial . "TUTORIAL.cn"))
119 '("Chinese"))
120
121 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
122 ;; Chinese BIG5 (traditional)
123 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
124
125 (define-coding-system 'chinese-big5
126 "BIG5 8-bit encoding for Chinese (MIME:Big5)"
127 :coding-type 'charset
128 :mnemonic ?B
129 :charset-list '(ascii big5)
130 :mime-charset 'big5)
131
132 (define-coding-system-alias 'big5 'chinese-big5)
133 (define-coding-system-alias 'cn-big5 'chinese-big5)
134 (define-coding-system-alias 'cp950 'chinese-big5)
135
136 (set-language-info-alist
137 "Chinese-BIG5" '((charset chinese-big5-1 chinese-big5-2)
138 (coding-system chinese-big5 chinese-iso-7bit)
139 (coding-priority chinese-big5 iso-2022-cn chinese-iso-8bit)
140 (input-method . "chinese-py-punct-b5")
141 (ctext-non-standard-encodings "big5-0")
142 (features china-util)
143 (sample-text . "Cantonese (\e$(Gemk#\e(B,\e$(Gl]N)fc\e(B) \e$ATg3?\e(B, \e$ADc:C\e(B")
144 (documentation . "Support for Chinese Big5 character set.")
145 (tutorial . "TUTORIAL.zh"))
146 '("Chinese"))
147
148 (define-coding-system 'chinese-big5-hkscs
149 "BIG5-HKSCS 8-bit encoding for Chinese, Hong Kong supplement (MIME:Big5-HKSCS)"
150 :coding-type 'charset
151 :mnemonic ?B
152 :charset-list '(ascii big5-hkscs)
153 :mime-charset 'big5-hkscs)
154 (define-coding-system-alias 'big5-hkscs 'chinese-big5-hkscs)
155 (define-coding-system-alias 'cn-big5-hkscs 'chinese-big5-hkscs)
156
157 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
158 ;; Chinese CNS11643 (traditional)
159 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
160
161 (define-coding-system 'euc-tw
162 "ISO 2022 based EUC encoding for Chinese CNS11643."
163 :coding-type 'iso-2022
164 :mnemonic ?Z
165 :charset-list '(ascii
166 chinese-cns11643-1
167 chinese-cns11643-2
168 chinese-cns11643-3
169 chinese-cns11643-4
170 chinese-cns11643-5
171 chinese-cns11643-6
172 chinese-cns11643-7)
173 :designation [ascii chinese-cns11643-1 (chinese-cns11643-1
174 chinese-cns11643-2
175 chinese-cns11643-3
176 chinese-cns11643-4
177 chinese-cns11643-5
178 chinese-cns11643-6
179 chinese-cns11643-7) nil]
180 :mime-charset 'euc-tw)
181
182 (define-coding-system-alias 'euc-taiwan 'euc-tw)
183
184 (set-language-info-alist
185 "Chinese-CNS" '((charset chinese-cns11643-1 chinese-cns11643-2
186 chinese-cns11643-3 chinese-cns11643-4
187 chinese-cns11643-5 chinese-cns11643-6
188 chinese-cns11643-7)
189 (coding-system iso-2022-cn euc-tw)
190 (coding-priority iso-2022-cn euc-tw chinese-big5
191 chinese-iso-8bit)
192 (features china-util)
193 (input-method . "chinese-cns-quick")
194 ;; Fixme: presumably it won't accept big5 now.
195 (documentation . "\
196 Support for Chinese CNS character sets. Note that the EUC-TW coding system
197 accepts Big5 for input also (which is then converted to CNS)."))
198 '("Chinese"))
199
200 (set-language-info-alist
201 "Chinese-EUC-TW" '((charset chinese-cns11643-1 chinese-cns11643-2
202 chinese-cns11643-3 chinese-cns11643-4
203 chinese-cns11643-5 chinese-cns11643-6
204 chinese-cns11643-7 chinese-big5-1 chinese-big5-2)
205 (coding-system euc-tw iso-2022-cn)
206 (coding-priority euc-tw chinese-big5 iso-2022-cn
207 chinese-iso-8bit)
208 (features china-util)
209 (input-method . "chinese-cns-quick")
210 (documentation . "\
211 Support for Chinese, prefering the EUC-TW character set. Note that
212 the EUC-TW coding system accepts Big5 for input also (which is then
213 converted to CNS)."))
214 '("Chinese"))
215
216
217 ;;; Chinese GBK
218
219 (define-coding-system 'chinese-gbk
220 "GBK encoding for Chinese (MIME:GBK)."
221 :coding-type 'charset
222 :mnemonic ?c
223 :charset-list '(ascii chinese-gbk)
224 :mime-charset 'gbk)
225 (define-coding-system-alias 'gbk 'chinese-gbk)
226 (define-coding-system-alias 'cp936 'chinese-gbk)
227 (define-coding-system-alias 'windows-936 'chinese-gbk)
228
229 (set-language-info-alist
230 "Chinese-GBK" '((charset chinese-gbk)
231 (coding-system chinese-gbk)
232 (coding-priority gbk iso-2022-cn chinese-big5
233 chinese-iso-8bit) ; fixme?
234 (ctext-non-standard-encodings "gbk-0")
235 (input-method . "chinese-py-punct") ; fixme?
236 (sample-text . "Chinese (\e$BCfJ8\e(B,\e$BIaDL\e$A;0\e(B,\e$A::So\e(B) \e$(D95\e$B9%\e(B")
237 (features china-util)
238 (documentation . "Support for Chinese GBK character set.")
239 (tutorial . "TUTORIAL.cn"))
240 '("Chinese"))
241
242 ;;; Chinese GB18030
243
244 (define-coding-system 'chinese-gb18030
245 "GB18030 encoding for Chinese (MIME:GB18030)."
246 :coding-type 'charset
247 :mnemonic ?c
248 :charset-list '(ascii gb18030-2-byte
249 gb18030-4-byte-bmp gb18030-4-byte-smp
250 gb18030-4-byte-ext-1 gb18030-4-byte-ext-2)
251 :mime-charset 'gb18030)
252
253 (define-coding-system-alias 'gb18030 'chinese-gb18030)
254
255 (set-language-info-alist
256 "Chinese-GB18030" '((charset gb18030)
257 (coding-system chinese-gb18030)
258 (coding-priority gb18030 gbk iso-2022-cn chinese-big5
259 chinese-iso-8bit) ; fixme?
260 (input-method . "chinese-py-punct") ; fixme?
261 (sample-text . "Chinese (\e$BCfJ8\e(B,\e$BIaDL\e$A;0\e(B,\e$A::So\e(B) \e$(D0_\e$B9%\e(B")
262 (features china-util)
263 (documentation
264 . "Support for Chinese GB18030 character set.")
265 (tutorial . "TUTORIAL.cn"))
266 '("Chinese"))
267
268 ;; Fixme: add HKSCS
269
270 (provide 'chinese)
271
272 ;;; arch-tag: b82fcf7a-84f6-4e0b-b38c-1742dac0e09f
273 ;;; chinese.el ends here