]> code.delx.au - gnu-emacs/blob - lisp/language/european.el
("Latin-8", "Latin-9"): Add input methods,
[gnu-emacs] / lisp / language / european.el
1 ;;; european.el --- European languages -*- coding: iso-2022-7bit; -*-
2
3 ;; Copyright (C) 1995, 1997 Electrotechnical Laboratory, JAPAN.
4 ;; Licensed to the Free Software Foundation.
5
6 ;; Keywords: multilingual, European
7
8 ;; This file is part of GNU Emacs.
9
10 ;; GNU Emacs is free software; you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation; either version 2, or (at your option)
13 ;; any later version.
14
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
19
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs; see the file COPYING. If not, write to the
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
23 ;; Boston, MA 02111-1307, USA.
24
25 ;;; Commentary:
26
27 ;; For Europeans, character sets ISO8859-1,2,3,4,9,14,15 are supported.
28
29 ;;; Code:
30
31 ;; Latin-1 (ISO-8859-1)
32
33 (make-coding-system ; define the 8-bit coding system for Latin-1
34 'iso-latin-1 2 ?1 ; name, type 2 (docstring: ISO 2022 based), mnemonic character
35 "ISO 2022 based 8-bit encoding for Latin-1 (MIME:ISO-8859-1)"
36 '(ascii latin-iso8859-1 nil nil ; first four slots: ascii, latin-iso8859-1, two unused
37 nil nil nil nil nil nil nil nil nil nil nil nil t) ; positional flags, only the last is set -- NOTE(review): confirm its meaning in the `make-coding-system' docstring
38 '((safe-charsets ascii latin-iso8859-1) ; properties: the safe charsets ...
39 (mime-charset . iso-8859-1))) ; ... and the MIME charset name
40
41 (define-coding-system-alias 'iso-8859-1 'iso-latin-1) ; alternative names for `iso-latin-1'
42 (define-coding-system-alias 'latin-1 'iso-latin-1)
43
44 (make-coding-system ; define the coding system used between X clients (see docstring)
45 'compound-text 2 ?1 ; same type and mnemonic character as `iso-latin-1'
46 "ISO 2022 based encoding used in inter client communication of X"
47 '((ascii t) (latin-iso8859-1 katakana-jisx0201 t) nil nil ; first two slots are lists here, last two unused
48 nil ascii-eol ascii-cntl nil nil nil nil nil nil nil nil nil t) ; positional flags -- NOTE(review): confirm slot meanings in the `make-coding-system' docstring
49 '((safe-charsets . t))) ; safe-charsets is t rather than an explicit list
50
51 (define-coding-system-alias 'ctext 'compound-text) ; short alternative name
52
53 (set-language-info-alist ; register the generic "Latin-1" language environment
54 "Latin-1" '((charset . (ascii latin-iso8859-1))
55 (coding-system . (iso-latin-1))
56 (coding-priority . (iso-latin-1))
57 (nonascii-translation . latin-iso8859-1)
58 (unibyte-syntax . "latin-1")
59 (unibyte-display . iso-latin-1)
60 (input-method . "latin-1-prefix") ; default input method
61 (sample-text .
62 "Hello, Hej, Tere, Hei, Bonjour, Gr\e,A|_\e(B Gott, Ciao, \e,A!\e(BHola!")
63 (documentation . "\
64 This language environment is a generic one for the Latin-1 (ISO-8859-1)
65 character set which supports the following European languages:
66 Albanian, Basque, Breton, Catalan, Danish, Dutch, English, Faeroese,
67 Finnish, French (with restrictions -- see Latin-9), Frisian, Galician,
68 German, Greenlandic, Icelandic, Irish Gaelic (new orthography),
69 Italian, Latin, Luxemburgish, Norwegian, Portuguese, Rhaeto-Romanic,
70 Scottish Gaelic, Spanish, and Swedish.
71 We also have a German specific language environment \"German\".
72
73 Latin-1 also covers several written languages outside Europe, including
74 Indonesian/Malay, Tagalog (Philippines), Swahili and Afrikaans."))
75 '("European")) ; grouped with the other European environments
76
77 \f
78 ;; Latin-2 (ISO-8859-2)
79
80 (make-coding-system ; define the 8-bit coding system for Latin-2
81 'iso-latin-2 2 ?2 ; name, type 2 (docstring: ISO 2022 based), mnemonic character
82 "ISO 2022 based 8-bit encoding (MIME:ISO-8859-2)"
83 '(ascii latin-iso8859-2 nil nil ; first four slots: ascii, latin-iso8859-2, two unused
84 nil nil nil nil nil nil nil) ; remaining positional flags are all nil
85 '((safe-charsets ascii latin-iso8859-2) ; properties: the safe charsets ...
86 (mime-charset . iso-8859-2))) ; ... and the MIME charset name
87
88 (define-coding-system-alias 'iso-8859-2 'iso-latin-2) ; alternative names for `iso-latin-2'
89 (define-coding-system-alias 'latin-2 'iso-latin-2)
90
91 (set-language-info-alist ; register the generic "Latin-2" language environment
92 "Latin-2" '((charset . (ascii latin-iso8859-2))
93 (coding-system . (iso-latin-2))
94 (coding-priority . (iso-latin-2))
95 (nonascii-translation . latin-iso8859-2)
96 (unibyte-syntax . "latin-2")
97 (unibyte-display . iso-latin-2)
98 (input-method . "latin-2-prefix") ; default input method
99 (documentation . "\
100 This language environment is a generic one for the Latin-2 (ISO-8859-2)
101 character set which supports the following languages:
102 Albanian, Czech, English, German, Hungarian, Polish, Romanian,
103 Serbo-Croatian or Croatian, Slovak, Slovene, Sorbian (upper and lower),
104 and Swedish.
105 We also have specific language environments for the following languages:
106 For Czech, \"Czech\".
107 For Romanian, \"Romanian\".
108 For Slovak, \"Slovak\"."))
109 '("European")) ; grouped with the other European environments
110
111 \f
112 ;; Latin-3 (ISO-8859-3)
113
114 (make-coding-system ; define the 8-bit coding system for Latin-3
115 'iso-latin-3 2 ?3 ; name, type 2 (docstring: ISO 2022 based), mnemonic character
116 "ISO 2022 based 8-bit encoding (MIME:ISO-8859-3)"
117 '(ascii latin-iso8859-3 nil nil ; first four slots: ascii, latin-iso8859-3, two unused
118 nil nil nil nil nil nil nil) ; remaining positional flags are all nil
119 '((safe-charsets ascii latin-iso8859-3) ; properties: the safe charsets ...
120 (mime-charset . iso-8859-3))) ; ... and the MIME charset name
121
122 (define-coding-system-alias 'iso-8859-3 'iso-latin-3) ; alternative names for `iso-latin-3'
123 (define-coding-system-alias 'latin-3 'iso-latin-3)
124
125 (set-language-info-alist ; register the generic "Latin-3" language environment
126 "Latin-3" '((charset . (ascii latin-iso8859-3))
127 (coding-system . (iso-latin-3))
128 (coding-priority . (iso-latin-3))
129 (nonascii-translation . latin-iso8859-3)
130 (unibyte-syntax . "latin-3")
131 (unibyte-display . iso-latin-3)
132 (input-method . "latin-3-prefix") ; default input method
133 (documentation . "\
134 These languages are supported with the Latin-3 (ISO-8859-3) character set:
135 Afrikaans, Catalan, Dutch, English, Esperanto, French, Galician,
136 German, Italian, Maltese, Spanish, and Turkish."))
137 '("European")) ; grouped with the other European environments
138
139 \f
140 ;; Latin-4 (ISO-8859-4)
141
142 (make-coding-system ; define the 8-bit coding system for Latin-4
143 'iso-latin-4 2 ?4 ; name, type 2 (docstring: ISO 2022 based), mnemonic character
144 "ISO 2022 based 8-bit encoding (MIME:ISO-8859-4)"
145 '(ascii latin-iso8859-4 nil nil ; first four slots: ascii, latin-iso8859-4, two unused
146 nil nil nil nil nil nil nil) ; remaining positional flags are all nil
147 '((safe-charsets ascii latin-iso8859-4) ; properties: the safe charsets ...
148 (mime-charset . iso-8859-4))) ; ... and the MIME charset name
149
150 (define-coding-system-alias 'iso-8859-4 'iso-latin-4) ; alternative names for `iso-latin-4'
151 (define-coding-system-alias 'latin-4 'iso-latin-4)
152
153 (set-language-info-alist ; register the generic "Latin-4" language environment
154 "Latin-4" '((charset . (ascii latin-iso8859-4))
155 (coding-system . (iso-8859-4)) ; `iso-8859-4' is an alias of `iso-latin-4'
156 (coding-priority . (iso-8859-4))
157 (nonascii-translation . latin-iso8859-4)
158 (unibyte-syntax . "latin-4")
159 (unibyte-display . iso-8859-4)
160 (input-method . "latin-4-prefix") ; default input method
161 (documentation . "\
162 These languages are supported with the Latin-4 (ISO-8859-4) character set:
163 Danish, English, Estonian, Finnish, German, Greenlandic, Lappish,
164 Latvian, Lithuanian, and Norwegian."))
165 '("European")) ; grouped with the other European environments
166
167 \f
168 ;; Latin-5 (ISO-8859-9)
169
170 (make-coding-system ; define the 8-bit coding system for Latin-5
171 'iso-latin-5 2 ?9 ; name, type 2 (docstring: ISO 2022 based), mnemonic character (9 as in 8859-9)
172 "ISO 2022 based 8-bit encoding (MIME:ISO-8859-9)"
173 '(ascii latin-iso8859-9 nil nil ; first four slots: ascii, latin-iso8859-9, two unused
174 nil nil nil nil nil nil nil) ; remaining positional flags are all nil
175 '((safe-charsets ascii latin-iso8859-9) ; properties: the safe charsets ...
176 (mime-charset . iso-8859-9))) ; ... and the MIME charset name
177
178 (define-coding-system-alias 'iso-8859-9 'iso-latin-5) ; alternative names for `iso-latin-5'
179 (define-coding-system-alias 'latin-5 'iso-latin-5)
180
181 (set-language-info-alist ; register the generic "Latin-5" language environment
182 "Latin-5" '((charset ascii latin-iso8859-9) ; ISO-8859-9 is the character set used for Turkish
183 (coding-system iso-latin-5)
184 (coding-priority iso-latin-5)
185 (nonascii-translation . latin-iso8859-9)
186 (unibyte-syntax . "latin-5")
187 (unibyte-display . iso-latin-5)
188 (input-method . "latin-5-prefix") ; default input method
189 (documentation . "\
190 This language environment is a generic one for the Latin-5 (ISO-8859-9)
191 character set which supports Turkish.
192 We also have a Turkish specific language environment \"Turkish\"."))
193 '("European")) ; grouped with the other European environments
194
195 \f
196 ;; Latin-8 (ISO-8859-14)
197
198 (make-coding-system ; define the 8-bit coding system for Latin-8
199 'iso-latin-8 2 ?W ; `W' for `Welsh', since `C'
200 ; for `Celtic' is taken.
201 "ISO 2022 based 8-bit encoding for Latin-8 (MIME:ISO-8859-14)"
202 '(ascii latin-iso8859-14 nil nil ; first four slots: ascii, latin-iso8859-14, two unused
203 nil nil nil nil nil nil nil nil nil nil nil nil t) ; positional flags, only the last is set -- NOTE(review): confirm its meaning in the `make-coding-system' docstring
204 '((safe-charsets ascii latin-iso8859-14) ; properties: the safe charsets ...
205 (mime-charset . iso-8859-14))) ; ... and the MIME charset name
206
207 (define-coding-system-alias 'iso-8859-14 'iso-latin-8) ; alternative names for `iso-latin-8'
208 (define-coding-system-alias 'latin-8 'iso-latin-8)
209
210 (set-language-info-alist ; register the generic "Latin-8" language environment
211 "Latin-8" '((charset . (ascii latin-iso8859-14))
212 (coding-system . (iso-latin-8))
213 (coding-priority . (iso-latin-8))
214 (nonascii-translation . latin-iso8859-14)
215 (unibyte-syntax . "latin-8")
216 (unibyte-display . iso-latin-8)
217 (input-method . "latin-8-prefix") ; default input method
218 ;; Fixme: Welsh/Ga{e}lic greetings
219 (sample-text . "\e,_"\e(B \e,_p\e(B \e,_^\e(B")
220 (documentation . "\
221 This language environment is a generic one for the Latin-8 (ISO-8859-14)
222 character set which supports the Celtic languages, including those not
223 covered by other ISO-8859 character sets: Welsh, Manx Gaelic and
224 Irish Gaelic (old orthography)."))
225 '("European")) ; grouped with the other European environments
226 \f
227 ;; Latin-9 (ISO-8859-15)
228
229 (make-coding-system ; define the 8-bit coding system for Latin-9
230 'iso-latin-9 2 ?0 ; `0' for `Latin-0'
231 "ISO 2022 based 8-bit encoding for Latin-9 (MIME:ISO-8859-15)"
232 '(ascii latin-iso8859-15 nil nil ; first four slots: ascii, latin-iso8859-15, two unused
233 nil nil nil nil nil nil nil nil nil nil nil nil t) ; positional flags, only the last is set -- NOTE(review): confirm its meaning in the `make-coding-system' docstring
234 '((safe-charsets ascii latin-iso8859-15) ; properties: the safe charsets ...
235 (mime-charset . iso-8859-15))) ; ... and the MIME charset name
236
237 (define-coding-system-alias 'iso-8859-15 'iso-latin-9) ; alternative names for `iso-latin-9'
238 (define-coding-system-alias 'latin-9 'iso-latin-9)
239 (define-coding-system-alias 'latin-0 'iso-latin-9) ; the `Latin-0' nickname
240
241 (set-language-info-alist ; register the generic "Latin-9" language environment
242 "Latin-9" '((charset . (ascii latin-iso8859-15))
243 (coding-system . (iso-latin-9))
244 (coding-priority . (iso-latin-9))
245 (nonascii-translation . latin-iso8859-15)
246 (unibyte-syntax . "latin-9")
247 (unibyte-display . iso-latin-9)
248 (input-method . "latin-9-prefix") ; default input method
249 (sample-text .
250 "AVE. \e,b&(48<=>\e(B \e,b$\e(B")
251 (documentation . "\
252 This language environment is a generic one for the Latin-9 (ISO-8859-15)
253 character set which supports the same languages as Latin-1 with the
254 addition of the Euro sign and some additional French and Finnish letters.
255 Latin-9 is sometimes nicknamed `Latin-0'."))
256 '("European")) ; grouped with the other European environments
257 \f
258 (set-language-info-alist ; register the "German" variant of the Latin-1 environment
259 "German" '((tutorial . "TUTORIAL.de")
260 (charset ascii latin-iso8859-1)
261 (coding-system iso-latin-1)
262 (coding-priority iso-latin-1)
263 (input-method . "german-postfix") ; the one intended difference from "Latin-1"
264 (nonascii-translation . latin-iso8859-1) ; a charset, as in every other environment, not the coding system `iso-latin-1'
265 (unibyte-syntax . "latin-1")
266 (unibyte-display . iso-latin-1)
267 (sample-text . "\
268 German (Deutsch Nord) Guten Tag
269 German (Deutsch S\e,A|\e(Bd) Gr\e,A|_\e(B Gott")
270 (documentation . "\
271 This language environment is almost the same as Latin-1,
272 but default input method is set to \"german-postfix\"."))
273 '("European")) ; grouped with the other European environments
274
275 (set-language-info-alist ; register the "Slovenian" language environment (Latin-2 based)
276 "Slovenian" '((charset ascii latin-iso8859-2)
277 (coding-system iso-8859-2) ; `iso-8859-2' is an alias of `iso-latin-2'
278 (coding-priority iso-8859-2)
279 (nonascii-translation . latin-iso8859-2)
280 (input-method . "latin-2-postfix") ; default input method
281 (unibyte-syntax . "latin-2")
282 (unibyte-display . iso-8859-2)
283 (tutorial . "TUTORIAL.sl")
284 (sample-text . "\e,B.\e(Belimo vam uspe\e,B9\e(Ben dan!")
285 (documentation . t))
286 '("European")) ; grouped with the other European environments
287
288 ;; For Turkish, the character set ISO-8859-9 (Latin-5) is used. But,
289 ;; before the introduction of ISO-8859-9 in 1988, ISO-8859-3 (Latin-3)
290 ;; was used for Turkish. Those who use Latin-3 for Turkish should use
291 ;; "Latin-3" language environment.
292
293 (set-language-info-alist ; register the "Turkish" language environment (Latin-5 based)
294 "Turkish" '((charset ascii latin-iso8859-9)
295 (coding-system iso-latin-5)
296 (coding-priority iso-latin-5)
297 (nonascii-translation . latin-iso8859-9)
298 (unibyte-syntax . "latin-5") (unibyte-display . iso-latin-5)
299 (input-method . "turkish-postfix") ; default input method
300 (sample-text . "Turkish (T\e,M|\e(Brk\e,Mg\e(Be) Merhaba")
301 (documentation . t))
302 '("European")) ; same "European" group argument as every other environment in this file
303
304 ;; Polish ISO 8859-2 environment.
305 ;; Maintainer: Wlodek Bzyl <matwb@univ.gda.pl>
306 ;; Keywords: multilingual, Polish
307
308 (set-language-info-alist ; register the "Polish" language environment (Latin-2 based)
309 "Polish" '((charset ascii latin-iso8859-2)
310 (coding-system iso-8859-2) ; `iso-8859-2' is an alias of `iso-latin-2'
311 (coding-priority iso-8859-2)
312 (input-method . "polish-slash") ; default input method
313 (nonascii-translation . latin-iso8859-2)
314 (unibyte-syntax . "latin-2")
315 (unibyte-display . iso-8859-2)
316 (tutorial . "TUTORIAL.pl")
317 (sample-text . "\e,B1!fFjJ3#qQsS6&?/<,\e(B")
318 (documentation . t))
319 '("European")) ; grouped with the other European environments
320
321 (provide 'european) ; announce the `european' feature
322
323 ;;; european.el ends here