(case table): Do nothing special for i and I.

[gnu-emacs] / lisp / international / characters.el
diff --git a/lisp/international/characters.el b/lisp/international/characters.el

index 77eb49807c01ed659a1c74a42ed698b4fde5e0dd..3522b57d5d9bd2947a540a2d2cdfa4dc3eec7df2 100644 (file)
--- a/lisp/international/characters.el
+++ b/lisp/international/characters.el
@@ -1,8 +1,10 @@
  ;;; characters.el --- set syntax and category for multibyte characters
  
-;; Copyright (C) 1995, 1997 Electrotechnical Laboratory, JAPAN.
-;; Licensed to the Free Software Foundation.
-;; Copyright (C) 2001, 2002 Free Software Foundation, Inc.
+;; Copyright (C) 1997, 2000, 2001, 2002, 2003, 2004
+;;   Free Software Foundation, Inc.
+;; Copyright (C) 1995, 1997, 1998, 1999, 2000, 2001, 2003, 2004, 2005
+;;   National Institute of Advanced Industrial Science and Technology (AIST)
+;;   Registration Number H14PRO021
  
  ;; Keywords: multibyte character, character set, syntax, category
  
@@ -20,8 +22,8 @@
  
  ;; You should have received a copy of the GNU General Public License
  ;; along with GNU Emacs; see the file COPYING.  If not, write to the
-;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
-;; Boston, MA 02111-1307, USA.
+;; Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
+;; Boston, MA 02110-1301, USA.
  
  ;;; Commentary:
  
@@ -175,6 +177,17 @@
      (modify-category-entry (make-char 'chinese-gb2312 row) ?C)
      (setq row (1+ row))))
  
+(let ((case-tbl (standard-case-table))) ; each call below: UPPER, LOWER, table
+  (dotimes (n 26)                       ; row #x23: cells #x41.. <-> #x61..
+    (set-case-syntax-pair (make-char 'chinese-gb2312 #x23 (+ n #x41))
+                         (make-char 'chinese-gb2312 #x23 (+ n #x61)) case-tbl))
+  (dotimes (n 24)                       ; row #x26: cells #x21.. <-> #x41..
+    (set-case-syntax-pair (make-char 'chinese-gb2312 #x26 (+ n #x21))
+                         (make-char 'chinese-gb2312 #x26 (+ n #x41)) case-tbl))
+  (dotimes (n 33)                       ; row #x27: cells #x21.. <-> #x51..
+    (set-case-syntax-pair (make-char 'chinese-gb2312 #x27 (+ n #x21))
+                         (make-char 'chinese-gb2312 #x27 (+ n #x51)) case-tbl)))
+
  ;; Chinese character set (BIG5)
  
  (let ((from (decode-big5-char #xA141))
@@ -215,6 +228,17 @@
    (modify-category-entry generic-big5-1-char ?\|)
    (modify-category-entry generic-big5-2-char ?\|))
  
+(let ((tbl (standard-case-table)))      ; each call below: UPPER, LOWER, table
+  (dotimes (i 22)                       ; #xA2CF..#xA2E4 <-> #xA2E9..#xA2FE
+    (set-case-syntax-pair (decode-big5-char (+ #xA2CF i))
+                         (decode-big5-char (+ #xA2CF i 26)) tbl))
+  (dotimes (i 4)                        ; #xA2E5..#xA2E8 <-> #xA340..#xA343
+    (set-case-syntax-pair (decode-big5-char (+ #xA2E5 i)) ; resume at #xA2CF+22
+                         (decode-big5-char (+ #xA340 i)) tbl))
+  (dotimes (i 24)                       ; #xA344..#xA35B <-> #xA35C..#xA373
+    (set-case-syntax-pair (decode-big5-char (+ #xA344 i))
+                         (decode-big5-char (+ #xA344 i 24)) tbl)))
+
  
  ;; Chinese character set (CNS11643)
  
@@ -627,6 +651,17 @@
      (modify-category-entry (car chars) ?C)
      (setq chars (cdr chars))))
  
+(let ((case-tbl (standard-case-table))) ; each call below: UPPER, LOWER, table
+  (dotimes (n 26)                       ; row #x23: cells #x41.. <-> #x61..
+    (set-case-syntax-pair (make-char 'japanese-jisx0208 #x23 (+ n #x41))
+                         (make-char 'japanese-jisx0208 #x23 (+ n #x61)) case-tbl))
+  (dotimes (n 24)                       ; row #x26: cells #x21.. <-> #x41..
+    (set-case-syntax-pair (make-char 'japanese-jisx0208 #x26 (+ n #x21))
+                         (make-char 'japanese-jisx0208 #x26 (+ n #x41)) case-tbl))
+  (dotimes (n 33)                       ; row #x27: cells #x21.. <-> #x51..
+    (set-case-syntax-pair (make-char 'japanese-jisx0208 #x27 (+ n #x21))
+                         (make-char 'japanese-jisx0208 #x27 (+ n #x51)) case-tbl)))
+
  ;; JISX0212
  ;; (modify-syntax-entry (make-char 'japanese-jisx0212) "w")
  (modify-syntax-entry (make-char 'japanese-jisx0212 33) "_")
@@ -672,6 +707,20 @@
      (modify-syntax-entry open (format "(%c" close))
      (modify-syntax-entry close (format ")%c" open))))
  
+(let ((tbl (standard-case-table)))      ; each call below: UPPER, LOWER, table
+  (dotimes (i 26)                       ; row #x23: cells #x41.. <-> #x61..
+    (set-case-syntax-pair (make-char 'korean-ksc5601 #x23 (+ #x41 i))
+                         (make-char 'korean-ksc5601 #x23 (+ #x61 i)) tbl))
+  (dotimes (i 10)                       ; Roman numerals: capitals #x30.., small #x21..
+    (set-case-syntax-pair (make-char 'korean-ksc5601 #x25 (+ #x30 i))
+                         (make-char 'korean-ksc5601 #x25 (+ #x21 i)) tbl))
+  (dotimes (i 24)                       ; row #x25: cells #x41.. <-> #x61..
+    (set-case-syntax-pair (make-char 'korean-ksc5601 #x25 (+ #x41 i))
+                         (make-char 'korean-ksc5601 #x25 (+ #x61 i)) tbl))
+  (dotimes (i 33)                       ; row #x2C: cells #x21.. <-> #x51..
+    (set-case-syntax-pair (make-char 'korean-ksc5601 #x2C (+ #x21 i))
+                         (make-char 'korean-ksc5601 #x2C (+ #x51 i)) tbl)))
+
  ;; Latin character set (latin-1,2,3,4,5,8,9)
  
  (modify-category-entry (make-char 'latin-iso8859-1) ?l)
@@ -863,12 +912,6 @@
  
  (let ((tbl (standard-case-table)) c)
  
-;; In some languages, U+0049 LATIN CAPITAL LETTER I and U+0131 LATIN
-;; SMALL LETTER DOTLESS I make a case pair, and so do U+0130 LATIN
-;; CAPITAL LETTER I WITH DOT ABOVE and U+0069 LATIN SMALL LETTER I.
-;; Thus we have to check language-environment to handle casing
-;; correctly.  Currently only I<->i is available.
-
    ;; Latin Extended-A, Latin Extended-B
    (setq c #x0100)
    (while (<= c #x0233)
@@ -884,8 +927,20 @@
          (set-case-syntax-pair
           (decode-char 'ucs (1- c)) (decode-char 'ucs c) tbl))
      (setq c (1+ c)))
-  (set-downcase-syntax  ?\e$,1 P\e(B ?i tbl)
-  (set-upcase-syntax    ?I ?\e$,1 Q\e(B tbl)
+
+
+  ;; In some languages, such as Turkish, U+0049 LATIN CAPITAL LETTER I
+  ;; and U+0131 LATIN SMALL LETTER DOTLESS I make a case pair, and so
+  ;; do U+0130 LATIN CAPITAL LETTER I WITH DOT ABOVE and U+0069 LATIN
+  ;; SMALL LETTER I.
+
+  ;; We used to set up half of those correspondences unconditionally,
+  ;; but that makes searches slow.  So now we don't set up either half
+  ;; of these correspondences by default.
+
+  ;;  (set-downcase-syntax  ?\e$,1 P\e(B ?i tbl)
+  ;;  (set-upcase-syntax    ?I ?\e$,1 Q\e(B tbl)
+
    (set-case-syntax-pair ?\e$,1 R\e(B ?\e$,1 S\e(B tbl)
    (set-case-syntax-pair ?\e$,1 T\e(B ?\e$,1 U\e(B tbl)
    (set-case-syntax-pair ?\e$,1 V\e(B ?\e$,1 W\e(B tbl)
@@ -1209,7 +1264,10 @@
  ;;; Setting word boundary.
  
  (setq word-combining-categories
-      '((?l . ?l)))
+      '((?l . ?l)
+       (?C . ?C)
+       (?C . ?H)
+       (?C . ?K)))
  
  (setq word-separating-categories       ;  (2-byte character sets)
        '((?A . ?K)                      ; Alpha numeric - Katakana