Mercurial > emacs
view lisp/international/encoded-kb.el @ 89905:37e044cc35f6
(Ffind_coding_systems_region_internal): Include raw-text and
no-conversion in the result.
author | Kenichi Handa <handa@m17n.org> |
---|---|
date | Wed, 14 Apr 2004 12:37:29 +0000 |
parents | f786eb22f54c |
children | 68c22ea6027c |
line wrap: on
line source
;;; encoded-kb.el --- handler to input multibyte characters encoded somehow

;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
;; Licensed to the Free Software Foundation.
;; Copyright (C) 2002 Free Software Foundation, Inc.
;; Copyright (C) 2003
;;   National Institute of Advanced Industrial Science and Technology (AIST)
;;   Registration Number H13PRO009

;; This file is part of GNU Emacs.

;; GNU Emacs is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 2, or (at your option)
;; any later version.

;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;; GNU General Public License for more details.

;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs; see the file COPYING.  If not, write to the
;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
;; Boston, MA 02111-1307, USA.

;;; Commentary:

;;; Code:

;; The keymap object itself is never replaced: `encoded-kbd-setup-keymap'
;; empties it in place with `setcdr' and then re-populates it for the
;; keyboard coding system in effect.
(defconst encoded-kbd-mode-map (make-sparse-keymap)
  "Keymap for Encoded-kbd minor mode.")

;; Subsidiary keymaps for handling ISO2022 escape sequences.
(defvar encoded-kbd-iso2022-esc-map
  (let ((keymap (make-sparse-keymap)))
    ;; `$' leads to the ESC $ sub-map; the other four keys are the
    ;; intermediate characters that lead to the designation sub-map.
    (define-key keymap "$" 'encoded-kbd-iso2022-esc-dollar-prefix)
    (dolist (intermediate '("(" ")" "," "-"))
      (define-key keymap intermediate
        'encoded-kbd-iso2022-designation-prefix))
    keymap)
  "Keymap for handling ESC code in Encoded-kbd mode.")
(fset 'encoded-kbd-iso2022-esc-prefix encoded-kbd-iso2022-esc-map)

(defvar encoded-kbd-iso2022-esc-dollar-map
  (let ((keymap (make-sparse-keymap)))
    ;; An intermediate character leads to the designation sub-map ...
    (dolist (intermediate '("(" ")" "," "-"))
      (define-key keymap intermediate
        'encoded-kbd-iso2022-designation-prefix))
    ;; ... while `@', `A' and `B' finish the designation directly.
    (dolist (final '("@" "A" "B"))
      (define-key keymap final 'encoded-kbd-iso2022-designation))
    keymap)
  "Keymap for handling ESC $ sequence in Encoded-kbd mode.")
(fset 'encoded-kbd-iso2022-esc-dollar-prefix
      encoded-kbd-iso2022-esc-dollar-map)

(defvar encoded-kbd-iso2022-designation-map
  (let ((keymap (make-sparse-keymap)))
    ;; Bind the final character of every charset in `charset-list'
    ;; that reports a positive ISO final character.
    (dolist (cs charset-list)
      (let ((final (charset-iso-final-char cs)))
        (when (> final 0)
          (define-key keymap (char-to-string final)
            'encoded-kbd-iso2022-designation))))
    keymap)
  "Keymap for handling ISO2022 designation sequence in Encoded-kbd mode.")
(fset 'encoded-kbd-iso2022-designation-prefix
      encoded-kbd-iso2022-designation-map)

(defvar encoded-kbd-iso2022-non-ascii-map
  (let ((keymap (make-keymap)))
    ;; Codes 32..127 (96 codes) are decoded as 7-bit ISO2022 bytes.
    (dotimes (offset 96)
      (define-key keymap (char-to-string (+ 32 offset))
        'encoded-kbd-self-insert-iso2022-7bit))
    (define-key keymap "\e" 'encoded-kbd-iso2022-esc-prefix)
    ;; Codes 160..255 (96 codes) go to the generic 8-bit handler.
    (dotimes (offset 96)
      (define-key keymap (vector (+ 160 offset))
        'encoded-kbd-handle-8bit))
    keymap)
  "Keymap for handling non-ASCII character set in Encoded-kbd mode.")

;; One of the
;; symbols `sjis', `iso2022-7', `iso2022-8', `big5', `ccl', `charset',
;; or `utf-8' to denote what kind of coding-system we are now handling
;; in Encoded-kbd mode.
(defvar encoded-kbd-coding nil)

;; Keep information of designation state of ISO2022 encoding.  When
;; Encoded-kbd mode is on, this is set to a vector of length 4, the
;; elements are character sets currently designated to graphic
;; registers 0 thru 3.

(defvar encoded-kbd-iso2022-designations nil)
(put 'encoded-kbd-iso2022-designations 'permanent-local t)

;; Keep information of invocation state of ISO2022 encoding.  When
;; Encoded-kbd mode is on, this is set to a vector of length 3,
;; graphic register numbers currently invoked to graphic plane 1 and
;; 2, and a single shifted graphic register number.

(defvar encoded-kbd-iso2022-invocations nil)
(put 'encoded-kbd-iso2022-invocations 'permanent-local t)

(defun encoded-kbd-iso2022-designation ()
  "Do ISO2022 designation according to the current key in Encoded-kbd mode.
The following key sequence may cause multilingual text insertion."
  (interactive)
  (let ((key-seq (this-command-keys))
        (prev-g0-charset (aref encoded-kbd-iso2022-designations
                               (aref encoded-kbd-iso2022-invocations 0)))
        intermediate-char final-char
        reg dimension chars charset)
    (if (= (length key-seq) 4)
        ;; ESC $ <intermediate-char> <final-char>
        (setq intermediate-char (aref key-seq 2)
              dimension 2
              chars (if (< intermediate-char ?,) 94 96)
              final-char (aref key-seq 3)
              reg (mod intermediate-char 4))
      (if (= (aref key-seq 1) ?$)
          ;; ESC $ <final-char>
          (setq dimension 2
                chars 94
                final-char (aref key-seq 2)
                reg 0)
        ;; ESC <intermediate-char> <final-char>
        (setq intermediate-char (aref key-seq 1)
              dimension 1
              chars (if (< intermediate-char ?,) 94 96)
              final-char (aref key-seq 2)
              reg (mod intermediate-char 4))))
    (if (setq charset (iso-charset dimension chars final-char))
        (aset encoded-kbd-iso2022-designations reg charset)
      (error "Character set of DIMENSION %s, CHARS %s, FINAL-CHAR `%c' is not supported"
             dimension chars final-char))

    (if (memq (aref encoded-kbd-iso2022-designations
                    (aref encoded-kbd-iso2022-invocations 0))
              '(ascii latin-jisx0201))
        ;; Graphic plane 0 (0x20..0x7f) is for ASCII.  We don't have
        ;; to handle characters in this range specially.
        (if (not (memq prev-g0-charset '(ascii latin-jisx0201)))
            ;; We must exit recursive edit now.
            (throw 'exit nil))
      ;; Graphic plane 0 is for non-ASCII.
      (if (memq prev-g0-charset '(ascii latin-jisx0201))
          ;; We must handle keys specially.
          (let ((overriding-local-map encoded-kbd-iso2022-non-ascii-map))
            (recursive-edit))))))

(defun encoded-kbd-handle-8bit ()
  "Handle an 8-bit character entered in Encoded-kbd mode."
  (interactive)
  (cond ((eq encoded-kbd-coding 'iso2022-7)
         (error "Can't handle the character code %d" last-command-char))

        ((eq encoded-kbd-coding 'iso2022-8)
         (cond ((= last-command-char ?\216)
                (aset encoded-kbd-iso2022-invocations 2 2))

               ((= last-command-char ?\217)
                (aset encoded-kbd-iso2022-invocations 2 3))

               ((>= last-command-char ?\240)
                (encoded-kbd-self-insert-iso2022-8bit 1))

               (t
                (error "Can't handle the character code %d"
                       last-command-char))))

        ((eq encoded-kbd-coding 'sjis)
         (encoded-kbd-self-insert-sjis))

        (t
         (encoded-kbd-self-insert-big5))))

(defun encoded-kbd-self-insert-iso2022-7bit ()
  "Decode the current key as a 7-bit ISO2022 byte and unread the character.
The charset is the one designated to the single-shifted register if
one is pending, else to the register invoked to graphic plane 0.
Unless the charset has dimension 1, one more byte is read from the
keyboard.  The pending single shift is cleared."
  (interactive)
  (let* ((charset (aref encoded-kbd-iso2022-designations
                        (or (aref encoded-kbd-iso2022-invocations 2)
                            (aref encoded-kbd-iso2022-invocations 0))))
         (char (if (= (charset-dimension charset) 1)
                   (make-char charset last-command-char)
                 (make-char charset last-command-char (read-char-exclusive)))))
    (aset encoded-kbd-iso2022-invocations 2 nil)
    (setq unread-command-events (cons char unread-command-events))))

(defun encoded-kbd-self-insert-iso2022-8bit (arg)
  "Decode the current key as an 8-bit ISO2022 byte and insert it ARG times.
The codes SS2 (0216) and SS3 (0217) only record a single shift to
graphic register 2 or 3.  Any other code is decoded with the charset
designated to the single-shifted register if one is pending, else to
the register invoked to graphic plane 1; unless that charset has
dimension 1, one more byte is read from the keyboard."
  (interactive "p")
  (cond
   ((= last-command-char ?\216)         ; SS2 (Single Shift 2)
    (aset encoded-kbd-iso2022-invocations 2 2))
   ((= last-command-char ?\217)         ; SS3 (Single Shift 3)
    (aset encoded-kbd-iso2022-invocations 2 3))
   (t
    (let* ((charset (aref encoded-kbd-iso2022-designations
                          (or (aref encoded-kbd-iso2022-invocations 2)
                              (aref encoded-kbd-iso2022-invocations 1))))
           (char (if (= (charset-dimension charset) 1)
                     (make-char charset last-command-char)
                   (make-char charset last-command-char
                              (read-char-exclusive)))))
      (aset encoded-kbd-iso2022-invocations 2 nil)
      ;; As simply setting unread-command-events may result in
      ;; infinite-loop for characters 160..255, this is a temporary
      ;; workaround until we found a better solution.
      (let ((last-command-char char))
        (self-insert-command arg))))))

(defun encoded-kbd-self-insert-sjis ()
  "Decode the current key as Shift-JIS and unread the resulting character.
Codes below 0xA0 or from 0xE0 upward are combined with one more byte
read from the keyboard and passed to `decode-sjis-char'; the codes in
between are taken as single-byte `katakana-jisx0201' characters."
  (interactive)
  (let ((char (if (or (< last-command-char ?\xA0) (>= last-command-char ?\xE0))
                  (decode-sjis-char (+ (ash last-command-char 8)
                                       (read-char-exclusive)))
                (make-char 'katakana-jisx0201 last-command-char))))
    (setq unread-command-events (cons char unread-command-events))))

(defun encoded-kbd-self-insert-big5 ()
  "Decode the current key plus one more byte as Big5 and unread the character."
  (interactive)
  (let ((char (decode-big5-char (+ (ash last-command-char 8)
                                   (read-char-exclusive)))))
    (setq unread-command-events (cons char unread-command-events))))

(defun encoded-kbd-self-insert-ccl ()
  "Decode the current key with the CCL decoder of the keyboard coding system.
Bytes are read from the keyboard and appended until the CCL program
produces a non-empty result; the decoded characters are then pushed
onto `unread-command-events'."
  (interactive)
  (let ((str (char-to-string last-command-char))
        (ccl (coding-system-get (keyboard-coding-system) :ccl-decoder))
        ;; Allocate the status vector afresh on every call.
        ;; `ccl-execute-on-string' stores the final register values
        ;; and IC into it, so a vector constant shared between calls
        ;; would make the next key start from stale CCL state.
        (vec (make-vector 9 nil))
        result)
    (while (= (length (setq result
                            (ccl-execute-on-string ccl vec str t)))
              0)
      ;; Each retry re-runs the program from scratch on the longer
      ;; string, so the status has to be cleared first.
      (dotimes (i 9) (aset vec i nil))
      (setq str (format "%s%c" str (read-char-exclusive))))
    (setq unread-command-events
          (append result unread-command-events))))

(defun encoded-kbd-self-insert-charset (arg)
  "Decode the current key in the keyboard coding system's charset.
The code point is decoded with the first charset of the coding
system's `:charset-list' and the character is inserted ARG times.
Signal an error if the code point cannot be decoded."
  (interactive "p")
  (let* ((charset-list
          (coding-system-get (keyboard-coding-system) :charset-list))
         (charset (car charset-list))
         ;; For the moment, we can assume that the length of CHARSET-LIST
         ;; is 1, and the dimension of CHARSET is 1.
         (c (decode-char charset last-command-char)))
    (unless c
      (error "Can't decode the code point %d by %s"
             last-command-char charset))
    ;; As simply setting unread-command-events may result in
    ;; infinite-loop for characters 160..255, this is a temporary
    ;; workaround until we found a better solution.
    (let ((last-command-char c))
      (self-insert-command arg))))

(defun encoded-kbd-self-insert-utf-8 (arg)
  "Decode a UTF-8 sequence led by the current key and insert it ARG times.
The number of trailing bytes to read from the keyboard (1 to 4) and
the payload bits of the leading byte are chosen from the value of the
leading byte; six bits are taken from each trailing byte."
  (interactive "p")
  (let (len ch)
    (cond ((< last-command-char #xE0)
           (setq len 1 ch (logand last-command-char #x1F)))
          ((< last-command-char #xF0)
           (setq len 2 ch (logand last-command-char #x0F)))
          ((< last-command-char #xF8)
           (setq len 3 ch (logand last-command-char #x07)))
          (t
           (setq len 4 ch 0)))
    (while (> len 0)
      (setq ch (logior (lsh ch 6) (logand (read-char-exclusive) #x3F))
            len (1- len)))
    (let ((last-command-char ch))
      (self-insert-command arg))))

(defun encoded-kbd-setup-keymap (coding)
  "Rebuild `encoded-kbd-mode-map' for the keyboard coding system CODING.
Which keys get bound is selected by the variable `encoded-kbd-coding';
CODING is consulted only for its `:charset-list' and `:valid'
properties.  Signal an error for an unknown `encoded-kbd-coding'."
  ;; At first, reset the keymap.
  (setcdr encoded-kbd-mode-map nil)
  ;; Then setup the keymap according to the keyboard coding system.
  (cond
   ((eq encoded-kbd-coding 'charset)
    (let* ((charset (car (coding-system-get coding :charset-list)))
           (code-space (get-charset-property charset :code-space))
           ;; Never rebind codes below 128.
           (from (max (aref code-space 0) 128))
           (to (aref code-space 1)))
      (while (<= from to)
        (define-key encoded-kbd-mode-map
          (vector from) 'encoded-kbd-self-insert-charset)
        (setq from (1+ from)))))

   ((eq encoded-kbd-coding 'sjis)
    (let ((i 128))
      (while (< i 256)
        (define-key encoded-kbd-mode-map
          (vector i) 'encoded-kbd-self-insert-sjis)
        (setq i (1+ i)))))

   ((eq encoded-kbd-coding 'big5)
    (let ((i 161))
      (while (< i 255)
        (define-key encoded-kbd-mode-map
          (vector i) 'encoded-kbd-self-insert-big5)
        (setq i (1+ i)))))

   ((eq encoded-kbd-coding 'iso2022-7)
    (define-key encoded-kbd-mode-map "\e" 'encoded-kbd-iso2022-esc-prefix))

   ((eq encoded-kbd-coding 'iso2022-8)
    (define-key encoded-kbd-mode-map
      (vector ?\216) 'encoded-kbd-self-insert-iso2022-8bit)
    (define-key encoded-kbd-mode-map
      (vector ?\217) 'encoded-kbd-self-insert-iso2022-8bit)
    (let ((i 160))
      (while (< i 256)
        (define-key encoded-kbd-mode-map
          (vector i) 'encoded-kbd-self-insert-iso2022-8bit)
        (setq i (1+ i)))))

   ((eq encoded-kbd-coding 'ccl)
    (let ((valid-codes (or (coding-system-get coding :valid)
                           '((128 . 255))))
          elt from to)
      (while valid-codes
        (setq elt (car valid-codes) valid-codes (cdr valid-codes))
        ;; An element is either a (FROM . TO) range or a single code.
        (if (consp elt)
            (setq from (car elt) to (cdr elt))
          (setq from (setq to elt)))
        (while (<= from to)
          (if (>= from 128)
              (define-key encoded-kbd-mode-map
                (vector from) 'encoded-kbd-self-insert-ccl))
          (setq from (1+ from))))))

   ((eq encoded-kbd-coding 'utf-8)
    (let ((i #xC0))
      (while (< i 256)
        (define-key encoded-kbd-mode-map
          (vector i) 'encoded-kbd-self-insert-utf-8)
        (setq i (1+ i)))))

   (t
    (error "Invalid value in encoded-kbd-coding: %s" encoded-kbd-coding))))


;; Input mode at the time Encoded-kbd mode is turned on is saved here.
(defvar saved-input-mode nil)

(put 'encoded-kbd-mode 'permanent-local t)
;;;###autoload
(define-minor-mode encoded-kbd-mode
  "Toggle Encoded-kbd minor mode.
With arg, turn Encoded-kbd mode on if and only if arg is positive.

You should not turn this mode on manually, instead use the command
\\[set-keyboard-coding-system] which turns on or off this mode
automatically.

In Encoded-kbd mode, a text sent from keyboard is accepted
as a multilingual text encoded in a coding system set by
\\[set-keyboard-coding-system]."
  :global t
  ;; We must at first reset input-mode to the original.
  (if saved-input-mode (apply 'set-input-mode saved-input-mode))
  (if encoded-kbd-mode
      (let ((coding (keyboard-coding-system)))
        (setq saved-input-mode (current-input-mode))
        (cond ((null coding)
               (setq encoded-kbd-mode nil)
               (error "No coding system for keyboard input is set"))

              ((eq (coding-system-type coding) 'shift-jis)
               (set-input-mode
                (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                'use-8th-bit (nth 3 saved-input-mode))
               (setq encoded-kbd-coding 'sjis))

              ((eq (coding-system-type coding) 'iso-2022)
               (if (memq '7-bit (coding-system-get coding :flags))
                   (setq encoded-kbd-coding 'iso2022-7)
                 (set-input-mode
                  (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                  'use-8th-bit (nth 3 saved-input-mode))
                 (setq encoded-kbd-coding 'iso2022-8))
               ;; Work on a private vector: `encoded-kbd-iso2022-designation'
               ;; modifies it with `aset', which must not alter the
               ;; coding system's own `:designation' property.  An
               ;; element of that property may also be a list of
               ;; charsets (the first one is taken) or something that
               ;; is not a charset at all (recorded as nil).
               (let ((designation (coding-system-get coding :designation)))
                 (setq encoded-kbd-iso2022-designations (make-vector 4 nil))
                 (dotimes (i 4)
                   (let ((elt (aref designation i)))
                     (cond ((null elt))
                           ((charsetp elt)
                            (aset encoded-kbd-iso2022-designations i elt))
                           ((charsetp (car-safe elt))
                            (aset encoded-kbd-iso2022-designations
                                  i (car elt)))))))
               (setq encoded-kbd-iso2022-invocations (make-vector 3 nil))
               (aset encoded-kbd-iso2022-invocations 0 0)
               (aset encoded-kbd-iso2022-invocations 1 1))

              ((eq (coding-system-type coding) 'big5)
               (set-input-mode
                (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                'use-8th-bit (nth 3 saved-input-mode))
               (setq encoded-kbd-coding 'big5))

              ((eq (coding-system-type coding) 'ccl)
               (set-input-mode
                (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                'use-8th-bit (nth 3 saved-input-mode))
               (setq encoded-kbd-coding 'ccl))

              ;; Only a single charset of dimension 1 is supported.
              ((and (eq (coding-system-type coding) 'charset)
                    (let* ((charset-list (coding-system-get coding
                                                            :charset-list))
                           (charset (car charset-list)))
                      (and (= (length charset-list) 1)
                           (= (charset-dimension charset) 1))))
               (set-input-mode
                (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                'use-8th-bit (nth 3 saved-input-mode))
               (setq encoded-kbd-coding 'charset))

              ((eq (coding-system-type coding) 'utf-8)
               (set-input-mode
                (nth 0 saved-input-mode) (nth 1 saved-input-mode)
                'use-8th-bit (nth 3 saved-input-mode))
               (setq encoded-kbd-coding 'utf-8))

              (t
               (setq encoded-kbd-mode nil)
               (error "Coding-system `%s' is not supported in Encoded-kbd mode"
                      (keyboard-coding-system))))
        (encoded-kbd-setup-keymap coding))))

(provide 'encoded-kb)

;;; encoded-kb.el ends here