mule-cmds.el 55.7 KB
Newer Older
Karl Heuer's avatar
Karl Heuer committed
1 2 3
;;; mule-cmds.el --- Commands for multilingual environment

;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
Richard M. Stallman's avatar
Richard M. Stallman committed
4
;; Licensed to the Free Software Foundation.
Karl Heuer's avatar
Karl Heuer committed
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20

;; Keywords: mule, multilingual

;; This file is part of GNU Emacs.

;; GNU Emacs is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 2, or (at your option)
;; any later version.

;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;; GNU General Public License for more details.

;; You should have received a copy of the GNU General Public License
Karl Heuer's avatar
Karl Heuer committed
21 22 23
;; along with GNU Emacs; see the file COPYING.  If not, write to the
;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
;; Boston, MA 02111-1307, USA.
Karl Heuer's avatar
Karl Heuer committed
24 25 26 27 28

;;; Code:

;;; MULE related key bindings and menus.

Richard M. Stallman's avatar
Richard M. Stallman committed
29
(defvar mule-keymap (make-sparse-keymap)
  "Prefix keymap holding the MULE (Multilingual environment) commands.")

;; Keep "C-x C-m ..." for mule specific commands.
(define-key ctl-x-map "\C-m" mule-keymap)

;; Bindings below the "C-x C-m" prefix, written as (KEY . COMMAND)
;; pairs and installed in the order listed.
(let ((bindings '(("f" . set-buffer-file-coding-system)
                  ("t" . set-terminal-coding-system)
                  ("k" . set-keyboard-coding-system)
                  ("p" . set-buffer-process-coding-system)
                  ("x" . set-selection-coding-system)
                  ("X" . set-next-selection-coding-system)
                  ("\C-\\" . set-input-method)
                  ("c" . universal-coding-system-argument)
                  ("l" . set-language-environment))))
  (while bindings
    (define-key mule-keymap (car (car bindings)) (cdr (car bindings)))
    (setq bindings (cdr bindings))))

;; Help commands for language environments, input methods and coding
;; systems, again written as (KEY . COMMAND) pairs.
(let ((bindings '(("\C-L" . describe-language-environment)
                  ("L" . describe-language-environment)
                  ("\C-\\" . describe-input-method)
                  ("I" . describe-input-method)
                  ("C" . describe-coding-system)
                  ("h" . view-hello-file))))
  (while bindings
    (define-key help-map (car (car bindings)) (cdr (car bindings)))
    (setq bindings (cdr bindings))))

Richard M. Stallman's avatar
Richard M. Stallman committed
52
(defvar mule-menu-keymap (make-sparse-keymap "Mule")
  "Menu keymap listing the MULE (Multilingual environment) commands.")

;; Install the "Mule" entry in the menu bar.  Its :visible form is
;; the variable `default-enable-multibyte-characters'.
(define-key global-map [menu-bar mule]
  (list 'menu-item "Mule" mule-menu-keymap
        :visible 'default-enable-multibyte-characters))

;; Register `mule' at the front of `menu-bar-final-items'.
(setq menu-bar-final-items (cons 'mule menu-bar-final-items))

61 62
;; Keymap of the "Describe Language Environment" submenu of the Mule menu.
(defvar describe-language-environment-map
  (make-sparse-keymap "Describe Language Environment"))
63

64 65
;; Keymap of the "Set Language Environment" submenu of the Mule menu.
(defvar setup-language-environment-map
  (make-sparse-keymap "Set Language Environment"))
66

67 68
;; Keymap of the "Set Coding System" submenu of the Mule menu.
(defvar set-coding-system-map
  (make-sparse-keymap "Set Coding System"))
69

70
;; Entries of the Mule menu, written as (EVENT . BINDING) pairs in the
;; order they are appended to the end of the menu.
(let ((items
       (list
        (cons 'describe-language-environment
              (cons "Describe Language Environment"
                    describe-language-environment-map))
        (cons 'set-language-environment
              (cons "Set Language Environment"
                    setup-language-environment-map))
        '(mouse-set-font "Set Font/Fontset" . mouse-set-font)
        '(separator-mule "--")
        '(toggle-input-method "Toggle Input Method" . toggle-input-method)
        '(set-input-method "Select Input Method" . set-input-method)
        '(describe-input-method "Describe Input Method" . describe-input-method)
        '(separator-input-method "--")
        '(describe-coding-system "Describe Coding Systems" . describe-coding-system)
        (cons 'set-various-coding-system
              (cons "Set Coding System" set-coding-system-map))
        '(separator-coding-system "--")
        '(mule-diag "Show All of MULE Status" . mule-diag)
        '(view-hello-file "Show Script Examples" . view-hello-file))))
  (while items
    (define-key-after mule-menu-keymap (vector (car (car items)))
      (cdr (car items))
      t)
    (setq items (cdr items))))

;; Entries of the "Set Coding System" submenu, in the same format.
(let ((items
       '((set-buffer-file-coding-system
          "Buffer File" . set-buffer-file-coding-system)
         (universal-coding-system-argument
          "Next Command" . universal-coding-system-argument)
         (set-terminal-coding-system
          "Terminal" . set-terminal-coding-system)
         (set-keyboard-coding-system
          "Keyboard" . set-keyboard-coding-system)
         (set-buffer-process-coding-system
          "Buffer Process" . set-buffer-process-coding-system)
         (set-selection-coding-system
          "X Selection" . set-selection-coding-system)
         (set-next-selection-coding-system
          "Next X Selection" . set-next-selection-coding-system))))
  (while items
    (define-key-after set-coding-system-map (vector (car (car items)))
      (cdr (car items))
      t)
    (setq items (cdr items))))

;; The "Default" entry of the Set Language Environment menu.
(define-key setup-language-environment-map
  [Default] '("Default" . setup-specified-language-environment))
Karl Heuer's avatar
Karl Heuer committed
133

134
;; The terminal and keyboard coding systems are meaningless when
;; running under X and W32.
(let ((commands '(set-terminal-coding-system set-keyboard-coding-system)))
  (while commands
    (put (car commands) 'menu-enable
         '(or (not window-system) (eq window-system 'pc)))
    (setq commands (cdr commands))))

;; This is meaningless when the current buffer has no process.
(put 'set-buffer-process-coding-system 'menu-enable
     '(get-buffer-process (current-buffer)))

;; The selection coding systems are meaningless when running under
;; terminal.
(let ((commands '(set-selection-coding-system
                  set-next-selection-coding-system)))
  (while commands
    (put (car commands) 'menu-enable 'window-system)
    (setq commands (cdr commands))))
Karl Heuer's avatar
Karl Heuer committed
147 148 149 150 151 152 153 154 155

;; The input method toggle should be a single character key binding
;; because users type it very frequently while editing multilingual
;; text.  Only two such keys are currently available: "\C-\\" and
;; "\C-^", and the latter is not convenient because it requires
;; shifting on most keyboards.  An alternative would be "\C-\]", which
;; is now bound to `abort-recursive-edit', a command that won't be
;; used that frequently.
(define-key global-map "\C-\\" 'toggle-input-method)

156 157 158 159
;;; This is no good because people often type Shift-SPC
;;; meaning to type SPC.  -- rms.
;;; ;; Here's an alternative key binding for X users (Shift-SPACE).
;;; (define-key global-map [?\S- ] 'toggle-input-method)
160

Karl Heuer's avatar
Karl Heuer committed
161
(defun toggle-enable-multibyte-characters (&optional arg)
  "Change whether this buffer uses multibyte characters.
With no arg, toggle the current setting.
With arg, use multibyte characters if the arg is positive.

Note that this command does not convert the byte contents of
the buffer; it only changes the way those bytes are interpreted.
In general, therefore, this command *changes* the sequence of
characters that the current buffer contains.

We suggest you avoid using this command unless you know what you
are doing.  If you use it by mistake, and the buffer is now displayed
wrong, use this command again to toggle back to the right mode."
  (interactive "P")
  (set-buffer-multibyte
   (cond (arg (> (prefix-numeric-value arg) 0))
         (t (not enable-multibyte-characters))))
  (force-mode-line-update))

(defun view-hello-file ()
  "Display the HELLO file, which lists many languages and characters.
The file is looked up in `data-directory' and visited read-only."
  (interactive)
  ;; The file has to be decoded whatever the current environment is,
  ;; so force multibyte buffers and the coding system used to read it.
  (let ((coding-system-for-read 'iso-2022-7bit)
        (default-enable-multibyte-characters t))
    (find-file-read-only (expand-file-name "HELLO" data-directory))))
Karl Heuer's avatar
Karl Heuer committed
187

188 189 190
(defun universal-coding-system-argument ()
  "Execute an I/O command using the specified coding system.
Read a coding system in the minibuffer, then read a key sequence and
call the command it is bound to interactively, with both
`coding-system-for-read' and `coding-system-for-write' bound to that
coding system.

The default offered is `buffer-file-coding-system', unless that is nil
or its `coding-system-type' is t."
  (interactive)
  (let* ((default (and buffer-file-coding-system
                       (not (eq (coding-system-type buffer-file-coding-system)
                                t))
                       buffer-file-coding-system))
         (coding-system (read-coding-system
                         (if default
                             ;; Same "(default X)" wording as the prompt
                             ;; of `select-safe-coding-system'.
                             (format "Coding system for following command (default %s): " default)
                           "Coding system for following command: ")
                         default))
         (keyseq (read-key-sequence
                  (format "Command to execute with %s:" coding-system)))
         (cmd (key-binding keyseq)))
    (let ((coding-system-for-read coding-system)
          (coding-system-for-write coding-system))
      ;; Empty the echo area before running the command.
      (message "")
      (call-interactively cmd))))

208
(defun set-default-coding-systems (coding-system)
  "Set default value of various coding systems to CODING-SYSTEM.
This sets the following coding systems:
  o coding system of a newly created buffer
  o default coding system for subprocess I/O
This also sets the following values:
  o default value used as file-name-coding-system for converting file names
    (only when `default-enable-multibyte-characters' is non-nil).
  o default value for the command `set-terminal-coding-system' (not on MSDOS,
    unless CODING-SYSTEM is nil)
  o default value for the command `set-keyboard-coding-system'."
  (check-coding-system coding-system)
  (setq-default buffer-file-coding-system coding-system)
  (and default-enable-multibyte-characters
       (setq default-file-name-coding-system coding-system))
  ;; On MS-DOS the terminal coding system is left alone, except that a
  ;; nil CODING-SYSTEM is honored there too so that users can reset it.
  (if (or (not (eq window-system 'pc))
          (null coding-system))
      (setq default-terminal-coding-system coding-system))
  (setq default-keyboard-coding-system coding-system
        default-process-coding-system (cons coding-system coding-system)))

228 229 230
;; Keep the old name `update-iso-coding-systems' available as an
;; obsolete alias of `update-coding-systems-internal'.
(defalias 'update-iso-coding-systems 'update-coding-systems-internal)
(make-obsolete 'update-iso-coding-systems 'update-coding-systems-internal)

Kenichi Handa's avatar
Kenichi Handa committed
231 232
(defun prefer-coding-system (coding-system)
  "Add CODING-SYSTEM at the front of the priority list for automatic detection.
This also sets the following coding systems:
  o coding system of a newly created buffer
  o default coding system for subprocess I/O
This also sets the following values:
  o default value used as file-name-coding-system for converting file names.
  o default value for the command `set-terminal-coding-system' (not on MSDOS)
  o default value for the command `set-keyboard-coding-system'

If CODING-SYSTEM specifies a certain type of EOL conversion, the coding
systems set by this function will use that type of EOL conversion.

This command does not change the default value of terminal coding system
for MS-DOS terminal, because DOS terminals only support a single coding
system, and Emacs automatically sets the default to that coding system at
startup."
  (interactive "zPrefer coding system: ")
  (or (and coding-system (coding-system-p coding-system))
      (error "Invalid coding system `%s'" coding-system))
  (let ((coding-category (coding-system-category coding-system))
        (base (coding-system-base coding-system))
        (eol-type (coding-system-eol-type coding-system)))
    ;; No category means CODING-SYSTEM is no-conversion or undecided.
    (or coding-category
        (error "Can't prefer the coding system `%s'" coding-system))
    (set coding-category (or base coding-system))
    (update-coding-systems-internal)
    ;; Move the category to the head of the list unless it is there already.
    (or (eq coding-category (car coding-category-list))
        (setq coding-category-list
              (cons coding-category
                    (delq coding-category coding-category-list))))
    (and base
         (interactive-p)
         (message "Highest priority is set to %s (base of %s)"
                  base coding-system))
    ;; If they asked for specific EOL conversion, honor that.
    (set-default-coding-systems
     (if (memq eol-type '(0 1 2 unix dos mac))
         (coding-system-change-eol-conversion base eol-type)
       base))))
Kenichi Handa's avatar
Kenichi Handa committed
273

Richard M. Stallman's avatar
Richard M. Stallman committed
274
(defun find-coding-systems-region-subset-p (list1 list2)
  "Return t if every element of LIST1 is also an element of LIST2.
Return nil otherwise.  Elements are compared with `eq'."
  ;; Drop leading elements of LIST1 for as long as they occur in LIST2;
  ;; LIST1 is a subset exactly when nothing is left over.
  (while (and list1 (memq (car list1) list2))
    (setq list1 (cdr list1)))
  (null list1))

Kenichi Handa's avatar
Kenichi Handa committed
284
(defun find-coding-systems-region (from to)
  "Return a list of coding systems able to encode the text between FROM and TO.
Every coding system in the list can safely encode all multibyte
characters found in that text.

If the text contains no multibyte characters, the result is a list
whose single element is `undecided'."
  (let ((charsets (find-charset-region from to)))
    (find-coding-systems-for-charsets charsets)))
292

Kenichi Handa's avatar
Kenichi Handa committed
293 294 295 296 297
(defun find-coding-systems-string (string)
  "Return a list of coding systems able to encode STRING.
Every coding system in the list can safely encode all multibyte
characters found in STRING.

If STRING contains no multibyte characters, the result is a list
whose single element is `undecided'."
  (let ((charsets (find-charset-string string)))
    (find-coding-systems-for-charsets charsets)))

(defun find-coding-systems-for-charsets (charsets)
  "Return a list of proper coding systems to encode characters of CHARSETS.
CHARSETS is a list of character sets.

If CHARSETS is empty or holds only `ascii', the result is a list whose
single element is `undecided'.  Otherwise the result lists, highest
priority first, the coding systems whose `safe-charsets' property is t
or includes every member of CHARSETS other than `composition'."
  (cond
   ((or (null charsets)
        (and (null (cdr charsets))
             (eq (car charsets) 'ascii)))
    '(undecided))
   (t
    (setq charsets (delq 'composition charsets))
    (let ((candidates (coding-system-list 'base-only))
          (preferred
           (mapcar (function
                    (lambda (cs)
                      (if (eq cs 'unknown)
                          'raw-text
                        (get-charset-property cs 'prefered-coding-system))))
                   charsets))
          (priorities (mapcar 'symbol-value coding-category-list))
          ranked coding safe)
      ;; Invalid multibyte characters leave raw-text as the only candidate.
      (when (memq 'unknown charsets)
        (setq candidates '(raw-text)))
      (while candidates
        (setq coding (car candidates)
              candidates (cdr candidates)
              safe (coding-system-get coding 'safe-charsets))
        (when (and safe
                   (or (eq safe t)
                       (find-coding-systems-region-subset-p charsets safe)))
          ;; Build a numeric rank for CODING.  The largest terms come
          ;; from having a mime-charset and from the position in the
          ;; coding category priorities; then from being a preferred
          ;; coding system of one of CHARSETS, from the coding system
          ;; type, and from supporting a smaller number of charsets.
          (setq ranked
                (cons (cons (+ (if (coding-system-get coding 'mime-charset)
                                   4096
                                 0)
                               (lsh (length (memq coding priorities)) 7)
                               (if (memq coding preferred) 64 0)
                               (if (> (coding-system-type coding) 0) 32 0)
                               (if (consp safe) (- 32 (length safe)) 0))
                            coding)
                      ranked))))
      ;; Highest rank first; return only the coding systems.
      (mapcar 'cdr
              (sort ranked
                    (function (lambda (a b) (> (car a) (car b))))))))))
343

344 345 346 347 348 349 350 351 352 353
(defun find-multibyte-characters (from to &optional maxcount excludes)
  "Find multibyte characters in the region specified by FROM and TO.
If FROM is a string, find multibyte characters in the string;
TO is not used in that case.
The return value is an alist of the following format:
  ((CHARSET COUNT CHAR ...) ...)
where
  CHARSET is a character set,
  COUNT is a number of characters,
  CHARs are found characters of the character set.
Optional 3rd arg MAXCOUNT limits how many CHARs are put in the above list.
Optional 4th arg EXCLUDES is a list of character sets to be ignored.
If EXCLUDES is t, every character set except `unknown' is ignored.

For invalid characters, CHARs are actually strings."
  (let ((chars nil)
        charset char)
    (if (stringp from)
        (let ((idx 0))
          (while (setq idx (string-match "[^\000-\177]" from idx))
            (setq char (aref from idx)
                  charset (char-charset char))
            (if (eq charset 'unknown)
                ;; The match was made against FROM, so the matched text
                ;; must be extracted from FROM, not from the buffer.
                (setq char (match-string 0 from)))
            (if (or (eq charset 'unknown)
                    (not (or (eq excludes t) (memq charset excludes))))
                (let ((slot (assq charset chars)))
                  (if slot
                      ;; Use `member', not `memq': entries for invalid
                      ;; characters are strings, which are never `eq'.
                      (if (not (member char (nthcdr 2 slot)))
                          (let ((count (nth 1 slot)))
                            (setcar (cdr slot) (1+ count))
                            (if (or (not maxcount) (< count maxcount))
                                (nconc slot (list char)))))
                    (setq chars (cons (list charset 1 char) chars)))))
            (setq idx (1+ idx))))
      (save-excursion
        (goto-char from)
        (while (re-search-forward "[^\000-\177]" to t)
          (setq char (preceding-char)
                charset (char-charset char))
          (if (eq charset 'unknown)
              (setq char (match-string 0)))
          (if (or (eq charset 'unknown)
                  (not (or (eq excludes t) (memq charset excludes))))
              (let ((slot (assq charset chars)))
                (if slot
                    (if (not (member char (nthcdr 2 slot)))
                        (let ((count (nth 1 slot)))
                          (setcar (cdr slot) (1+ count))
                          (if (or (not maxcount) (< count maxcount))
                              (nconc slot (list char)))))
                  (setq chars (cons (list charset 1 char) chars))))))))
    ;; Slots were pushed at the front; restore order of first appearance.
    (nreverse chars)))

396 397 398 399 400 401 402
;; `select-safe-coding-system' stores the coding system chosen by the
;; user in this variable.
(defvar last-coding-system-specified nil
  "Most recent coding system explicitly specified by the user when asked.
This variable is set whenever Emacs asks the user which coding system
to use in order to write a file.  If you set it to nil explicitly,
then call `write-region', then afterward this variable will be non-nil
only if the user was explicitly asked and specified a coding system.")

403
(defun select-safe-coding-system (from to &optional default-coding-system)
  "Ask a user to select a safe coding system from candidates.
The candidates of coding systems which can safely encode a text
between FROM and TO are shown in a popup window.

Optional arg DEFAULT-CODING-SYSTEM specifies a coding system to be
checked at first.  If omitted, buffer-file-coding-system of the
current buffer is used.

If the text can be encoded safely by DEFAULT-CODING-SYSTEM, it is
returned without any user interaction.

Otherwise the coding system selected by the user is stored in
`last-coding-system-specified' and returned.  If the EOL type of
DEFAULT-CODING-SYSTEM is an integer, the selected coding system is
changed to use that EOL conversion.

Kludgy feature: if FROM is a string, the string is the target text,
and TO is ignored."
  (or default-coding-system
      (setq default-coding-system buffer-file-coding-system))
  (let* ((charsets (if (stringp from) (find-charset-string from)
                     (find-charset-region from to)))
         (safe-coding-systems (find-coding-systems-for-charsets charsets)))
    (if (or (not enable-multibyte-characters)
            (eq (car safe-coding-systems) 'undecided)
            (eq default-coding-system 'no-conversion)
            (and default-coding-system
                 (memq (coding-system-base default-coding-system)
                       safe-coding-systems)))
        default-coding-system

      ;; At first, change each coding system to the corresponding
      ;; mime-charset name if it is also a coding system.
      (let ((l safe-coding-systems)
            mime-charset)
        (while l
          (setq mime-charset (coding-system-get (car l) 'mime-charset))
          (if (and mime-charset (coding-system-p mime-charset))
              (setcar l mime-charset))
          (setq l (cdr l))))

      (let ((non-safe-chars (find-multibyte-characters
                             from to 3
                             (and default-coding-system
                                  (coding-system-get default-coding-system
                                                     'safe-charsets))))
            overlays)
        (save-excursion
          ;; Highlight characters that default-coding-system can't encode.
          (when (integerp from)
            (goto-char from)
            ;; Move to the first such character and show its line at
            ;; the top of the selected window.
            (let ((found nil))
              (while (and (not found)
                          (re-search-forward "[^\000-\177]" to t))
                (setq found (assq (char-charset (preceding-char))
                                  non-safe-chars))))
            (beginning-of-line)
            (set-window-start (selected-window) (point))
            (save-excursion
              (while (re-search-forward "[^\000-\177]" to t)
                (let* ((char (preceding-char))
                       (charset (char-charset char)))
                  (when (assq charset non-safe-chars)
                    (setq overlays (cons (make-overlay (1- (point)) (point))
                                         overlays))
                    (overlay-put (car overlays) 'face 'highlight))))))

          ;; At last, ask a user to select a proper coding system.
          (unwind-protect
              (save-window-excursion
                ;; At first, show a helpful message.
                (with-output-to-temp-buffer "*Warning*"
                  (save-excursion
                    (set-buffer standard-output)
                    (insert "The target text contains the following non ASCII character(s):\n")
                    (let ((len (length non-safe-chars))
                          (shown 0))
                      ;; Show at most three character sets.
                      (while (and non-safe-chars (< shown 3))
                        (when (> (length (car non-safe-chars)) 2)
                          (setq shown (1+ shown))
                          (insert (format "%25s: " (car (car non-safe-chars))))
                          (let ((l (nthcdr 2 (car non-safe-chars))))
                            (while l
                              (if (or (stringp (car l)) (char-valid-p (car l)))
                                  (insert (car l)))
                              (setq l (cdr l))))
                          (if (> (nth 1 (car non-safe-chars)) 3)
                              (insert "..."))
                          (insert "\n"))
                        (setq non-safe-chars (cdr non-safe-chars)))
                      (if (< shown len)
                          (insert (format "%27s\n" "..."))))
                    (insert (format "\
These can't be encoded safely by the coding system %s.

Please select one from the following safe coding systems:\n"
                                    default-coding-system))
                    (let ((pos (point))
                          (fill-prefix "  "))
                      (mapcar (function (lambda (x) (princ "  ") (princ x)))
                              safe-coding-systems)
                      (fill-region-as-paragraph pos (point)))))

                ;; Read a coding system.
                (let* ((safe-names (mapcar (lambda (x) (list (symbol-name x)))
                                           safe-coding-systems))
                       (name (completing-read
                              (format "Select coding system (default %s): "
                                      (car safe-coding-systems))
                              safe-names nil t nil nil
                              (car (car safe-names)))))
                  (setq last-coding-system-specified (intern name))
                  (if (integerp (coding-system-eol-type default-coding-system))
                      (setq last-coding-system-specified
                            (coding-system-change-eol-conversion
                             last-coding-system-specified
                             (coding-system-eol-type default-coding-system))))
                  last-coding-system-specified))
            ;; Cleanup.  Remove the highlighting first so that it can
            ;; never be left behind, then discard the warning buffer,
            ;; but only if it exists: `kill-buffer' signals an error
            ;; when given the name of a nonexistent buffer.
            (while overlays
              (delete-overlay (car overlays))
              (setq overlays (cdr overlays)))
            (if (get-buffer "*Warning*")
                (kill-buffer "*Warning*"))))))))
521 522 523

;; Install `select-safe-coding-system' as the value of
;; `select-safe-coding-system-function'; `select-message-coding-system'
;; calls the function stored in that variable.
(setq select-safe-coding-system-function 'select-safe-coding-system)

524 525 526 527 528 529 530 531 532 533
(defun select-message-coding-system ()
  "Return a coding system to encode the outgoing message of the current buffer.
It at first tries the first coding system found in these variables
in this order:
  (1) local value of `buffer-file-coding-system'
  (2) value of `sendmail-coding-system'
  (3) value of `default-buffer-file-coding-system'
  (4) value of `default-sendmail-coding-system'
If the found coding system can't encode the current buffer,
or none of them are bound to a coding system,
it asks the user to select a proper coding system."
  (let ((coding (cond ((and (local-variable-p 'buffer-file-coding-system)
                            buffer-file-coding-system))
                      (sendmail-coding-system)
                      (default-buffer-file-coding-system)
                      (default-sendmail-coding-system))))
    ;; We should never use no-conversion for outgoing mails.
    (and (eq coding 'no-conversion)
         (setq coding nil))
    (if (not (fboundp select-safe-coding-system-function))
        coding
      (funcall select-safe-coding-system-function
               (point-min) (point-max) coding))))
Karl Heuer's avatar
Karl Heuer committed
547

548
;;; Language support stuff.
Karl Heuer's avatar
Karl Heuer committed
549 550

(defvar language-info-alist nil
  "Alist of language environment definitions.
Each element looks like:
        (LANGUAGE-NAME . ((KEY . INFO) ...))
where LANGUAGE-NAME is a string, the name of the language environment,
KEY is a symbol denoting the kind of information, and
INFO is the data associated with KEY.
Meaningful values for KEY include

  documentation      value is documentation of what this language environment
                        is meant for, and how to use it.
  charset            value is a list of the character sets used by this
                        language environment.
  sample-text        value is one line of text,
                        written using those character sets,
                        appropriate for this language environment.
  setup-function     value is a function to call to switch to this
                        language environment.
  exit-function      value is a function to call to leave this
                        language environment.
  coding-system      value is a list of coding systems that are good
                        for saving text written in this language environment.
                        This list serves as suggestions to the user;
                        in effect, as a kind of documentation.
  coding-priority    value is a list of coding systems for this language
                        environment, in order of decreasing priority.
                        This is used to set up the coding system priority
                        list when you switch to this language environment.
  nonascii-translation
                     value is a translation table to be set in the
                        variable `nonascii-translation-table' in this
                        language environment, or a character set from
                        which `nonascii-insert-offset' is calculated.
  charset-origin-alist
                     value is an alist to be set in the variable
                        `charset-origin-alist' in this language environment.
  input-method       value is a default input method for this language
                        environment.
  features           value is a list of features requested in this
                        language environment.

The following keys take effect only when multibyte characters are
globally disabled, i.e. the value of `default-enable-multibyte-characters'
is nil.

  unibyte-syntax     value is a library name to load to set
                        unibyte 8-bit character syntaxes for this
                        language environment.

  unibyte-display    value is a coding system to encode characters
                        for the terminal.  Characters in the range
                        of 160 to 255 display not as octal escapes,
                        but as non-ASCII characters in this language
                        environment.")
Richard M. Stallman's avatar
Richard M. Stallman committed
604 605 606 607 608 609 610 611 612

(defun get-language-info (lang-env key)
  "Return information listed under KEY for language environment LANG-ENV.
LANG-ENV is a string or a symbol; its name is looked up in
`language-info-alist' ignoring case.
KEY is a symbol denoting the kind of information.
Return nil if LANG-ENV has no definition or nothing is listed under KEY.
For a list of useful values for KEY and their meanings,
see `language-info-alist'."
  (let* ((name (if (symbolp lang-env) (symbol-name lang-env) lang-env))
         (lang-slot (assoc-ignore-case name language-info-alist)))
    (and lang-slot
         (cdr (assq key (cdr lang-slot))))))

616
(defun set-language-info (lang-env key info)
  "Modify part of the definition of language environment LANG-ENV.
Specifically, this stores the information INFO under KEY
in the definition of this language environment.
LANG-ENV is a string or a symbol naming the language environment.
KEY is a symbol denoting the kind of information.
INFO is the value for that information.

For a list of useful values for KEY and their meanings,
see `language-info-alist'."
  (let* ((name (if (symbolp lang-env) (symbol-name lang-env) lang-env))
         ;; Find the slot for the language, adding a fresh one at the
         ;; front of `language-info-alist' if there is none yet.
         (lang-slot (or (assoc name language-info-alist)
                        (car (setq language-info-alist
                                   (cons (list name) language-info-alist)))))
         ;; Likewise find the slot for KEY, adding it right after the
         ;; language name if it is missing.
         (key-slot (or (assq key lang-slot)
                       (car (setcdr lang-slot
                                    (cons (list key) (cdr lang-slot)))))))
    (setcdr key-slot info)))
Karl Heuer's avatar
Karl Heuer committed
638

Richard M. Stallman's avatar
Richard M. Stallman committed
639 640 641
(defun set-language-info-alist (lang-env alist &optional parents)
  "Store ALIST as the definition of language environment LANG-ENV.
ALIST is an alist of KEY and INFO values.  See the documentation of
`set-language-info' for the meanings of KEY and INFO.

Optional arg PARENTS is a list of parent menu names; it specifies
where to put this language environment in the
Describe Language Environment and Set Language Environment menus.
For example, (\"European\") means to put this language environment
in the European submenu in each of those two menus.
Each element of PARENTS may be a string or a symbol."
  (if (symbolp lang-env)
      (setq lang-env (symbol-name lang-env)))
  (let ((describe-map describe-language-environment-map)
        (setup-map setup-language-environment-map))
    (if parents
        (let ((l parents)
              map parent-symbol parent)
          (while l
            ;; Get both forms of the parent name: PARENT is the string,
            ;; PARENT-SYMBOL the symbol.  The name must be taken from
            ;; PARENT-SYMBOL, the element just fetched from the list.
            (if (symbolp (setq parent-symbol (car l)))
                (setq parent (symbol-name parent-symbol))
              (setq parent parent-symbol parent-symbol (intern parent)))
            ;; Find the parent's submenu of the describe menu, creating
            ;; it as a prefix command if needed, and descend into it.
            (setq map (lookup-key describe-map (vector parent-symbol)))
            (if (not map)
                (progn
                  (setq map (intern (format "describe-%s-environment-map"
                                            (downcase parent))))
                  (define-prefix-command map)
                  (define-key-after describe-map (vector parent-symbol)
                    (cons parent map) t)))
            (setq describe-map (symbol-value map))
            ;; Do the same in the setup menu.
            (setq map (lookup-key setup-map (vector parent-symbol)))
            (if (not map)
                (progn
                  (setq map (intern (format "setup-%s-environment-map"
                                            (downcase parent))))
                  (define-prefix-command map)
                  (define-key-after setup-map (vector parent-symbol)
                    (cons parent map) t)))
            (setq setup-map (symbol-value map))
            (setq l (cdr l)))))

    ;; Set up menu items for this language env.  The describe menu gets
    ;; an entry only when ALIST has a `documentation' element.
    (let ((doc (assq 'documentation alist)))
      (when doc
        (define-key-after describe-map (vector (intern lang-env))
          (cons lang-env 'describe-specified-language-support) t)))
    (define-key-after setup-map (vector (intern lang-env))
      (cons lang-env 'setup-specified-language-environment) t)

    ;; Store every (KEY . INFO) pair of ALIST.
    (while alist
      (set-language-info lang-env (car (car alist)) (cdr (car alist)))
      (setq alist (cdr alist)))))
Karl Heuer's avatar
Karl Heuer committed
691

692
(defun read-language-name (key prompt &optional default)
  "Read a language environment name which has information for KEY.
If KEY is nil, read any language environment.
Prompt with PROMPT.  DEFAULT is the default choice of language environment.
Completion is done over `language-info-alist', ignoring case.
This returns a language environment name as a string, or nil if the
input is empty or the chosen environment has no information for KEY."
  (let* ((completion-ignore-case t)
         (name (completing-read prompt
                                language-info-alist
                                ;; When KEY is given, offer only the
                                ;; environments that have an entry for it.
                                (and key
                                     (function (lambda (elm) (assq key elm))))
                                t nil nil default)))
    (if (and (> (length name) 0)
             (or (not key)
                 (get-language-info name key)))
        name)))
Karl Heuer's avatar
Karl Heuer committed
707 708 709

;;; Multilingual input methods.

710 711 712 713 714 715 716 717 718 719
(defconst leim-list-file-name "leim-list.el"
  "Name of LEIM list file.
This file contains a list of libraries of Emacs input methods (LEIM)
in the form of Lisp expressions, each registering one input method.
Emacs loads this file at startup time.")

;; The header text is built once, when this definition is evaluated, by
;; substituting `leim-list-file-name' for the `%s' in the first line.
(defvar leim-list-header (format "\
;;; %s -- list of LEIM (Library of Emacs Input Method)
;;
;; This file contains a list of LEIM (Library of Emacs Input Method)
;; in the same directory as this file.  Loading this file registers
;; the whole input methods in Emacs.
;;
;; Each entry has the form:
;;   (register-input-method
;;    INPUT-METHOD LANGUAGE-NAME ACTIVATE-FUNC
;;    TITLE DESCRIPTION
;;    ARG ...)
;; See the function `register-input-method' for the meanings of arguments.
;;
;; If this directory is included in load-path, Emacs automatically
;; loads this file at startup time.

"
                                 leim-list-file-name)
  "Header to be inserted in LEIM list file.")

737
(defvar leim-list-entry-regexp "^(register-input-method"
  "Regexp matching head of each entry in LEIM list file.
See also the variable `leim-list-header'.")

(defvar update-leim-list-functions
  '(quail-update-leim-list-file)
  "List of functions to call to update LEIM list file.
Each function is called by `update-leim-list-file' with the LEIM
directory names given to that function as its arguments.")

746 747
(defun update-leim-list-file (&rest dirs)
  "Update LEIM list file in directories DIRS.
Call each function in `update-leim-list-functions', in order, with
all of DIRS as its arguments."
  (let ((functions update-leim-list-functions))
    (while functions
      (apply (car functions) dirs)
      (setq functions (cdr functions)))))

Karl Heuer's avatar
Karl Heuer committed
753 754
(defvar current-input-method nil
  "The current input method for multilingual text.
If nil, that means no input method is activated now.")
;; Each buffer has its own input method, and the setting is marked
;; `permanent-local'.
(make-variable-buffer-local 'current-input-method)
(put 'current-input-method 'permanent-local t)

(defvar current-input-method-title nil
  "Title string of the current input method shown in mode line.")
;; Per-buffer and marked `permanent-local', like `current-input-method'.
(make-variable-buffer-local 'current-input-method-title)
(put 'current-input-method-title 'permanent-local t)

764
(defcustom default-input-method nil
  "*Default input method for multilingual text (a string).
This is the input method activated automatically by the command
`toggle-input-method' (\\[toggle-input-method])."
  :group 'mule
  :type '(choice (const nil) string))
770

Kenichi Handa's avatar
Kenichi Handa committed
771 772 773 774
(defvar input-method-history nil
  "History list for some commands that read input methods.
`inactivate-input-method' also moves the input method being turned
off to the front of this list.")
;; The history is kept separately in each buffer and is marked
;; `permanent-local'.
(make-variable-buffer-local 'input-method-history)
(put 'input-method-history 'permanent-local t)
Karl Heuer's avatar
Karl Heuer committed
775 776 777 778

(defvar inactivate-current-input-method-function nil
  "Function to call for inactivating the current input method.
Every input method should set this to an appropriate value when activated.
This function is called with no argument.

This function should never change the value of `current-input-method'.
It is set to nil by the function `inactivate-input-method'.")
;; Per-buffer and marked `permanent-local', like `current-input-method'.
(make-variable-buffer-local 'inactivate-current-input-method-function)
(put 'inactivate-current-input-method-function 'permanent-local t)

(defvar describe-current-input-method-function nil
  "Function to call for describing the current input method.
This function is called with no argument.
`describe-current-input-method' calls it only when the value is a
symbol with a function definition.")
;; Per-buffer and marked `permanent-local'.
(make-variable-buffer-local 'describe-current-input-method-function)
(put 'describe-current-input-method-function 'permanent-local t)

792
(defvar input-method-alist nil
  "Alist of input method names vs how to use them.
Each element has the form:
   (INPUT-METHOD LANGUAGE-ENV ACTIVATE-FUNC TITLE DESCRIPTION ARGS...)
See the function `register-input-method' for the meanings of the elements.")

798
(defun register-input-method (input-method lang-env &rest args)
  "Register INPUT-METHOD as an input method for language environment LANG-ENV.
INPUT-METHOD and LANG-ENV are symbols or strings.

The remaining arguments are:
	ACTIVATE-FUNC, TITLE, DESCRIPTION, and ARGS...
ACTIVATE-FUNC is a function to call to activate this method.
TITLE is a string to show in the mode line when this method is active.
DESCRIPTION is a string describing this method and what it is good for.
The ARGS, if any, are passed as arguments to ACTIVATE-FUNC.
All told, the arguments to ACTIVATE-FUNC are INPUT-METHOD and the ARGS.

This function is mainly used in the file \"leim-list.el\" which is
created at building time of emacs, registering all quail input methods
contained in the emacs distribution.

In case you want to register a new quail input method by yourself, be
careful to use the same input method title as given in the third
parameter of `quail-define-package' (if the values are different, the
string specified in this function takes precedence).

The commands `describe-input-method' and `list-input-methods' need
this duplicated values to show some information about input methods
without loading the affected quail packages."
  ;; Both names are stored as strings in `input-method-alist'.
  (if (symbolp lang-env)
      (setq lang-env (symbol-name lang-env)))
  (if (symbolp input-method)
      (setq input-method (symbol-name input-method)))
  (let ((info (cons lang-env args))
        (slot (assoc input-method input-method-alist)))
    ;; Re-registering an existing method replaces its data in place;
    ;; a new method is pushed onto the front of the alist.
    (if slot
        (setcdr slot info)
      (setq slot (cons input-method info))
      (setq input-method-alist (cons slot input-method-alist)))))

833
(defun read-input-method-name (prompt &optional default inhibit-null)
  "Read a name of input method from a minibuffer prompting with PROMPT.
If DEFAULT is non-nil, use that as the default,
  and substitute it into PROMPT at the first `%s'.
If INHIBIT-NULL is non-nil, null input signals an error.
Completion is done over `input-method-alist', ignoring case, and uses
`input-method-history' as the minibuffer history.

The return value is a string, or nil if the input is empty and
INHIBIT-NULL is nil."
  (if default
      (setq prompt (format prompt default)))
  (let* ((completion-ignore-case t)
         ;; This binding is necessary because input-method-history is
         ;; buffer local.
         (input-method (completing-read prompt input-method-alist
                                        nil t nil 'input-method-history
                                        default)))
    (if (> (length input-method) 0)
        input-method
      (if inhibit-null
          (error "No valid input method is specified")))))
852 853

(defun activate-input-method (input-method)
  "Switch to input method INPUT-METHOD for the current buffer.
INPUT-METHOD is a string or a symbol naming an entry of
`input-method-alist'.
If some other input method is already active, turn it off first.
If INPUT-METHOD is nil, deactivate any current input method.

The activation function of the entry is either a function, or a cons
\(FUNCTION . FEATURE) of two symbols, in which case FEATURE is
required before FUNCTION is called.  Signal an error if INPUT-METHOD
is not registered or its activation function has neither form.
After activation, run `input-method-activate-hook'."
  (if (and input-method (symbolp input-method))
      (setq input-method (symbol-name input-method)))
  (if (and current-input-method
           (not (string= current-input-method input-method)))
      (inactivate-input-method))
  ;; Nothing more to do if the requested method is already active or
  ;; if we were only asked to deactivate.
  (unless (or current-input-method (null input-method))
    (let ((slot (assoc input-method input-method-alist)))
      (if (null slot)
          (error "Can't activate input method `%s'" input-method))
      (let ((func (nth 2 slot)))
        (if (functionp func)
            (apply func input-method (nthcdr 5 slot))
          (if (and (consp func) (symbolp (car func)) (symbolp (cdr func)))
              (progn
                (require (cdr func))
                (apply (car func) input-method (nthcdr 5 slot)))
            (error "Can't activate input method `%s'" input-method))))
      (setq current-input-method input-method)
      (setq current-input-method-title (nth 3 slot))
      ;; Refresh the mode line even if a hook function signals an error.
      (unwind-protect
          (run-hooks 'input-method-activate-hook)
        (force-mode-line-update)))))
879 880

(defun inactivate-input-method ()
  "Turn off the current input method.
Do nothing if no input method is active.  Otherwise move the current
input method to the front of `input-method-history', call
`inactivate-current-input-method-function', and run
`input-method-inactivate-hook'.  `current-input-method' and
`current-input-method-title' are reset to nil even if one of those
calls signals an error."
  (when current-input-method
    ;; Record the method as the most recently used one, without
    ;; leaving a duplicate further down the history.
    (if input-method-history
        (unless (string= current-input-method (car input-method-history))
          (setq input-method-history
                (cons current-input-method
                      (delete current-input-method input-method-history))))
      (setq input-method-history (list current-input-method)))
    (unwind-protect
        (funcall inactivate-current-input-method-function)
      (unwind-protect
          (run-hooks 'input-method-inactivate-hook)
        (setq current-input-method nil
              current-input-method-title nil)
        (force-mode-line-update)))))
Karl Heuer's avatar
Karl Heuer committed
896

897
(defun set-input-method (input-method)
  "Select and activate input method INPUT-METHOD for the current buffer.
This also sets the default input method to the one you specify.
When called interactively, read INPUT-METHOD from the minibuffer,
defaulting to the first element of `input-method-history' or else to
`default-input-method'."
  (interactive
   (let* ((default (or (car input-method-history) default-input-method)))
     (list (read-input-method-name
            (if default "Select input method (default %s): " "Select input method: ")
            default t))))
  (activate-input-method input-method)
  (setq default-input-method input-method))
Karl Heuer's avatar
Karl Heuer committed
907 908

(defun toggle-input-method (&optional arg)
  "Turn on or off a multilingual text input method for the current buffer.

With no prefix argument, if some input method is currently activated,
turn it off.  Otherwise, activate an input method--the one most recently used,
or the one specified in `default-input-method', or one read from the
minibuffer.

With a prefix arg, read an input method from minibuffer and turn it on.
The default is the most recent input method specified
\(not including the currently active input method, if any).

If there is no input method to turn on, read one from the minibuffer
and turn it on."
  (interactive "P")
  (if (and current-input-method (not arg))
      (inactivate-input-method)
    (let ((default (or (car input-method-history) default-input-method)))
      ;; With a prefix arg, do not offer the already active method as
      ;; the default; fall back to the previous one in the history.
      (if (and arg default (equal current-input-method default)
               (> (length input-method-history) 1))
          (setq default (nth 1 input-method-history)))
      (activate-input-method
       (if (or arg (not default))
           (read-input-method-name
            (if default "Input method (default %s): " "Input method: " )
            default t)
         default))
      ;; Remember the first method ever chosen as the default one.
      (or default-input-method
          (setq default-input-method current-input-method)))))
937 938

(defun describe-input-method (input-method)
  "Describe input method INPUT-METHOD.
INPUT-METHOD is a string or a symbol.  If it is nil (interactively,
if the minibuffer input is empty), describe the current input method
with `describe-current-input-method' instead.
Otherwise display, in the *Help* buffer, the name, mode-line title,
language environment and description recorded in `input-method-alist'."
  (interactive
   (list (read-input-method-name
          "Describe input method (default, current choice): ")))
  (if (and input-method (symbolp input-method))
      (setq input-method (symbol-name input-method)))
  (if (null input-method)
      (describe-current-input-method)
    (with-output-to-temp-buffer "*Help*"
      (let ((elt (assoc input-method input-method-alist)))
        (princ (format "Input method: %s (`%s' in mode line) for %s\n  %s\n"
                       input-method (nth 3 elt) (nth 1 elt) (nth 4 elt)))))))

(defun describe-current-input-method ()
  "Describe the input method currently in use.
Call `describe-current-input-method-function' if it is a symbol with
a function definition; otherwise show a message saying that the
current input method cannot be described, and beep.
Signal an error if no input method is active."
  (if current-input-method
      (if (and (symbolp describe-current-input-method-function)
               (fboundp describe-current-input-method-function))
          (funcall describe-current-input-method-function)
        ;; `current-input-method' is the method name itself (a string),
        ;; so report it directly.
        (message "No way to describe the current input method `%s'"
                 current-input-method)
        (ding))
    (error "No input method is activated now")))
Karl Heuer's avatar
Karl Heuer committed
962

963
(defun read-multilingual-string (prompt &optional initial-input input-method)
  "Read a multilingual string from minibuffer, prompting with string PROMPT.
The input method selected last time is activated in minibuffer.
If optional second arg INITIAL-INPUT is non-nil, insert it in the minibuffer
initially.
Optional 3rd argument INPUT-METHOD specifies the input method
to be activated instead of the one selected last time.  It is a symbol
or a string.
If INPUT-METHOD is nil, use `current-input-method', or else
`default-input-method', or else read an input method name from the
minibuffer.  The input method that was active on entry is activated
again before returning."
  (setq input-method
        (or input-method
            current-input-method
            default-input-method
            (read-input-method-name "Input method: " nil t)))
  (if (and input-method (symbolp input-method))
      (setq input-method (symbol-name input-method)))
  (let ((prev-input-method current-input-method))
    ;; Restore the caller's input method even if reading is aborted.
    (unwind-protect
        (progn
          (activate-input-method input-method)
          (read-string prompt initial-input nil nil t))
      (activate-input-method prev-input-method))))