123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408 |
- ;;; mule-util.el --- utility functions for multilingual environment (mule)
- ;; Copyright (C) 1997-1998, 2000-2012 Free Software Foundation, Inc.
- ;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
- ;; 2005, 2006, 2007, 2008, 2009, 2010, 2011
- ;; National Institute of Advanced Industrial Science and Technology (AIST)
- ;; Registration Number H14PRO021
- ;; Copyright (C) 2003
- ;; National Institute of Advanced Industrial Science and Technology (AIST)
- ;; Registration Number H13PRO009
- ;; Keywords: mule, multilingual
- ;; This file is part of GNU Emacs.
- ;; GNU Emacs is free software: you can redistribute it and/or modify
- ;; it under the terms of the GNU General Public License as published by
- ;; the Free Software Foundation, either version 3 of the License, or
- ;; (at your option) any later version.
- ;; GNU Emacs is distributed in the hope that it will be useful,
- ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- ;; GNU General Public License for more details.
- ;; You should have received a copy of the GNU General Public License
- ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
- ;;; Commentary:
- ;;; Code:
- ;;; String manipulations while paying attention to multibyte
- ;;; characters.
;;;###autoload
(defun string-to-sequence (string type)
  "Return the characters of STRING as a sequence of TYPE.
TYPE must be the symbol `list' or the symbol `vector'; any other
value signals an error."
  ;; `vconcat' and `append' each do the whole conversion in a single
  ;; call, so no explicit per-character loop is needed.
  (cond ((eq type 'vector)
         (vconcat string))
        ((eq type 'list)
         (append string nil))
        (t
         (error "Invalid type: %s" type))))
;;;###autoload
(make-obsolete 'string-to-sequence
               "use `string-to-list' or `string-to-vector'."
               "22.1")
;;;###autoload
(defsubst string-to-list (string)
  "Return the characters of STRING, in order, as a freshly made list."
  ;; Appending nil makes `append' copy STRING's elements into a list.
  (append string nil))
;;;###autoload
(defsubst string-to-vector (string)
  "Return the characters of STRING, in order, as a freshly made vector."
  (vconcat string))
;;;###autoload
(defun store-substring (string idx obj)
  "Embed OBJ (string or character) at index IDX of STRING.
STRING is modified in place and returned.
If OBJ is an integer it is stored as the single character at IDX.
Otherwise each element of OBJ is stored into STRING at consecutive
positions starting at IDX."
  (if (integerp obj)
      (aset string idx obj)
    ;; Copy OBJ element by element; `aset' itself signals an error if
    ;; a target index falls outside STRING.
    (dotimes (i (length obj))
      (aset string (+ idx i) (aref obj i))))
  string)
;;;###autoload
(defun truncate-string-to-width (str end-column
                                     &optional start-column padding ellipsis)
  "Truncate string STR to end at column END-COLUMN.
The optional 3rd arg START-COLUMN, if non-nil, specifies the starting
column; that means to return the characters occupying columns
START-COLUMN ... END-COLUMN of STR.  Both END-COLUMN and START-COLUMN
are specified in terms of character display width in the current
buffer; see also `char-width'.

The optional 4th arg PADDING, if non-nil, specifies a padding
character (which should have a display width of 1) to add at the end
of the result if STR doesn't reach column END-COLUMN, or if END-COLUMN
comes in the middle of a character in STR.  PADDING is also added at
the beginning of the result if column START-COLUMN appears in the
middle of a character in STR.

If PADDING is nil, no padding is added in these cases, so
the resulting string may be narrower than END-COLUMN.

If ELLIPSIS is non-nil, it should be a string which will replace the
end of STR (including any padding) if it extends beyond END-COLUMN,
unless the display width of STR is equal to or less than the display
width of ELLIPSIS.  If it is non-nil and not a string, then ELLIPSIS
defaults to \"...\"."
  (or start-column
      (setq start-column 0))
  (when (and ellipsis (not (stringp ellipsis)))
    (setq ellipsis "..."))
  (let ((str-len (length str))
        (str-width (string-width str))
        (ellipsis-width (if ellipsis (string-width ellipsis) 0))
        (idx 0)
        (column 0)
        (head-padding "") (tail-padding "")
        ch last-column last-idx from-idx)
    ;; Advance IDX until COLUMN reaches START-COLUMN.  Running past the
    ;; end of STR makes `aref' signal `args-out-of-range', which simply
    ;; ends the scan with IDX at the end of the string.
    (condition-case nil
        (while (< column start-column)
          (setq ch (aref str idx)
                column (+ column (char-width ch))
                idx (1+ idx)))
      (args-out-of-range (setq idx str-len)))
    (if (< column start-column)
        ;; STR ends before START-COLUMN: nothing of it can be returned.
        (if padding (make-string end-column padding) "")
      ;; START-COLUMN fell inside a wide character: COLUMN overshot it,
      ;; so fill the skipped columns with PADDING.
      (when (and padding (> column start-column))
        (setq head-padding (make-string (- column start-column) padding)))
      (setq from-idx idx)
      (when (>= end-column column)
        ;; Reserve room for ELLIPSIS only when STR really is cut short
        ;; and is wider than ELLIPSIS; otherwise drop the ellipsis.
        (if (and (< end-column str-width)
                 (> str-width ellipsis-width))
            (setq end-column (- end-column ellipsis-width))
          (setq ellipsis ""))
        ;; Advance to END-COLUMN, remembering the state before the last
        ;; character so it can be undone if that character overshoots.
        (condition-case nil
            (while (< column end-column)
              (setq last-column column
                    last-idx idx
                    ch (aref str idx)
                    column (+ column (char-width ch))
                    idx (1+ idx)))
          (args-out-of-range (setq idx str-len)))
        (when (> column end-column)
          (setq column last-column
                idx last-idx))
        (when (and padding (< column end-column))
          (setq tail-padding (make-string (- end-column column) padding))))
      (concat head-padding (substring str from-idx idx)
              tail-padding ellipsis))))
- ;;; Test suite for truncate-string-to-width
- ;; (dolist (test '((("" 0) . "")
- ;; (("x" 1) . "x")
- ;; (("xy" 1) . "x")
- ;; (("xy" 2 1) . "y")
- ;; (("xy" 0) . "")
- ;; (("xy" 3) . "xy")
- ;; (("$AVP(B" 0) . "")
- ;; (("$AVP(B" 1) . "")
- ;; (("$AVP(B" 2) . "$AVP(B")
- ;; (("$AVP(B" 1 nil ? ) . " ")
- ;; (("$AVPND(B" 3 1 ? ) . " ")
- ;; (("x$AVP(Bx" 2) . "x")
- ;; (("x$AVP(Bx" 3) . "x$AVP(B")
- ;; (("x$AVP(Bx" 3) . "x$AVP(B")
- ;; (("x$AVP(Bx" 4 1) . "$AVP(Bx")
- ;; (("kor$(CGQ(Be$(C1[(Ban" 8 1 ? ) . "or$(CGQ(Be$(C1[(B")
- ;; (("kor$(CGQ(Be$(C1[(Ban" 7 2 ? ) . "r$(CGQ(Be ")
- ;; (("" 0 nil nil "...") . "")
- ;; (("x" 3 nil nil "...") . "x")
- ;; (("$AVP(B" 3 nil nil "...") . "$AVP(B")
- ;; (("foo" 3 nil nil "...") . "foo")
- ;; (("foo" 2 nil nil "...") . "fo") ;; XEmacs failure?
- ;; (("foobar" 6 0 nil "...") . "foobar")
- ;; (("foobarbaz" 6 nil nil "...") . "foo...")
- ;; (("foobarbaz" 7 2 nil "...") . "ob...")
- ;; (("foobarbaz" 9 3 nil "...") . "barbaz")
- ;; (("$A$3(Bh$A$s(Be$A$K(Bl$A$A(Bl$A$O(Bo" 15 1 ? t) . " h$A$s(Be$A$K(Bl$A$A(Bl$A$O(Bo")
- ;; (("$A$3(Bh$A$s(Be$A$K(Bl$A$A(Bl$A$O(Bo" 14 1 ? t) . " h$A$s(Be$A$K(Bl$A$A(B...")
- ;; (("x" 3 nil nil "$(Gemk#(B") . "x")
- ;; (("$AVP(B" 2 nil nil "$(Gemk#(B") . "$AVP(B")
- ;; (("$AVP(B" 1 nil ?x "$(Gemk#(B") . "x") ;; XEmacs error
- ;; (("$AVPND(B" 3 nil ? "$(Gemk#(B") . "$AVP(B ") ;; XEmacs error
- ;; (("foobarbaz" 4 nil nil "$(Gemk#(B") . "$(Gemk#(B")
- ;; (("foobarbaz" 5 nil nil "$(Gemk#(B") . "f$(Gemk#(B")
- ;; (("foobarbaz" 6 nil nil "$(Gemk#(B") . "fo$(Gemk#(B")
- ;; (("foobarbaz" 8 3 nil "$(Gemk#(B") . "b$(Gemk#(B")
- ;; (("$A$3(Bh$A$s(Be$A$K(Bl$A$A(Bl$A$O(Bo" 14 4 ?x "$AHU1>$(Gk#(B") . "xe$A$KHU1>$(Gk#(B")
- ;; (("$A$3(Bh$A$s(Be$A$K(Bl$A$A(Bl$A$O(Bo" 13 4 ?x "$AHU1>$(Gk#(B") . "xex$AHU1>$(Gk#(B")
- ;; ))
- ;; (let (ret)
- ;; (condition-case e
- ;; (setq ret (apply #'truncate-string-to-width (car test)))
- ;; (error (setq ret e)))
- ;; (unless (equal ret (cdr test))
- ;; (error "%s: expected %s, got %s"
- ;; (prin1-to-string (cons 'truncate-string-to-width (car test)))
- ;; (prin1-to-string (cdr test))
- ;; (if (consp ret)
- ;; (format "error: %s: %s" (car ret)
- ;; (prin1-to-string (cdr ret)))
- ;; (prin1-to-string ret))))))
;;; Nested alist handler.  A nested alist is an alist whose elements
;;; are themselves nested alists.
;;;###autoload
(defsubst nested-alist-p (obj)
  "Return t if OBJ is a nested alist.

A nested alist is a list of the form (ENTRY . BRANCHES), where ENTRY is
any Lisp object, and BRANCHES is a list of cons cells of the form
\(KEY-ELEMENT . NESTED-ALIST).

A nested alist can store any Lisp object (ENTRY) for a key sequence
KEYSEQ, where KEYSEQ is a sequence of KEY-ELEMENT.  KEYSEQ can be a
string, a vector, or a list."
  ;; Only the outermost cell is inspected: OBJ must be a cons whose
  ;; cdr is itself a list (possibly empty).
  (and (consp obj) (listp (cdr obj))))
;;;###autoload
(defun set-nested-alist (keyseq entry alist &optional len branches)
  "Set ENTRY for KEYSEQ in a nested alist ALIST.
ALIST is modified destructively; missing intermediate levels are
created with a placeholder entry of t.
Optional 4th arg LEN non-nil means only the first LEN elements of
KEYSEQ are considered.
Optional 5th argument BRANCHES, if non-nil, is the branches for key
sequences longer than KEYSEQ; it is attached after the node for KEYSEQ.
See the documentation of `nested-alist-p' for more detail."
  (unless (nested-alist-p alist)
    (error "Invalid argument %s" alist))
  (let ((list-keys (listp keyseq))
        (limit (or len (length keyseq)))
        (pos 0)
        elt node)
    (while (< pos limit)
      (unless (nested-alist-p alist)
        (error "Keyseq %s is too long for this nested alist" keyseq))
      (setq elt (if list-keys (nth pos keyseq) (aref keyseq pos))
            node (assoc elt (cdr alist)))
      ;; No branch for this key element yet: push a fresh one whose
      ;; nested alist starts out as (t).
      (when (null node)
        (setq node (cons elt (list t)))
        (setcdr alist (cons node (cdr alist))))
      ;; Descend into the nested alist stored under this key element.
      (setq alist (cdr node)
            pos (1+ pos)))
    (setcar alist entry)
    (if branches
        (setcdr (last alist) branches))))
;;;###autoload
(defun lookup-nested-alist (keyseq alist &optional len start nil-for-too-long)
  "Look up key sequence KEYSEQ in nested alist ALIST.  Return the definition.
Optional 3rd argument LEN specifies the length of KEYSEQ.
Optional 4th argument START specifies the index of the starting key.
The returned value is normally a nested alist whose car is the entry
for KEYSEQ.
If ALIST is not deep enough for KEYSEQ, return a number: the index in
KEYSEQ of the first key element that could not be followed.
Optional 5th argument NIL-FOR-TOO-LONG non-nil means return nil
instead of that number when ALIST is not deep enough."
  (unless (nested-alist-p alist)
    (error "Invalid argument %s" alist))
  (let ((limit (or len (length keyseq)))
        (pos (or start 0))
        (list-keys (listp keyseq))
        (too-long nil))
    ;; Walk down one level per key element, stopping as soon as a key
    ;; element has no (non-nil) nested alist below it.
    (while (and (not too-long) (< pos limit))
      (setq alist (cdr (assoc (if list-keys
                                  (nth pos keyseq)
                                (aref keyseq pos))
                              (cdr alist))))
      (if alist
          (setq pos (1+ pos))
        (setq too-long t)))
    (cond ((not too-long) alist)
          (nil-for-too-long nil)
          (t pos))))
- ;; Coding system related functions.
;;;###autoload
(defun coding-system-post-read-conversion (coding-system)
  "Return CODING-SYSTEM's `:post-read-conversion' property.
The value is fetched with `coding-system-get'."
  (coding-system-get coding-system :post-read-conversion))
;;;###autoload
(defun coding-system-pre-write-conversion (coding-system)
  "Return CODING-SYSTEM's `:pre-write-conversion' property.
The value is fetched with `coding-system-get'."
  (coding-system-get coding-system :pre-write-conversion))
;;;###autoload
(defun coding-system-translation-table-for-decode (coding-system)
  "Return CODING-SYSTEM's `:decode-translation-table' property.
The value is fetched with `coding-system-get'."
  (coding-system-get coding-system :decode-translation-table))
;;;###autoload
(defun coding-system-translation-table-for-encode (coding-system)
  "Return CODING-SYSTEM's `:encode-translation-table' property.
The value is fetched with `coding-system-get'."
  (coding-system-get coding-system :encode-translation-table))
;;;###autoload
(defmacro with-coding-priority (coding-systems &rest body)
  "Execute BODY like `progn' with CODING-SYSTEMS at the front of priority list.
CODING-SYSTEMS is a form that evaluates to a list of coding systems;
see `set-coding-system-priority'.  The priority list in effect before
BODY ran is reinstated afterwards, even if BODY exits non-locally.
This affects the implicit sorting of lists of coding systems returned by
operations such as `find-coding-systems-region'."
  ;; An uninterned symbol holds the saved priority list so that no
  ;; variable used inside BODY can be captured by the expansion.
  (let ((saved-priorities (make-symbol "current")))
    `(let ((,saved-priorities (coding-system-priority-list)))
       (apply #'set-coding-system-priority ,coding-systems)
       (unwind-protect
           (progn ,@body)
         (apply #'set-coding-system-priority ,saved-priorities)))))
;;;###autoload(put 'with-coding-priority 'lisp-indent-function 1)
(put 'with-coding-priority 'edebug-form-spec t)
;;;###autoload
(defmacro detect-coding-with-priority (from to priority-list)
  "Detect a coding system of the text between FROM and TO with PRIORITY-LIST.
PRIORITY-LIST is an alist pairing coding categories with the
corresponding coding systems, ordered by priority.  The expansion runs
`detect-coding-region' inside `with-coding-priority', using the cdr of
each element of PRIORITY-LIST as the preferred coding systems."
  (list 'with-coding-priority
        (list 'mapcar '#'cdr priority-list)
        (list 'detect-coding-region from to)))
(make-obsolete 'detect-coding-with-priority
               "use `with-coding-priority' and `detect-coding-region'." "23.1")
;;;###autoload
(defun detect-coding-with-language-environment (from to lang-env)
  "Detect a coding system for the text between FROM and TO with LANG-ENV.
The detection takes into account the coding system priorities for the
language environment LANG-ENV.
Return nil when LANG-ENV has no `coding-priority' information."
  (let ((preferred (get-language-info lang-env 'coding-priority)))
    (and preferred
         (with-coding-priority preferred
           (detect-coding-region from to)))))
(declare-function internal-char-font "fontset.c" (position &optional ch))

;;;###autoload
(defun char-displayable-p (char)
  "Return non-nil if we should be able to display CHAR.
On a multi-font display, the test is only whether there is an
appropriate font from the selected frame's fontset to display
CHAR's charset in general.  Since fonts may be specified on a
per-character basis, this may not be accurate.
On other displays, the value is the first charset supported by the
terminal coding system that can encode CHAR, or nil if there is none."
  (cond
   ;; ASCII characters are always displayable.
   ((< char 128) t)
   ;; Maybe there's a font for it, but we can't put it in the buffer.
   ((not enable-multibyte-characters) nil)
   ;; On a window system, a character is displayable if we have a
   ;; font for that character in the default face of the currently
   ;; selected frame.
   ((display-multi-font-p)
    (car (internal-char-font nil char)))
   ;; On a terminal, a character is displayable if the coding system
   ;; for the terminal can encode it.
   (t
    (let ((coding (terminal-coding-system)))
      (when coding
        (let* ((cs-list (coding-system-get coding :charset-list))
               ;; For the symbolic values `iso-2022' and `emacs-mule',
               ;; only charsets carrying this property are considered.
               (required-prop (cond ((eq cs-list 'iso-2022) :iso-final-char)
                                    ((eq cs-list 'emacs-mule) :emacs-mule-id)))
               ;; An explicit list is used as is; the symbolic values
               ;; search the global `charset-list'; anything else
               ;; leaves nothing to search.
               (candidates (cond ((listp cs-list) cs-list)
                                 (required-prop charset-list))))
          (catch 'found
            (dolist (charset candidates)
              (when (and (or (null required-prop)
                             (plist-get (charset-plist charset) required-prop))
                         (encode-char char charset))
                (throw 'found charset)))
            nil)))))))
- (provide 'mule-util)
- ;; Local Variables:
- ;; coding: iso-2022-7bit
- ;; End:
- ;;; mule-util.el ends here
|