;;; mule-tests.el --- unit tests for mule.el -*- lexical-binding: t; -*-
;; Copyright (C) 2017-2023 Free Software Foundation, Inc.
;; This file is part of GNU Emacs.
;; GNU Emacs is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see .
;;; Commentary:
;; Unit tests for lisp/international/mule.el.
;;; Code:
(require 'ert-x) ;For `ert-simulate-keys'.
(ert-deftest find-auto-coding--bug27391 ()
"Check that Bug#27391 is fixed."
(with-temp-buffer
(insert "\n[comment]: # ( Local Variables: )\n"
"[comment]: # ( coding: utf-8 )\n"
"[comment]: # ( End: )\n")
(goto-char (point-min))
(should (equal (let ((auto-coding-alist ())
(auto-coding-regexp-alist ())
(auto-coding-functions ()))
(find-auto-coding "" (buffer-size)))
'(utf-8 . :coding)))))
(ert-deftest mule-cmds-tests--encode-ebcdic ()
(should (equal (encode-coding-char ?a 'ebcdic-int) "\201"))
(should (not (multibyte-string-p (encode-coding-char ?a 'utf-8)))))
(ert-deftest mule-cmds--test-universal-coding-system-argument ()
(should (equal "ccccccccccccccccab"
(let ((enable-recursive-minibuffers t))
(ert-simulate-keys
(kbd "C-x RET c u t f - 8 RET C-u C-u c a b RET")
(read-string "prompt:"))))))
;;Bug#65997, ensure that old-names haven't overriden new names.
(ert-deftest mule-cmds-tests--ucs-names-old-name-override ()
(let (code-points)
(dotimes (u (1+ (max-char 'ucs)))
(when-let* ((name (get-char-code-property u 'name))
(c (char-from-name name)))
(when (and (not (<= #xD800 u #xDFFF))
(not (= c u)))
(push (format "%X" u) code-points))))
(setq code-points (nreverse code-points))
(should (null code-points))))
;; Bug#65997, ensure that all codepoints with names are in '(ucs-names)'.
(ert-deftest mule-cmds-tests--ucs-names-missing-names ()
(let (code-points)
(dotimes (u (1+ (max-char 'ucs)))
(when-let ((name (get-char-code-property u 'name)))
(when (and (not (<= #xD800 u #xDFFF))
(not (<= #x18800 u #x18AFF))
(not (char-from-name name)))
(push (format "%X" u) code-points))))
(setq code-points (nreverse code-points))
(should (null code-points))))
(ert-deftest mule-utf-7 ()
;; utf-7 and utf-7-imap are not ASCII-compatible.
(should-not (coding-system-get 'utf-7 :ascii-compatible-p))
(should-not (coding-system-get 'utf-7-imap :ascii-compatible-p))
;; Invariant ASCII subset.
(let ((s (apply #'string (append (number-sequence #x20 #x25)
(number-sequence #x27 #x7e)))))
(should (equal (encode-coding-string s 'utf-7-imap) s))
(should (equal (decode-coding-string s 'utf-7-imap) s)))
;; Escaped ampersand.
(should (equal (encode-coding-string "a&bcd" 'utf-7-imap) "a&-bcd"))
(should (equal (decode-coding-string "a&-bcd" 'utf-7-imap) "a&bcd"))
;; Ability to encode Unicode.
(should (equal (check-coding-systems-region "あ" nil '(utf-7-imap)) nil))
(should (equal (encode-coding-string "あ" 'utf-7-imap) "&MEI-"))
(should (equal (decode-coding-string "&MEI-" 'utf-7-imap) "あ")))
(ert-deftest mule-hz ()
;; The chinese-hz encoding is not ASCII compatible.
(should-not (coding-system-get 'chinese-hz :ascii-compatible-p)))
;;; Testing `sgml-html-meta-auto-coding-function'.
(defconst sgml-html-meta-pre "
"
"The beginning of a minimal HTML document.")
(defconst sgml-html-meta-post ""
"The end of a minimal HTML document.")
(defun sgml-html-meta-run (coding-system)
"Run `sgml-html-meta-auto-coding-function' on a minimal HTML.
When CODING-SYSTEM is not nil, insert it, wrapped in a ''
element. When CODING-SYSTEM contains HTML meta characters or
white space, insert it as-is, without additional formatting. Use
the variables `sgml-html-meta-pre' and `sgml-html-meta-post' to
provide HTML fragments. Some tests override those variables."
(with-temp-buffer
(insert sgml-html-meta-pre
(cond ((not coding-system)
"")
((string-match "[<>'\"\n ]" coding-system)
coding-system)
(t
(format "" coding-system)))
sgml-html-meta-post)
(goto-char (point-min))
(sgml-html-meta-auto-coding-function (- (point-max) (point-min)))))
(ert-deftest sgml-html-meta-utf-8 ()
"Baseline: UTF-8."
(should (eq 'utf-8 (coding-system-base (sgml-html-meta-run "utf-8")))))
(ert-deftest sgml-html-meta-windows-hebrew ()
"A non-Unicode charset."
(should (eq 'windows-1255 (sgml-html-meta-run "windows-1255"))))
(ert-deftest sgml-html-meta-none ()
(should (eq nil (sgml-html-meta-run nil))))
(ert-deftest sgml-html-meta-unknown-coding ()
(should (eq nil (sgml-html-meta-run "XXX"))))
(ert-deftest sgml-html-meta-no-pre ()
"Without the prefix, so not HTML."
(let ((sgml-html-meta-pre ""))
(should (eq nil (sgml-html-meta-run "utf-8")))))
(ert-deftest sgml-html-meta-no-post-less-than-10lines ()
"No '', detect charset in the first 10 lines."
(let ((sgml-html-meta-post ""))
(should (eq 'utf-8 (coding-system-base
(sgml-html-meta-run
(concat "\n\n\n\n\n\n\n\n\n"
"")))))))
(ert-deftest sgml-html-meta-no-post-10lines ()
"No '', do not detect charset after the first 10 lines."
(let ((sgml-html-meta-post ""))
(should (eq nil (sgml-html-meta-run
(concat "\n\n\n\n\n\n\n\n\n\n"
""))))))
(ert-deftest sgml-html-meta-utf-8-with-bom ()
"Requesting 'UTF-8' does not override `utf-8-with-signature'.
Check fix for Bug#20623."
(let ((buffer-file-coding-system 'utf-8-with-signature))
(should (eq 'utf-8-with-signature (sgml-html-meta-run "utf-8")))))
;; Stop "Local Variables" above causing confusion when visiting this file.
;;; mule-tests.el ends here