mirror of
git://git.sv.gnu.org/emacs.git
synced 2026-01-13 06:50:39 -08:00
`string-search` is easier to understand, less error-prone, much faster, does not pollute the regexp cache, and does not mutate global state. Use it where applicable and obviously safe (erring on the conservative side). * admin/authors.el (authors-canonical-file-name) (authors-scan-change-log): * lisp/apropos.el (apropos-command) (apropos-documentation-property, apropos-symbols-internal): * lisp/arc-mode.el (archive-arc-summarize) (archive-zoo-summarize): * lisp/calc/calc-aent.el (math-read-factor): * lisp/calc/calc-ext.el (math-read-big-expr) (math-format-nice-expr, math-format-number-fancy): * lisp/calc/calc-forms.el (math-read-angle-brackets): * lisp/calc/calc-graph.el (calc-graph-set-range): * lisp/calc/calc-keypd.el (calc-keypad-press): * lisp/calc/calc-lang.el (tex, latex, math-read-big-rec): * lisp/calc/calc-prog.el (calc-fix-token-name) (calc-user-define-permanent, math-define-exp): * lisp/calc/calc.el (calc-record, calcDigit-key) (calc-count-lines): * lisp/calc/calcalg2.el (calc-solve-for, calc-poly-roots) (math-do-integral): * lisp/calc/calcalg3.el (calc-find-root, calc-find-minimum) (calc-get-fit-variables): * lisp/cedet/ede/speedbar.el (ede-tag-expand): * lisp/cedet/semantic/java.el (semantic-java-expand-tag): * lisp/cedet/semantic/sb.el (semantic-sb-show-extra) (semantic-sb-expand-group): * lisp/cedet/semantic/wisent/python.el (semantic-python-instance-variable-p): * lisp/cus-edit.el (get): * lisp/descr-text.el (describe-text-sexp): * lisp/dired-aux.el (dired-compress-file): * lisp/dired-x.el (dired-make-relative-symlink): * lisp/dired.el (dired-glob-regexp): * lisp/dos-fns.el (dos-convert-standard-filename, dos-8+3-filename): * lisp/edmacro.el (edmacro-format-keys): * lisp/emacs-lisp/eieio-opt.el (eieio-sb-expand): * lisp/emacs-lisp/eieio-speedbar.el (eieio-speedbar-object-expand): * lisp/emacs-lisp/lisp-mnt.el (lm-keywords-list): * lisp/emacs-lisp/warnings.el (display-warning): * lisp/emulation/viper-ex.el (viper-ex-read-file-name) 
(ex-print-display-lines): * lisp/env.el (read-envvar-name, setenv): * lisp/epa-mail.el (epa-mail-encrypt): * lisp/epg.el (epg--start): * lisp/erc/erc-backend.el (erc-parse-server-response): * lisp/erc/erc-dcc.el (erc-dcc-member): * lisp/erc/erc-speedbar.el (erc-speedbar-expand-server) (erc-speedbar-expand-channel, erc-speedbar-expand-user): * lisp/erc/erc.el (erc-send-input): * lisp/eshell/em-glob.el (eshell-glob-entries): * lisp/eshell/esh-proc.el (eshell-needs-pipe-p): * lisp/eshell/esh-util.el (eshell-convert): * lisp/eshell/esh-var.el (eshell-envvar-names): * lisp/faces.el (x-resolve-font-name): * lisp/ffap.el (ffap-file-at-point): * lisp/files.el (wildcard-to-regexp, shell-quote-wildcard-pattern): * lisp/forms.el (forms--update): * lisp/frameset.el (frameset-filter-unshelve-param): * lisp/gnus/gnus-art.el (article-decode-charset): * lisp/gnus/gnus-kill.el (gnus-kill-parse-rn-kill-file): * lisp/gnus/gnus-mlspl.el (gnus-group-split-fancy): * lisp/gnus/gnus-msg.el (gnus-summary-resend-message-insert-gcc) (gnus-inews-insert-gcc): * lisp/gnus/gnus-rfc1843.el (rfc1843-decode-article-body): * lisp/gnus/gnus-search.el (gnus-search-indexed-parse-output) (gnus-search--complete-key-data): * lisp/gnus/gnus-spec.el (gnus-parse-simple-format): * lisp/gnus/gnus-sum.el (gnus-summary-refer-article): * lisp/gnus/gnus-util.el (gnus-extract-address-components) (gnus-newsgroup-directory-form): * lisp/gnus/gnus-uu.el (gnus-uu-grab-view): * lisp/gnus/gnus.el (gnus-group-native-p, gnus-short-group-name): * lisp/gnus/message.el (message-check-news-header-syntax) (message-make-message-id, message-user-mail-address) (message-make-fqdn, message-get-reply-headers, message-followup): * lisp/gnus/mm-decode.el (mm-dissect-buffer): * lisp/gnus/nnheader.el (nnheader-insert): * lisp/gnus/nnimap.el (nnimap-process-quirk) (nnimap-imap-ranges-to-gnus-ranges): * lisp/gnus/nnmaildir.el (nnmaildir--ensure-suffix): * lisp/gnus/nnmairix.el (nnmairix-determine-original-group-from-path): * 
lisp/gnus/nnrss.el (nnrss-match-macro): * lisp/gnus/nntp.el (nntp-find-group-and-number): * lisp/help-fns.el (help--symbol-completion-table-affixation): * lisp/help.el (help-function-arglist): * lisp/hippie-exp.el (he-concat-directory-file-name): * lisp/htmlfontify.el (hfy-relstub): * lisp/ido.el (ido-make-prompt, ido-complete, ido-copy-current-word) (ido-exhibit): * lisp/image/image-converter.el (image-convert-p): * lisp/info-xref.el (info-xref-docstrings): * lisp/info.el (Info-toc-build, Info-follow-reference) (Info-backward-node, Info-finder-find-node) (Info-speedbar-expand-node): * lisp/international/mule-diag.el (print-fontset-element): * lisp/language/korea-util.el (default-korean-keyboard): * lisp/linum.el (linum-after-change): * lisp/mail/ietf-drums.el (ietf-drums-parse-address): * lisp/mail/mail-utils.el (mail-dont-reply-to): * lisp/mail/rfc2047.el (rfc2047-encode-1, rfc2047-decode-string): * lisp/mail/rfc2231.el (rfc2231-parse-string): * lisp/mail/rmailkwd.el (rmail-set-label): * lisp/mail/rmailsum.el (rmail-header-summary): * lisp/mail/smtpmail.el (smtpmail-maybe-append-domain) (smtpmail-user-mail-address): * lisp/mail/uce.el (uce-reply-to-uce): * lisp/man.el (Man-default-man-entry): * lisp/mh-e/mh-alias.el (mh-alias-gecos-name) (mh-alias-minibuffer-confirm-address): * lisp/mh-e/mh-comp.el (mh-forwarded-letter-subject): * lisp/mh-e/mh-speed.el (mh-speed-parse-flists-output): * lisp/mh-e/mh-utils.el (mh-collect-folder-names-filter) (mh-folder-completion-function): * lisp/minibuffer.el (completion--make-envvar-table) (completion-file-name-table, completion-flex-try-completion) (completion-flex-all-completions): * lisp/mpc.el (mpc--proc-quote-string, mpc-cmd-special-tag-p) (mpc-constraints-tag-lookup): * lisp/net/ange-ftp.el (ange-ftp-send-cmd) (ange-ftp-allow-child-lookup): * lisp/net/mailcap.el (mailcap-mime-types): * lisp/net/mairix.el (mairix-search-thread-this-article): * lisp/net/pop3.el (pop3-open-server): * lisp/net/soap-client.el 
(soap-decode-xs-complex-type): * lisp/net/socks.el (socks-filter): * lisp/nxml/nxml-outln.el (nxml-highlighted-qname): * lisp/nxml/rng-cmpct.el (rng-c-expand-name, rng-c-expand-datatype): * lisp/nxml/rng-uri.el (rng-uri-file-name-1): * lisp/obsolete/complete.el (partial-completion-mode) (PC-do-completion): * lisp/obsolete/longlines.el (longlines-encode-string): * lisp/obsolete/nnir.el (nnir-compose-result): * lisp/obsolete/terminal.el (te-quote-arg-for-sh): * lisp/obsolete/tpu-edt.el (tpu-check-search-case): * lisp/obsolete/url-ns.el (isPlainHostName): * lisp/pcmpl-unix.el (pcomplete/scp): * lisp/play/dunnet.el (dun-listify-string2, dun-get-path) (dun-unix-parse, dun-doassign, dun-cat, dun-batch-unix-interface): * lisp/progmodes/ebnf2ps.el: (ebnf-eps-header-footer-comment): * lisp/progmodes/gdb-mi.el (gdb-var-delete) (gdb-speedbar-expand-node, gdbmi-bnf-incomplete-record-result): * lisp/progmodes/gud.el (gud-find-expr): * lisp/progmodes/idlw-help.el (idlwave-do-context-help1): * lisp/progmodes/idlw-shell.el (idlwave-shell-mode) (idlwave-shell-filter-hidden-output, idlwave-shell-filter): * lisp/progmodes/idlwave.el (idlwave-skip-label-or-case) (idlwave-routine-info): * lisp/progmodes/octave.el (inferior-octave-completion-at-point): * lisp/progmodes/sh-script.el (sh-add-completer): * lisp/progmodes/sql.el (defun): * lisp/progmodes/xscheme.el (xscheme-process-filter): * lisp/replace.el (query-replace-compile-replacement) (map-query-replace-regexp): * lisp/shell.el (shell--command-completion-data) (shell-environment-variable-completion): * lisp/simple.el (display-message-or-buffer): * lisp/speedbar.el (speedbar-dired, speedbar-tag-file) (speedbar-tag-expand): * lisp/subr.el (split-string-and-unquote): * lisp/tar-mode.el (tar-extract): * lisp/term.el (term-command-hook, serial-read-name): * lisp/textmodes/bibtex.el (bibtex-print-help-message): * lisp/textmodes/ispell.el (ispell-lookup-words, ispell-filter) (ispell-parse-output, ispell-buffer-local-parsing): * 
lisp/textmodes/reftex-cite.el (reftex-do-citation): * lisp/textmodes/reftex-parse.el (reftex-notice-new): * lisp/textmodes/reftex-ref.el (reftex-show-entry): * lisp/textmodes/reftex.el (reftex-compile-variables): * lisp/textmodes/tex-mode.el (tex-send-command) (tex-start-tex, tex-append): * lisp/thingatpt.el (thing-at-point-url-at-point): * lisp/tmm.el (tmm-add-one-shortcut): * lisp/transient.el (transient-format-key): * lisp/url/url-auth.el (url-basic-auth) (url-digest-auth-directory-id-assoc): * lisp/url/url-news.el (url-news): * lisp/url/url-util.el (url-parse-query-string): * lisp/vc/vc-cvs.el (vc-cvs-parse-entry): * lisp/wid-browse.el (widget-browse-sexp): * lisp/woman.el (woman-parse-colon-path, woman-mini-help) (WoMan-getpage-in-background, woman-negative-vertical-space): * lisp/xml.el: * test/lisp/emacs-lisp/check-declare-tests.el (check-declare-tests-warn): * test/lisp/files-tests.el (files-tests-file-name-non-special-dired-compress-handler): * test/lisp/net/network-stream-tests.el (server-process-filter): * test/src/coding-tests.el (ert-test-unibyte-buffer-dos-eol-decode): Use `string-search` instead of `string-match` and `string-match-p`.
437 lines
17 KiB
EmacsLisp
437 lines
17 KiB
EmacsLisp
;;; coding-tests.el --- tests for text encoding and decoding -*- lexical-binding: t -*-
|
||
|
||
;; Copyright (C) 2013-2021 Free Software Foundation, Inc.
|
||
|
||
;; Author: Eli Zaretskii <eliz@gnu.org>
|
||
;; Author: Kenichi Handa <handa@gnu.org>
|
||
|
||
;; This file is part of GNU Emacs.
|
||
|
||
;; GNU Emacs is free software: you can redistribute it and/or modify
|
||
;; it under the terms of the GNU General Public License as published by
|
||
;; the Free Software Foundation, either version 3 of the License, or
|
||
;; (at your option) any later version.
|
||
|
||
;; GNU Emacs is distributed in the hope that it will be useful,
|
||
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
;; GNU General Public License for more details.
|
||
|
||
;; You should have received a copy of the GNU General Public License
|
||
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
|
||
|
||
;;; Code:
|
||
|
||
(require 'ert)
|
||
|
||
;; Directory to hold test data files.
|
||
(defvar coding-tests-workdir
  (expand-file-name "coding-tests" temporary-file-directory)
  "Directory to hold test data files.
It is the \"coding-tests\" subdirectory of `temporary-file-directory'.")
|
||
|
||
;; Remove all generated test files.
|
||
(defun coding-tests-remove-files ()
  "Remove all generated test files.
Recursively delete `coding-tests-workdir'.  Do nothing when that
directory does not exist, so that calling this from the cleanup form
of an `unwind-protect' does not depend on how `delete-directory'
treats a missing directory."
  (when (file-directory-p coding-tests-workdir)
    (delete-directory coding-tests-workdir t)))
|
||
|
||
(ert-deftest ert-test-coding-bogus-coding-systems ()
  "Check that bogus coding systems signal errors on file I/O.
Reading with `coding-system-for-read' bound to the symbol `bogus',
and writing with `coding-system-for-write' bound to a symbol whose
name includes literal double quotes, must both signal an error."
  (unwind-protect
      (let (test-file)
        (or (file-directory-p coding-tests-workdir)
            (mkdir coding-tests-workdir t))
        (setq test-file (expand-file-name "nonexistent" coding-tests-workdir))
        ;; Make sure the file to read really is absent.
        (if (file-exists-p test-file)
            (delete-file test-file))
        (should-error
         (let ((coding-system-for-read 'bogus))
           (insert-file-contents test-file)))
        ;; See bug #21602.
        (setq test-file (expand-file-name "writing" coding-tests-workdir))
        (should-error
         ;; The interned symbol's name is "us-ascii" including the quotes.
         (let ((coding-system-for-write (intern "\"us-ascii\"")))
           (write-region "some text" nil test-file))))
    (coding-tests-remove-files)))
|
||
|
||
;; See issue #5251.
|
||
(ert-deftest ert-test-unibyte-buffer-dos-eol-decode ()
  "Check that decoding with `euc-jp-dos' in a unibyte buffer removes CR.
See issue #5251."
  (with-temp-buffer
    (set-buffer-multibyte nil)
    ;; EUC-JP encoded text followed by a CR LF line ending.
    (insert (encode-coding-string "あ" 'euc-jp) "\xd" "\n")
    (decode-coding-region (point-min) (point-max) 'euc-jp-dos)
    (should-not (string-search "\^M" (buffer-string)))))
|
||
|
||
;; Return the contents (specified by CONTENT-TYPE; ascii, latin, or
|
||
;; binary) of a test file.
|
||
(defun coding-tests-file-contents (content-type)
  "Return the contents of a test file of kind CONTENT-TYPE.
CONTENT-TYPE is one of the symbols `ascii', `latin' or `binary':

  `ascii'   a line of the uppercase ASCII letters;
  `latin'   the `ascii' contents plus a line of accented Latin letters;
  `binary'  the unibyte form of the `latin' contents followed by the
            bytes #xC0 #xC1 and a newline, converted back to a
            multibyte string.

Signal an error for any other CONTENT-TYPE."
  (let* ((ascii "ABCDEFGHIJKLMNOPQRSTUVWXYZ\n")
         (latin (concat ascii "ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏ\n"))
         (binary (string-to-multibyte
                  (concat (string-as-unibyte latin)
                          (unibyte-string #xC0 #xC1 ?\n)))))
    (cond ((eq content-type 'ascii) ascii)
          ((eq content-type 'latin) latin)
          ((eq content-type 'binary) binary)
          (t
           (error "Invalid file content type: %s" content-type)))))
|
||
|
||
;; Generate FILE with CONTENTS encoded by CODING-SYSTEM.
|
||
(defun coding-tests-gen-file (file contents coding-system)
  "Generate FILE with CONTENTS encoded by CODING-SYSTEM.
FILE is expanded relative to `coding-tests-workdir', which is created
first if it does not exist yet.  Return the expanded file name."
  (or (file-directory-p coding-tests-workdir)
      (mkdir coding-tests-workdir t))
  (setq file (expand-file-name file coding-tests-workdir))
  (with-temp-file file
    ;; Set the coding system the temporary buffer is written out with.
    (set-buffer-file-coding-system coding-system)
    (insert contents))
  file)
|
||
|
||
;;; The following three functions are filters for contents of a test
|
||
;;; file.
|
||
|
||
;; Convert all LFs to CR LF sequences in the string STR.
|
||
(defun coding-tests-lf-to-crlf (str)
  "Return a copy of STR with every LF replaced by a CR LF sequence."
  (with-temp-buffer
    (insert str)
    (goto-char (point-min))
    (while (search-forward "\n" nil t)
      ;; Point is just after the LF: drop it and insert CR LF instead.
      (delete-char -1)
      (insert "\r\n"))
    (buffer-string)))
|
||
|
||
;; Convert all LFs to CRs in the string STR.
|
||
(defun coding-tests-lf-to-cr (str)
  "Return a copy of STR with every LF replaced by a CR."
  (with-temp-buffer
    (insert str)
    (subst-char-in-region (point-min) (point-max) ?\n ?\r)
    (buffer-string)))
|
||
|
||
;; Convert all LFs to LF LF sequences in the string STR.
|
||
(defun coding-tests-lf-to-lflf (str)
  "Return a copy of STR with every LF replaced by an LF LF sequence."
  (with-temp-buffer
    (insert str)
    (goto-char (point-min))
    (while (search-forward "\n" nil t)
      ;; Point ends up after the inserted LF, so it is not matched again.
      (insert "\n"))
    (buffer-string)))
|
||
|
||
;; Prepend the UTF-8 BOM to STR.
|
||
(defun coding-tests-add-bom (str)
  "Return STR with the byte order mark character U+FEFF prepended."
  (concat "\xfeff" str))
|
||
|
||
;; Return the name of the test file whose contents are specified by
;; CONTENT-TYPE and whose encoding is specified by CODING-SYSTEM.
|
||
(defun coding-tests-filename (content-type coding-system &optional ext)
  "Return the absolute name of a test file in `coding-tests-workdir'.
The base name is \"CONTENT-TYPE-CODING-SYSTEM\"; when EXT is non-nil,
\".EXT\" is appended as the file extension."
  (expand-file-name
   (if ext
       (format "%s-%s.%s" content-type coding-system ext)
     (format "%s-%s" content-type coding-system))
   coding-tests-workdir))
|
||
|
||
|
||
;;; Check ASCII optimizing decoder
|
||
|
||
;; Generate a test file whose contents are specified by CONTENT-TYPE
;; and whose encoding is specified by CODING-SYSTEM.
|
||
(defun coding-tests-ao-gen-file (content-type coding-system)
  "Generate a test file for CONTENT-TYPE encoded by CODING-SYSTEM.
The file is named by `coding-tests-filename', filled with the result
of `coding-tests-file-contents' and written by `coding-tests-gen-file',
whose return value is returned."
  (let ((file (coding-tests-filename content-type coding-system)))
    (coding-tests-gen-file file
                           (coding-tests-file-contents content-type)
                           coding-system)))
|
||
|
||
;; Test the decoding of a file whose contents and encoding are
|
||
;; specified by CONTENT-TYPE and WRITE-CODING. The test passes if the
|
||
;; file is read by READ-CODING and detected as DETECTED-CODING and the
|
||
;; contents is correctly decoded.
|
||
;; Optional 5th arg TRANSLATOR is a function to translate the original
|
||
;; file contents to match with the expected result of decoding. For
|
||
;; instance, when a file of dos eol-type is read by unix eol-type,
|
||
;; `coding-tests-lf-to-crlf' must be specified.
|
||
|
||
(defun coding-tests (content-type write-coding read-coding detected-coding
                                  &optional translator)
  "Test decoding of the file given by CONTENT-TYPE and WRITE-CODING.
The file is read with `coding-system-for-read' bound to READ-CODING.
The check passes if `buffer-file-coding-system' is then equal to
DETECTED-CODING and the buffer text matches the expected contents.

Optional argument TRANSLATOR is a function applied to the original
file contents to obtain the expected result of decoding.  For
instance, when a file of dos eol-type is read by unix eol-type,
`coding-tests-lf-to-crlf' must be specified.

Return nil on success.  On failure return a list of the detected
coding system, the buffer text as a list of characters, and the
expected text as a list of characters."
  ;; NOTE(review): this changes the global coding-system preference and
  ;; does not restore it afterwards.
  (prefer-coding-system 'utf-8-auto)
  (let ((filename (coding-tests-filename content-type write-coding)))
    (with-temp-buffer
      (let ((coding-system-for-read read-coding)
            (contents (coding-tests-file-contents content-type))
            (disable-ascii-optimization nil))
        (if translator
            (setq contents (funcall translator contents)))
        (insert-file-contents filename)
        (if (and (coding-system-equal buffer-file-coding-system detected-coding)
                 (string= (buffer-string) contents))
            nil
          (list buffer-file-coding-system
                (string-to-list (buffer-string))
                (string-to-list contents)))))))
|
||
|
||
(ert-deftest ert-test-coding-ascii ()
  "Check decoding of ASCII files written with each EOL type."
  (unwind-protect
      (progn
        (dolist (eol-type '(unix dos mac))
          (coding-tests-ao-gen-file 'ascii eol-type))
        (should-not (coding-tests 'ascii 'unix 'undecided 'unix))
        (should-not (coding-tests 'ascii 'dos 'undecided 'dos))
        (should-not (coding-tests 'ascii 'dos 'dos 'dos))
        (should-not (coding-tests 'ascii 'mac 'undecided 'mac))
        (should-not (coding-tests 'ascii 'mac 'mac 'mac))
        (should-not (coding-tests 'ascii 'dos 'utf-8 'utf-8-dos))
        ;; Reading with a mismatched EOL type: the expected text is the
        ;; original contents passed through the given translator.
        (should-not (coding-tests 'ascii 'dos 'unix 'unix
                                  'coding-tests-lf-to-crlf))
        (should-not (coding-tests 'ascii 'mac 'dos 'dos
                                  'coding-tests-lf-to-cr))
        (should-not (coding-tests 'ascii 'dos 'mac 'mac
                                  'coding-tests-lf-to-lflf)))
    (coding-tests-remove-files)))
|
||
|
||
(ert-deftest ert-test-coding-latin ()
  "Check decoding of Latin files written as UTF-8, with and without BOM."
  (unwind-protect
      (progn
        ;; Generate one file per combination of encoding and EOL type.
        (dolist (coding '("utf-8" "utf-8-with-signature"))
          (dolist (eol-type '("unix" "dos" "mac"))
            (coding-tests-ao-gen-file 'latin
                                      (intern (concat coding "-" eol-type)))))
        (should-not (coding-tests 'latin 'utf-8-unix 'undecided 'utf-8-unix))
        (should-not (coding-tests 'latin 'utf-8-unix 'utf-8-unix 'utf-8-unix))
        (should-not (coding-tests 'latin 'utf-8-dos 'undecided 'utf-8-dos))
        (should-not (coding-tests 'latin 'utf-8-dos 'utf-8-dos 'utf-8-dos))
        (should-not (coding-tests 'latin 'utf-8-mac 'undecided 'utf-8-mac))
        (should-not (coding-tests 'latin 'utf-8-mac 'utf-8-mac 'utf-8-mac))
        ;; Reading with a mismatched EOL type: the expected text is the
        ;; original contents passed through the given translator.
        (should-not (coding-tests 'latin 'utf-8-dos 'unix 'utf-8-unix
                                  'coding-tests-lf-to-crlf))
        (should-not (coding-tests 'latin 'utf-8-mac 'dos 'utf-8-dos
                                  'coding-tests-lf-to-cr))
        (should-not (coding-tests 'latin 'utf-8-dos 'mac 'utf-8-mac
                                  'coding-tests-lf-to-lflf))
        (should-not (coding-tests 'latin 'utf-8-with-signature-unix 'undecided
                                  'utf-8-with-signature-unix))
        (should-not (coding-tests 'latin 'utf-8-with-signature-unix 'utf-8-auto
                                  'utf-8-with-signature-unix))
        (should-not (coding-tests 'latin 'utf-8-with-signature-dos 'undecided
                                  'utf-8-with-signature-dos))
        ;; Reading a file with signature as plain utf-8: the expected
        ;; text is the original contents with U+FEFF prepended.
        (should-not (coding-tests 'latin 'utf-8-with-signature-unix 'utf-8
                                  'utf-8-unix 'coding-tests-add-bom)))
    (coding-tests-remove-files)))
|
||
|
||
(ert-deftest ert-test-coding-binary ()
  "Check decoding of binary files written as raw-text with each EOL type."
  (unwind-protect
      (progn
        (dolist (eol-type '("unix" "dos" "mac"))
          (coding-tests-ao-gen-file 'binary
                                    (intern (concat "raw-text" "-" eol-type))))
        (should-not (coding-tests 'binary 'raw-text-unix 'undecided
                                  'raw-text-unix))
        (should-not (coding-tests 'binary 'raw-text-dos 'undecided
                                  'raw-text-dos))
        (should-not (coding-tests 'binary 'raw-text-mac 'undecided
                                  'raw-text-mac))
        ;; Reading with a mismatched EOL type: the expected text is the
        ;; original contents passed through the given translator.
        (should-not (coding-tests 'binary 'raw-text-dos 'unix
                                  'raw-text-unix 'coding-tests-lf-to-crlf))
        (should-not (coding-tests 'binary 'raw-text-mac 'dos
                                  'raw-text-dos 'coding-tests-lf-to-cr))
        (should-not (coding-tests 'binary 'raw-text-dos 'mac
                                  'raw-text-mac 'coding-tests-lf-to-lflf)))
    (coding-tests-remove-files)))
|
||
|
||
|
||
;;; Check the coding system `prefer-utf-8'.
|
||
|
||
;; Read FILE. Check if the encoding was detected as DETECT. If
|
||
;; PREFER is non-nil, prefer that coding system before reading.
|
||
|
||
(defun coding-tests-prefer-utf-8-read (file detect prefer)
  "Read FILE and check that its encoding was detected as DETECT.
If PREFER is non-nil, read FILE with that coding system given
priority via `with-coding-priority'.

Return nil if `buffer-file-coding-system' is `eq' to DETECT after
reading; otherwise return a string describing the detected coding
system."
  (with-temp-buffer
    (with-coding-priority (if prefer (list prefer))
      (insert-file-contents file))
    (if (eq buffer-file-coding-system detect)
        nil
      (format "Invalid detection: %s" buffer-file-coding-system))))
|
||
|
||
;; Read FILE, modify it, and write it. Check if the coding system
|
||
;; used for writing was CODING. If CODING-TAG is non-nil, insert
|
||
;; coding tag with it before writing. If STR is non-nil, insert it
|
||
;; before writing.
|
||
|
||
(defun coding-tests-prefer-utf-8-write (file coding-tag coding
                                             &optional str)
  "Read FILE, modify it, write it, and check the coding system used.
If CODING-TAG is non-nil, insert a coding tag naming it at the start
of the buffer before writing; otherwise insert a plain comment line.
If STR is non-nil, insert it after that line before writing.  The
buffer is written to the file named by
\(coding-tests-filename \\='test \\='test \"el\").

Return nil if `buffer-file-coding-system' after writing is equal to
CODING; otherwise return a string naming the coding system found."
  (with-temp-buffer
    (insert-file-contents file)
    (goto-char (point-min))
    (if coding-tag
        (insert (format ";; -*- coding: %s; -*-\n" coding-tag))
      (insert ";;\n"))
    (if str
        (insert str))
    (write-file (coding-tests-filename 'test 'test "el"))
    (if (coding-system-equal buffer-file-coding-system coding)
        nil
      ;; Report the value that was actually compared against CODING.
      (format "Incorrect encoding: %s" buffer-file-coding-system))))
|
||
|
||
(ert-deftest ert-test-coding-prefer-utf-8 ()
  "Check detection and writing behavior of the `prefer-utf-8' coding system."
  (unwind-protect
      (let ((ascii (coding-tests-gen-file "ascii.el"
                                          (coding-tests-file-contents 'ascii)
                                          'unix))
            (latin (coding-tests-gen-file "utf-8.el"
                                          (coding-tests-file-contents 'latin)
                                          'utf-8-unix)))
        ;; Detection when reading.
        (should-not (coding-tests-prefer-utf-8-read
                     ascii 'prefer-utf-8-unix nil))
        (should-not (coding-tests-prefer-utf-8-read
                     latin 'utf-8-unix nil))
        (should-not (coding-tests-prefer-utf-8-read
                     latin 'utf-8-unix 'iso-8859-1))
        (should-not (coding-tests-prefer-utf-8-read
                     latin 'utf-8-unix 'sjis))
        ;; Coding system chosen when writing.
        (should-not (coding-tests-prefer-utf-8-write
                     ascii nil 'prefer-utf-8-unix))
        (should-not (coding-tests-prefer-utf-8-write
                     ascii 'iso-8859-1 'iso-8859-1-unix))
        (should-not (coding-tests-prefer-utf-8-write
                     ascii nil 'utf-8-unix "À")))
    (coding-tests-remove-files)))
|
||
|
||
|
||
;;; The following is for benchmark testing of the new optimized
|
||
;;; decoder, not for regression testing.
|
||
|
||
(defun generate-ascii-file ()
  "Insert 100000 lines of 80 `a' characters into the current buffer."
  (dotimes (_i 100000)
    (insert-char ?a 80)
    (insert "\n")))
|
||
|
||
(defun generate-rarely-nonascii-file ()
  "Insert 100000 lines of 80 characters into the current buffer.
Every line consists of `a' characters, except that the line inserted
at loop index 50000 starts with a single `À'."
  (dotimes (i 100000)
    (if (/= i 50000)
        (insert-char ?a 80)
      ;; The one non-ASCII line: `À' followed by 79 `a's.
      (insert ?À)
      (insert-char ?a 79))
    (insert "\n")))
|
||
|
||
(defun generate-mostly-nonascii-file ()
  "Insert 60000 lines of 80 characters into the current buffer.
The first 30000 lines consist of `a', the next 20000 of `À', and the
last 10000 of `あ'."
  (dotimes (_i 30000)
    (insert-char ?a 80)
    (insert "\n"))
  (dotimes (_i 20000)
    (insert-char ?À 80)
    (insert "\n"))
  (dotimes (_i 10000)
    (insert-char ?あ 80)
    (insert "\n")))
|
||
|
||
|
||
(defvar test-file-list
  '((generate-ascii-file
     ("~/ascii-tag-utf-8-unix.unix" ";; -*- coding: utf-8-unix; -*-" unix)
     ("~/ascii-tag-utf-8.unix" ";; -*- coding: utf-8; -*-" unix)
     ("~/ascii-tag-none.unix" "" unix)
     ("~/ascii-tag-utf-8-dos.dos" ";; -*- coding: utf-8-dos; -*-" dos)
     ("~/ascii-tag-utf-8.dos" ";; -*- coding: utf-8; -*-" dos)
     ("~/ascii-tag-none.dos" "" dos))
    (generate-rarely-nonascii-file
     ("~/utf-8-r-tag-utf-8-unix.unix" ";; -*- coding: utf-8-unix; -*-" utf-8-unix)
     ("~/utf-8-r-tag-utf-8.unix" ";; -*- coding: utf-8; -*-" utf-8-unix)
     ("~/utf-8-r-tag-none.unix" "" utf-8-unix)
     ("~/utf-8-r-tag-utf-8-dos.dos" ";; -*- coding: utf-8-dos; -*-" utf-8-dos)
     ("~/utf-8-r-tag-utf-8.dos" ";; -*- coding: utf-8; -*-" utf-8-dos)
     ("~/utf-8-r-tag-none.dos" "" utf-8-dos))
    (generate-mostly-nonascii-file
     ("~/utf-8-m-tag-utf-8-unix.unix" ";; -*- coding: utf-8-unix; -*-" utf-8-unix)
     ("~/utf-8-m-tag-utf-8.unix" ";; -*- coding: utf-8; -*-" utf-8-unix)
     ("~/utf-8-m-tag-none.unix" "" utf-8-unix)
     ("~/utf-8-m-tag-utf-8-dos.dos" ";; -*- coding: utf-8-dos; -*-" utf-8-dos)
     ("~/utf-8-m-tag-utf-8.dos" ";; -*- coding: utf-8; -*-" utf-8-dos)
     ("~/utf-8-m-tag-none.dos" "" utf-8-dos)))
  "Benchmark data files, grouped by the function generating their text.
Each element has the form (GENERATOR FILE-SPEC...), where GENERATOR
is a function that inserts the text into the current buffer and each
FILE-SPEC is a list (FILE-NAME FIRST-LINE CODING-SYSTEM): the file to
write, the first line to put in it (a coding tag or the empty
string), and the coding system to write it with.")
|
||
|
||
(defun generate-benchmark-test-file ()
  "Write the benchmark data files described by `test-file-list'.
For each group, generate the text once with the group's generator
function, then write one file per file spec, with the spec's first
line put at the top and the spec's coding system bound to
`coding-system-for-write'."
  (interactive)
  (with-temp-buffer
    (message "Generating data...")
    (dolist (files test-file-list)
      (delete-region (point-min) (point-max))
      (funcall (car files))
      (dolist (file (cdr files))
        (message "Writing %s..." (car file))
        (goto-char (point-min))
        (insert (nth 1 file) "\n")
        (let ((coding-system-for-write (nth 2 file)))
          (write-region (point-min) (point-max) (car file)))
        ;; Remove the first line again so the next spec starts from the
        ;; bare generated text.
        (delete-region (point-min) (point))))))
|
||
|
||
(defun benchmark-decoder ()
  "Benchmark reading the files in `test-file-list'; insert the results.
Each file is read 10 times with `insert-file-contents' in a temporary
buffer, first with `disable-ascii-optimization' bound to t and then
with it bound to nil.  A heading and one \"FILE: RESULT\" line per
file are inserted into the current buffer for each pass, where RESULT
is the value returned by `benchmark-run'."
  (let ((gc-cons-threshold (max gc-cons-threshold 4000000)))
    ;; Each pass is (HEADING . value for `disable-ascii-optimization').
    (dolist (pass '(("Without optimization:\n" . t)
                    ("With optimization:\n" . nil)))
      (insert (car pass))
      (let ((disable-ascii-optimization (cdr pass)))
        (dolist (files test-file-list)
          (dolist (file (cdr files))
            (let ((result (benchmark-run 10
                            (with-temp-buffer
                              (insert-file-contents (car file))))))
              (insert (format "%s: %s\n" (car file) result)))))))))
|
||
|
||
(ert-deftest coding-nocopy-trivial ()
  "Check that the NOCOPY parameter works for the trivial coding system."
  (let ((s "abc"))
    ;; Without NOCOPY the result must be a fresh string; with NOCOPY the
    ;; argument itself may be returned.
    (should-not (eq (decode-coding-string s nil nil) s))
    (should (eq (decode-coding-string s nil t) s))
    (should-not (eq (encode-coding-string s nil nil) s))
    (should (eq (encode-coding-string s nil t) s))))
|
||
|
||
(ert-deftest coding-nocopy-ascii ()
  "Check that the NOCOPY parameter works for ASCII-only strings."
  (let* ((uni (apply #'string (number-sequence 0 127)))
         (multi (string-to-multibyte uni)))
    (dolist (s (list uni multi))
      ;; Encodings without EOL conversion.
      (dolist (coding '(us-ascii-unix iso-latin-1-unix utf-8-unix))
        (should-not (eq (decode-coding-string s coding nil) s))
        (should-not (eq (encode-coding-string s coding nil) s))
        (should (eq (decode-coding-string s coding t) s))
        (should (eq (encode-coding-string s coding t) s))
        (should (eq last-coding-system-used coding)))

      ;; With EOL conversion inhibited.
      (let ((inhibit-eol-conversion t))
        (dolist (coding '(us-ascii iso-latin-1 utf-8))
          (should-not (eq (decode-coding-string s coding nil) s))
          (should-not (eq (encode-coding-string s coding nil) s))
          (should (eq (decode-coding-string s coding t) s))
          (should (eq (encode-coding-string s coding t) s))))))

  ;; Check identity decoding with EOL conversion for ASCII except CR.
  (let* ((uni (apply #'string (delq ?\r (number-sequence 0 127))))
         (multi (string-to-multibyte uni)))
    (dolist (s (list uni multi))
      (dolist (coding '(us-ascii-dos iso-latin-1-dos utf-8-dos mac-roman-mac))
        (should-not (eq (decode-coding-string s coding nil) s))
        (should (eq (decode-coding-string s coding t) s)))))

  ;; Check identity encoding with EOL conversion for ASCII except LF.
  (let* ((uni (apply #'string (delq ?\n (number-sequence 0 127))))
         (multi (string-to-multibyte uni)))
    (dolist (s (list uni multi))
      (dolist (coding '(us-ascii-dos iso-latin-1-dos utf-8-dos mac-roman-mac))
        (should-not (eq (encode-coding-string s coding nil) s))
        (should (eq (encode-coding-string s coding t) s))))))
|
||
|
||
|
||
(ert-deftest coding-check-coding-systems-region ()
  "Check the return value and errors of `check-coding-systems-region'."
  (should (equal (check-coding-systems-region "aå" nil '(utf-8))
                 nil))
  (should (equal (check-coding-systems-region "aåbγc" nil
                                              '(utf-8 iso-latin-1 us-ascii))
                 '((iso-latin-1 3) (us-ascii 1 3))))
  (should-error (check-coding-systems-region "å" nil '(bad-coding-system))))
|
||
|
||
;; Local Variables:
;; byte-compile-warnings: (not obsolete)
;; End:
|
||
|
||
(provide 'coding-tests)
|
||
;;; coding-tests.el ends here
|