emacs/lisp/mail/ietf-drums.el

322 lines
9.6 KiB
EmacsLisp
Raw Normal View History

;;; ietf-drums.el --- Functions for parsing RFC 2822 headers -*- lexical-binding:t -*-
2005-08-06 19:51:42 +00:00
;; Copyright (C) 1998-2020 Free Software Foundation, Inc.
2000-09-19 13:40:08 +00:00
;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
;; This file is part of GNU Emacs.
;; GNU Emacs is free software: you can redistribute it and/or modify
2000-09-19 13:40:08 +00:00
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
2000-09-19 13:40:08 +00:00
;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
2000-09-19 13:40:08 +00:00
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
2000-09-19 13:40:08 +00:00
;;; Commentary:
;; DRUMS is an IETF Working Group that worked on Internet RFC 2822,
;; the successor to RFC 822 and the predecessor of RFC 5322. This
;; library is based on draft-ietf-drums-msg-fmt-05.txt, released on
;; 1998-08-05.
2000-09-19 13:40:08 +00:00
;; Pending a real regression self test suite, Simon Josefsson added
;; various self test expressions snipped from bug reports, and their
;; expected value, below.  If you believe it could be useful, please
;; add your own test cases, or write a real self test suite, or just
;; remove this.
;; <m3oekvfd50.fsf@whitebox.m5r.de>
;; (ietf-drums-parse-address "'foo' <foo@example.com>")
;; => ("foo@example.com" . "'foo'")
2000-09-19 13:40:08 +00:00
;;; Code:
(eval-when-compile (require 'cl-lib))
2000-09-19 13:40:08 +00:00
;; Character-set tokens.  Several of these are spliced between "[" and
;; "]" elsewhere in this file to build regexps, so "X-Y" inside a value
;; denotes a character range and a leading "-" is a literal hyphen.

(defvar ietf-drums-no-ws-ctl-token "\001-\010\013\014\016-\037\177"
  "US-ASCII control characters excluding CR, LF and white space.")

(defvar ietf-drums-text-token "\001-\011\013\014\016-\177"
  "US-ASCII characters excluding CR and LF.")

(defvar ietf-drums-specials-token "()<>[]:;@\\,.\""
  "Special characters.")

(defvar ietf-drums-quote-token "\\"
  "Quote character.")

(defvar ietf-drums-wsp-token " \t"
  "White space.")

(defvar ietf-drums-fws-regexp
  ;; Optional white space, a newline, then at least one white space
  ;; character on the continuation line.
  (concat "[" ietf-drums-wsp-token "]*\n[" ietf-drums-wsp-token "]+")
  "Folding white space.")

(defvar ietf-drums-atext-token "-^a-zA-Z0-9!#$%&'*+/=?_`{|}~"
  "Textual token.")

(defvar ietf-drums-dot-atext-token "-^a-zA-Z0-9!#$%&'*+/=?_`{|}~."
  "Textual token including full stop.")

(defvar ietf-drums-qtext-token
  ;; \041 is "!", \043-\133 runs from "#" to "[", \135-\177 from "]" to
  ;; DEL; space (\040), doublequote (\042) and backslash (\134) are
  ;; therefore left out.
  (concat ietf-drums-no-ws-ctl-token "\041\043-\133\135-\177")
  "Non-white-space control characters plus the rest of ASCII.
Space, backslash and doublequote are excluded.")

(defvar ietf-drums-tspecials "][()<>@,;:\\\"/?="
  "Tspecials.")
(defvar ietf-drums-syntax-table
  (let ((table (copy-syntax-table emacs-lisp-mode-syntax-table)))
    ;; Each entry is (CHAR . SYNTAX-DESCRIPTOR), applied on top of a
    ;; copy of the Emacs Lisp syntax table.
    (dolist (entry '((?\\ . "/")        ; character quote
                     (?<  . "(")        ; angle brackets act as parens,
                     (?>  . ")")        ; so `forward-sexp' skips <...>
                     (?@  . "w")        ; word constituent
                     (?/  . "w")        ; word constituent
                     (?*  . "_")        ; symbol constituent
                     (?\; . "_")        ; symbol constituent
                     (?\' . "_")))      ; symbol constituent
      (modify-syntax-entry (car entry) (cdr entry) table))
    table)
  "Syntax table used by the ietf-drums parsing functions.
It is a modified copy of `emacs-lisp-mode-syntax-table' and is
installed in the parsing buffer by `ietf-drums-init'.")
(defun ietf-drums-token-to-list (token)
  "Translate TOKEN into a list of characters.
TOKEN is a string in which \"X-Y\" stands for every character from
X to Y inclusive and any other character stands for itself.  A
hyphen is literal when it starts a group (for instance as the
first character of TOKEN) or when nothing follows it.  A range
whose end sorts before its start contributes no characters.

The characters are returned in order of appearance; an empty
TOKEN yields nil."
  (let ((len (length token))
        (i 0)
        out)
    (while (< i len)
      (let ((from (aref token i)))
        (if (and (not (eq from ?-))
                 (< (+ i 2) len)
                 (eq (aref token (1+ i)) ?-))
            ;; FROM-TO range: emit every character in it and step over
            ;; all three token characters, so that nothing is left
            ;; pending once the range is done.
            (let ((to (aref token (+ i 2))))
              (while (<= from to)
                (push (make-char 'ascii from) out)
                (cl-incf from))
              (setq i (+ i 3)))
          ;; Plain character (including a literal hyphen): emit it
          ;; immediately, so the final characters are never dropped.
          (push (make-char 'ascii from) out)
          (cl-incf i))))
    (nreverse out)))
(defsubst ietf-drums-init (string)
  "Set up the current buffer for parsing STRING.
Insert STRING at point, install `ietf-drums-syntax-table' as the
buffer's syntax table, unfold folding white space with
`ietf-drums-unfold-fws', and leave point at the beginning of the
buffer."
  (insert string)
  (set-syntax-table ietf-drums-syntax-table)
  (ietf-drums-unfold-fws)
  (goto-char (point-min)))
(defun ietf-drums-remove-comments (string)
  "Remove comments from STRING.
A comment is a parenthesized group found outside a quoted string.
Quoted strings are skipped untouched.  An unterminated quoted
string ends the scan; an unterminated comment is deleted through
the end of the text.  Return the resulting string."
  (with-temp-buffer
    (ietf-drums-init string)
    ;; Inside a comment a double quote is only a word constituent, so a
    ;; stray quote cannot stop `forward-sexp' from finding the closing
    ;; parenthesis.  The table is the same for every comment, so build
    ;; it once rather than on each iteration.
    (let ((comment-table (copy-syntax-table ietf-drums-syntax-table))
          c)
      (modify-syntax-entry ?\" "w" comment-table)
      (while (not (eobp))
        (setq c (char-after))
        (cond
         ((eq c ?\")
          ;; Skip the quoted string; if it is unterminated, stop.
          (condition-case nil
              (forward-sexp 1)
            (error (goto-char (point-max)))))
         ((eq c ?\()
          ;; Delete from the opening parenthesis to the matching close,
          ;; or to the end of the buffer if there is no match.
          (delete-region
           (point)
           (condition-case nil
               (with-syntax-table comment-table
                 (forward-sexp 1)
                 (point))
             (error (point-max)))))
         (t
          (forward-char 1))))
      (buffer-string))))
(defun ietf-drums-remove-whitespace (string)
  "Remove whitespace from STRING.
Space, tab, newline and carriage return characters are deleted,
except inside quoted strings and parenthesized comments, which
are skipped over with `forward-sexp' and left intact.  Errors
signaled by `forward-sexp' (for instance on an unbalanced quote
or parenthesis) are not caught here.  Return the resulting
string."
  (with-temp-buffer
    (ietf-drums-init string)
    (let (c)
      (while (not (eobp))
        (setq c (char-after))
        (cond
         ;; Quoted strings and comments keep their white space.
         ((memq c '(?\" ?\())
          (forward-sexp 1))
         ((memq c '(?\s ?\t ?\n ?\r))
          (delete-char 1))
         (t
          (forward-char 1))))
      (buffer-string))))
(defun ietf-drums-get-comment (string)
  "Return the text of a parenthesized comment in STRING, or nil.
Quoted strings are skipped.  The enclosing parentheses are not
part of the returned text.  The whole of STRING is scanned and
each comment found replaces the previous one, so when STRING
holds several comments the last one is returned."
  (with-temp-buffer
    (ietf-drums-init string)
    (let (comment)
      (while (not (eobp))
        (let ((ch (char-after)))
          (cond
           ((eq ch ?\")
            (forward-sexp 1))
           ((eq ch ?\()
            ;; Remember where the comment text starts, jump over the
            ;; whole group, then cut just inside the closing paren.
            (let ((start (1+ (point))))
              (forward-sexp 1)
              (setq comment (buffer-substring start (1- (point))))))
           (t
            (forward-char 1)))))
      comment)))
(defun ietf-drums-strip (string)
  "Return STRING with comments and whitespace removed.
Comments are removed first with `ietf-drums-remove-comments';
the result is then passed to `ietf-drums-remove-whitespace'."
  (let ((uncommented (ietf-drums-remove-comments string)))
    (ietf-drums-remove-whitespace uncommented)))
(defun ietf-drums-remove-garbage (string)
  "Remove some garbage from STRING.
Every run of the characters ] [ ( ) < > @ , ; : \\ \" / ? =
is deleted.  Return the resulting string."
  ;; A single pass over STRING; the replacement is literal and empty.
  (replace-regexp-in-string "[][()<>@,;:\\\"/?=]+" "" string t t))
(defun ietf-drums-strip-cte (string)
  "Return STRING without comments, whitespace and garbage.
STRING is assumed to have been extracted from the
Content-Transfer-Encoding header of a mail.  It is first passed
through `ietf-drums-strip' and then through
`ietf-drums-remove-garbage'."
  (let ((stripped (inline (ietf-drums-strip string))))
    (ietf-drums-remove-garbage stripped)))
(declare-function rfc2047-decode-string "rfc2047" (string &optional address-mime))

(defun ietf-drums-parse-address (string &optional decode)
  "Parse STRING and return a MAILBOX / DISPLAY-NAME pair.
If DECODE, the DISPLAY-NAME will have RFC2047 decoding performed
\(that's the \"=?utf...q...=?\") stuff.

When STRING contains an angle-bracketed mailbox, return
\(MAILBOX . DISPLAY-NAME), where DISPLAY-NAME is built from the
quoted strings and bare words found outside the brackets, or from
a comment if there are none; it may be nil.  When there is no
angle-bracketed mailbox but the collected text contains \"@\",
return that text as the mailbox, paired with the comment from
STRING.  Otherwise return nil.

Unbalanced parentheses or angle brackets make `forward-sexp'
signal an error, which is not caught here."
  (with-temp-buffer
    (let (display-name mailbox c display-string)
      (ietf-drums-init string)
      (while (not (eobp))
        (setq c (char-after))
        ;; If we have an uneven number of quote characters,
        ;; `forward-sexp' will fail.  In these cases, just delete the
        ;; final of these quote characters.
        (when (and (eq c ?\")
                   (not
                    (save-excursion
                      (ignore-errors
                        (forward-sexp 1)
                        t))))
          (delete-char 1)
          (setq c (char-after)))
        (cond
         ;; Deleting a trailing quote can leave point at the end of the
         ;; buffer; there is nothing left to scan, and moving forward
         ;; would signal an error.
         ((null c))
         ((or (eq c ?\s)
              (eq c ?\t))
          (forward-char 1))
         ((eq c ?\()
          (forward-sexp 1))
         ((eq c ?\")
          ;; Quoted string: keep its contents without the quotes.
          (push (buffer-substring
                 (1+ (point)) (progn (forward-sexp 1) (1- (point))))
                display-name))
         ((looking-at (concat "[" ietf-drums-atext-token "@" "]"))
          ;; Bare word (possibly a bare address).
          (push (buffer-substring (point) (progn (forward-sexp 1) (point)))
                display-name))
         ((eq c ?<)
          ;; Angle-bracketed mailbox: strip comments and white space
          ;; from what is between the brackets.
          (setq mailbox
                (ietf-drums-remove-whitespace
                 (ietf-drums-remove-comments
                  (buffer-substring
                   (1+ (point))
                   (progn (forward-sexp 1) (1- (point))))))))
         (t
          (forward-char 1))))
      ;; If we found no display-name, then we look for comments.
      (if display-name
          (setq display-string
                (mapconcat #'identity (reverse display-name) " "))
        (setq display-string (ietf-drums-get-comment string)))
      (if (not mailbox)
          (when (and display-string
                     (string-match "@" display-string))
            (cons
             (mapconcat #'identity (nreverse display-name) "")
             (ietf-drums-get-comment string)))
        ;; Only decode when there is a display name to decode.
        (cons mailbox (if (and decode display-string)
                          (rfc2047-decode-string display-string)
                        display-string))))))
2000-09-19 13:40:08 +00:00
(defun ietf-drums-parse-addresses (string &optional rawp)
  "Parse STRING and return a list of MAILBOX / DISPLAY-NAME pairs.
STRING is split at commas that are outside quoted strings,
comments and angle brackets.  If RAWP, don't actually parse the
addresses, but instead return a list of address strings.
Otherwise each piece is handed to `ietf-drums-parse-address';
pieces for which that function signals an error or returns nil
are left out.  Return nil if STRING is nil."
  (when string
    (with-temp-buffer
      (ietf-drums-init string)
      (let* ((beg (point))
             (pairs nil)
             ;; Turn the text between BEG and point into an address and
             ;; record it, unless it came out as nil.
             (collect
              (lambda ()
                (let* ((text (buffer-substring beg (point)))
                       (address
                        (if rawp
                            text
                          (condition-case nil
                              (ietf-drums-parse-address text)
                            (error nil)))))
                  (when address
                    (push address pairs))))))
        (while (not (eobp))
          (let ((ch (char-after)))
            (cond
             ((memq ch '(?\" ?< ?\())
              ;; Jump over the whole quoted/bracketed group; if it is
              ;; unbalanced, resynchronize at the next comma.
              (condition-case nil
                  (forward-sexp 1)
                (error
                 (skip-chars-forward "^,"))))
             ((eq ch ?,)
              (funcall collect)
              (forward-char 1)
              (setq beg (point)))
             (t
              (forward-char 1)))))
        ;; Whatever follows the last comma is the final address.
        (funcall collect)
        (nreverse pairs)))))
2000-09-19 13:40:08 +00:00
(defun ietf-drums-unfold-fws ()
  "Unfold folding white space in the current buffer.
Starting from the beginning of the buffer, replace every match
of `ietf-drums-fws-regexp' with a single space.  Point is left
at the beginning of the buffer."
  (let ((fws ietf-drums-fws-regexp))
    (goto-char (point-min))
    (while (re-search-forward fws nil t)
      ;; Fixed case, literal replacement.
      (replace-match " " t t)))
  (goto-char (point-min)))
(defun ietf-drums-parse-date (string)
  "Return an Emacs time spec from STRING.
STRING is decoded with `parse-time-string' and the result is
converted with `encode-time'."
  (encode-time (parse-time-string string)))
2000-09-19 13:40:08 +00:00
(defun ietf-drums-narrow-to-header ()
  "Narrow to the header section in the current buffer.
The header section runs from the beginning of the buffer up to
the first empty line (optionally holding just a carriage
return), or to the end of the buffer if there is no such line.
Point is left at the beginning of the narrowed region."
  (goto-char (point-min))
  (let ((start (point))
        (end (if (re-search-forward "^\r?$" nil 1)
                 (match-beginning 0)
               (point-max))))
    (narrow-to-region start end))
  (goto-char (point-min)))
(defun ietf-drums-quote-string (string)
  "Return STRING, double-quoted if needed for display in a header.
STRING is wrapped in double quotes when it contains at least one
character that is not in `ietf-drums-atext-token'; otherwise it
is returned unchanged.  Double quotes or backslashes already in
STRING are not escaped."
  (let ((non-atext (concat "[^" ietf-drums-atext-token "]")))
    (cond
     ((string-match non-atext string)
      (concat "\"" string "\""))
     (t
      string))))
(defun ietf-drums-make-address (name address)
  "Return an address string built from NAME and ADDRESS.
When NAME is non-nil, the result is NAME, quoted by
`ietf-drums-quote-string' if necessary, followed by ADDRESS in
angle brackets.  When NAME is nil, ADDRESS is returned as is."
  (cond
   ((null name)
    address)
   (t
    (concat (ietf-drums-quote-string name) " <" address ">"))))
2000-09-19 13:40:08 +00:00
(provide 'ietf-drums)
;;; ietf-drums.el ends here