2021-01-10 15:00:47 +01:00
|
|
|
;;; notmuch-parser.el --- streaming S-expression parser -*- lexical-binding: t -*-
|
2013-05-31 20:40:06 -04:00
|
|
|
;;
|
|
|
|
;; Copyright © Austin Clements
|
|
|
|
;;
|
|
|
|
;; This file is part of Notmuch.
|
|
|
|
;;
|
|
|
|
;; Notmuch is free software: you can redistribute it and/or modify it
|
|
|
|
;; under the terms of the GNU General Public License as published by
|
|
|
|
;; the Free Software Foundation, either version 3 of the License, or
|
|
|
|
;; (at your option) any later version.
|
|
|
|
;;
|
|
|
|
;; Notmuch is distributed in the hope that it will be useful, but
|
|
|
|
;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
;; General Public License for more details.
|
|
|
|
;;
|
|
|
|
;; You should have received a copy of the GNU General Public License
|
2016-06-02 12:26:14 -04:00
|
|
|
;; along with Notmuch. If not, see <https://www.gnu.org/licenses/>.
|
2013-05-31 20:40:06 -04:00
|
|
|
;;
|
|
|
|
;; Authors: Austin Clements <aclements@csail.mit.edu>
|
|
|
|
|
2016-04-13 03:58:47 -04:00
|
|
|
;;; Code:
|
|
|
|
|
emacs: improve how cl-lib and pcase are required
We need to load `cl-lib' at run-time because we use more from it than
just macros. Never-the-less many, but not all libraries required it
only at compile-time, which we got away with because at least some
libraries already required it at run-time as well.
We use `cl-lib' and (currently to a lesser extend) `pcase' throughout
the code-base, which means that we should require these features in
most libraries.
In the past we tried to only require these features in just the
libraries that actually need them, without fully succeeding. We did
not succeed in doing so because that means we would have to check
every time that we use a function from these features whether they
are already being required in the current library.
An alternative would be to add the `require' forms at the top of every
library but that is a bit annoying too.
In order to make sure that these features are loaded when needed but
also to keep the noise down we only require them in "notmuch-lib.el",
which most other libraries require, and in most of the few libraries
that do not do so, namely "notmuch-draft.el", "notmuch-message.el" and
"notmuch-parser.el". ("coolj.el", "make-deps.el", various generated
libraries, and "notmuch-compat.el" are left touched.)
2021-01-10 15:01:07 +01:00
|
|
|
(require 'cl-lib)
|
|
|
|
(require 'pcase)
|
2021-01-10 15:01:08 +01:00
|
|
|
(require 'subr-x)
|
2013-05-31 20:40:06 -04:00
|
|
|
|
|
|
|
(defun notmuch-sexp-create-parser ()
|
|
|
|
"Return a new streaming S-expression parser.
|
|
|
|
|
|
|
|
This parser is designed to incrementally read an S-expression
|
|
|
|
whose structure is known to the caller. Like a typical
|
|
|
|
S-expression parsing interface, it provides a function to read a
|
|
|
|
complete S-expression from the input. However, it extends this
|
|
|
|
with an additional function that requires the next value in the
|
|
|
|
input to be a list and descends into it, allowing its elements to
|
|
|
|
be read one at a time or further descended into. Both functions
|
|
|
|
can return 'retry to indicate that not enough input is available.
|
|
|
|
|
|
|
|
The parser always consumes input from point in the current
|
|
|
|
buffer. Hence, the caller is allowed to delete any data before
|
|
|
|
point and may resynchronize after an error by moving point."
|
|
|
|
(vector 'notmuch-sexp-parser
|
2020-08-08 13:49:53 +02:00
|
|
|
0 ; List depth
|
|
|
|
nil ; Partial parse position marker
|
|
|
|
nil)) ; Partial parse state
|
2013-05-31 20:40:06 -04:00
|
|
|
|
|
|
|
(defmacro notmuch-sexp--depth (sp) `(aref ,sp 1))
|
|
|
|
(defmacro notmuch-sexp--partial-pos (sp) `(aref ,sp 2))
|
|
|
|
(defmacro notmuch-sexp--partial-state (sp) `(aref ,sp 3))
|
|
|
|
|
|
|
|
(defun notmuch-sexp-read (sp)
|
|
|
|
"Consume and return the value at point in the current buffer.
|
|
|
|
|
|
|
|
Returns 'retry if there is insufficient input to parse a complete
|
|
|
|
value (though it may still move point over whitespace). If the
|
|
|
|
parser is currently inside a list and the next token ends the
|
|
|
|
list, this moves point just past the terminator and returns 'end.
|
|
|
|
Otherwise, this moves point to just past the end of the value and
|
|
|
|
returns the value."
|
|
|
|
(skip-chars-forward " \n\r\t")
|
|
|
|
(cond ((eobp) 'retry)
|
|
|
|
((= (char-after) ?\))
|
|
|
|
;; We've reached the end of a list
|
|
|
|
(if (= (notmuch-sexp--depth sp) 0)
|
|
|
|
;; .. but we weren't in a list. Let read signal the
|
|
|
|
;; error to be consistent with all other code paths.
|
|
|
|
(read (current-buffer))
|
|
|
|
;; Go up a level and return an end token
|
2020-04-25 22:18:07 +02:00
|
|
|
(cl-decf (notmuch-sexp--depth sp))
|
2013-05-31 20:40:06 -04:00
|
|
|
(forward-char)
|
|
|
|
'end))
|
|
|
|
((= (char-after) ?\()
|
|
|
|
;; We're at the beginning of a list. If we haven't started
|
|
|
|
;; a partial parse yet, attempt to read the list in its
|
|
|
|
;; entirety. If this fails, or we've started a partial
|
|
|
|
;; parse, extend the partial parse to figure out when we
|
|
|
|
;; have a complete list.
|
|
|
|
(catch 'return
|
2020-08-08 13:49:42 +02:00
|
|
|
(unless (notmuch-sexp--partial-state sp)
|
2013-05-31 20:40:06 -04:00
|
|
|
(let ((start (point)))
|
|
|
|
(condition-case nil
|
|
|
|
(throw 'return (read (current-buffer)))
|
|
|
|
(end-of-file (goto-char start)))))
|
|
|
|
;; Extend the partial parse
|
|
|
|
(let (is-complete)
|
|
|
|
(save-excursion
|
|
|
|
(let* ((new-state (parse-partial-sexp
|
|
|
|
(or (notmuch-sexp--partial-pos sp) (point))
|
|
|
|
(point-max) 0 nil
|
|
|
|
(notmuch-sexp--partial-state sp)))
|
|
|
|
;; A complete value is available if we've
|
|
|
|
;; reached depth 0.
|
2020-04-25 22:18:07 +02:00
|
|
|
(depth (car new-state)))
|
|
|
|
(cl-assert (>= depth 0))
|
2013-05-31 20:40:06 -04:00
|
|
|
(if (= depth 0)
|
|
|
|
;; Reset partial parse state
|
|
|
|
(setf (notmuch-sexp--partial-state sp) nil
|
|
|
|
(notmuch-sexp--partial-pos sp) nil
|
|
|
|
is-complete t)
|
|
|
|
;; Update partial parse state
|
|
|
|
(setf (notmuch-sexp--partial-state sp) new-state
|
|
|
|
(notmuch-sexp--partial-pos sp) (point-marker)))))
|
|
|
|
(if is-complete
|
|
|
|
(read (current-buffer))
|
|
|
|
'retry))))
|
|
|
|
(t
|
|
|
|
;; Attempt to read a non-compound value
|
|
|
|
(let ((start (point)))
|
|
|
|
(condition-case nil
|
|
|
|
(let ((val (read (current-buffer))))
|
|
|
|
;; We got what looks like a complete read, but if
|
|
|
|
;; we reached the end of the buffer in the process,
|
|
|
|
;; we may not actually have all of the input we
|
|
|
|
;; need (unless it's a string, which is delimited).
|
|
|
|
(if (or (stringp val) (not (eobp)))
|
|
|
|
val
|
|
|
|
;; We can't be sure the input was complete
|
|
|
|
(goto-char start)
|
|
|
|
'retry))
|
|
|
|
(end-of-file
|
|
|
|
(goto-char start)
|
|
|
|
'retry))))))
|
|
|
|
|
|
|
|
(defun notmuch-sexp-begin-list (sp)
|
|
|
|
"Parse the beginning of a list value and enter the list.
|
|
|
|
|
|
|
|
Returns 'retry if there is insufficient input to parse the
|
|
|
|
beginning of the list. If this is able to parse the beginning of
|
|
|
|
a list, it moves point past the token that opens the list and
|
|
|
|
returns t. Later calls to `notmuch-sexp-read' will return the
|
|
|
|
elements inside the list. If the input in buffer is not the
|
|
|
|
beginning of a list, throw invalid-read-syntax."
|
|
|
|
(skip-chars-forward " \n\r\t")
|
|
|
|
(cond ((eobp) 'retry)
|
|
|
|
((= (char-after) ?\()
|
|
|
|
(forward-char)
|
2020-04-25 22:18:07 +02:00
|
|
|
(cl-incf (notmuch-sexp--depth sp))
|
2013-05-31 20:40:06 -04:00
|
|
|
t)
|
|
|
|
(t
|
|
|
|
;; Skip over the bad character like `read' does
|
|
|
|
(forward-char)
|
|
|
|
(signal 'invalid-read-syntax (list (string (char-before)))))))
|
|
|
|
|
|
|
|
(defvar notmuch-sexp--parser nil
|
|
|
|
"The buffer-local notmuch-sexp-parser instance.
|
|
|
|
|
|
|
|
Used by `notmuch-sexp-parse-partial-list'.")
|
|
|
|
|
|
|
|
(defvar notmuch-sexp--state nil
|
|
|
|
"The buffer-local `notmuch-sexp-parse-partial-list' state.")
|
|
|
|
|
|
|
|
(defun notmuch-sexp-parse-partial-list (result-function result-buffer)
|
|
|
|
"Incrementally parse an S-expression list from the current buffer.
|
|
|
|
|
|
|
|
This function consumes an S-expression list from the current
|
|
|
|
buffer, applying RESULT-FUNCTION in RESULT-BUFFER to each
|
|
|
|
complete value in the list. It operates incrementally and should
|
|
|
|
be called whenever the input buffer has been extended with
|
|
|
|
additional data. The caller just needs to ensure it does not
|
|
|
|
move point in the input buffer."
|
|
|
|
;; Set up the initial state
|
|
|
|
(unless (local-variable-p 'notmuch-sexp--parser)
|
2020-11-16 22:28:39 +01:00
|
|
|
(setq-local notmuch-sexp--parser (notmuch-sexp-create-parser))
|
|
|
|
(setq-local notmuch-sexp--state 'begin))
|
2013-05-31 20:40:06 -04:00
|
|
|
(let (done)
|
|
|
|
(while (not done)
|
2020-04-25 22:18:07 +02:00
|
|
|
(cl-case notmuch-sexp--state
|
2013-05-31 20:40:06 -04:00
|
|
|
(begin
|
|
|
|
;; Enter the list
|
|
|
|
(if (eq (notmuch-sexp-begin-list notmuch-sexp--parser) 'retry)
|
|
|
|
(setq done t)
|
|
|
|
(setq notmuch-sexp--state 'result)))
|
|
|
|
(result
|
|
|
|
;; Parse a result
|
|
|
|
(let ((result (notmuch-sexp-read notmuch-sexp--parser)))
|
2020-04-25 22:18:07 +02:00
|
|
|
(cl-case result
|
2013-05-31 20:40:06 -04:00
|
|
|
(retry (setq done t))
|
|
|
|
(end (setq notmuch-sexp--state 'end))
|
|
|
|
(t (with-current-buffer result-buffer
|
|
|
|
(funcall result-function result))))))
|
|
|
|
(end
|
2021-01-10 15:00:50 +01:00
|
|
|
;; Skip over trailing whitespace.
|
|
|
|
(skip-chars-forward " \n\r\t")
|
|
|
|
;; Any trailing data is unexpected.
|
|
|
|
(unless (eobp)
|
|
|
|
(error "Trailing garbage following expression"))
|
2013-05-31 20:40:06 -04:00
|
|
|
(setq done t)))))
|
|
|
|
;; Clear out what we've parsed
|
|
|
|
(delete-region (point-min) (point)))
|
|
|
|
|
|
|
|
(provide 'notmuch-parser)
|
|
|
|
|
2016-04-13 03:58:47 -04:00
|
|
|
;;; notmuch-parser.el ends here
|