emacs: Switch from text to JSON format for search results

The JSON format eliminates the complex escaping issues that have
plagued the text search format.  This uses the incremental JSON parser
so that, like the text parser, it can output search results
incrementally.

This slows down the parser by about ~4X, but puts us in a good
position to optimize either by improving the JSON parser (evidence
suggests this can reduce the overhead to ~40% over the text format) or
by switching to S-expressions (evidence suggests this will more than
double performance over the text parser).  [1]

This also fixes the incremental search parsing test.

This has one minor side-effect on search result formatting.
Previously, the date field was always padded to a fixed width of 12
characters because of how the text parser's regexp was written.  The
JSON format doesn't do this.  We could pad it out in Emacs before
formatting it, but, since all of the other fields are variable width,
we instead fix notmuch-search-result-format to take the variable-width
field and pad it out.  For users who have customized this variable,
we'll mention in the NEWS how to fix this slight format change.

[1] id:"20110720205007.GB21316@mit.edu"
This commit is contained in:
Austin Clements 2012-07-09 17:42:41 -04:00 committed by David Bremner
parent 889dda3731
commit 9c5ea07cc6
2 changed files with 64 additions and 47 deletions

View file

@ -60,7 +60,7 @@
(require 'notmuch-message) (require 'notmuch-message)
(defcustom notmuch-search-result-format (defcustom notmuch-search-result-format
`(("date" . "%s ") `(("date" . "%12s ")
("count" . "%-7s ") ("count" . "%-7s ")
("authors" . "%-20s ") ("authors" . "%-20s ")
("subject" . "%s ") ("subject" . "%s ")
@ -557,17 +557,14 @@ This function advances the next thread when finished."
(notmuch-search-tag '("-inbox")) (notmuch-search-tag '("-inbox"))
(notmuch-search-next-thread)) (notmuch-search-next-thread))
(defvar notmuch-search-process-filter-data nil
"Data that has not yet been processed.")
(make-variable-buffer-local 'notmuch-search-process-filter-data)
(defun notmuch-search-process-sentinel (proc msg) (defun notmuch-search-process-sentinel (proc msg)
"Add a message to let user know when \"notmuch search\" exits" "Add a message to let user know when \"notmuch search\" exits"
(let ((buffer (process-buffer proc)) (let ((buffer (process-buffer proc))
(status (process-status proc)) (status (process-status proc))
(exit-status (process-exit-status proc)) (exit-status (process-exit-status proc))
(never-found-target-thread nil)) (never-found-target-thread nil))
(if (memq status '(exit signal)) (when (memq status '(exit signal))
(kill-buffer (process-get proc 'parse-buf))
(if (buffer-live-p buffer) (if (buffer-live-p buffer)
(with-current-buffer buffer (with-current-buffer buffer
(save-excursion (save-excursion
@ -577,8 +574,6 @@ This function advances the next thread when finished."
(if (eq status 'signal) (if (eq status 'signal)
(insert "Incomplete search results (search process was killed).\n")) (insert "Incomplete search results (search process was killed).\n"))
(when (eq status 'exit) (when (eq status 'exit)
(if notmuch-search-process-filter-data
(insert (concat "Error: Unexpected output from notmuch search:\n" notmuch-search-process-filter-data)))
(insert "End of search results.") (insert "End of search results.")
(unless (= exit-status 0) (unless (= exit-status 0)
(insert (format " (process returned %d)" exit-status))) (insert (format " (process returned %d)" exit-status)))
@ -758,45 +753,59 @@ non-authors is found, assume that all of the authors match."
(insert (apply #'format string objects)) (insert (apply #'format string objects))
(insert "\n"))) (insert "\n")))
(defvar notmuch-search-process-state nil
"Parsing state of the search process filter.")
(defvar notmuch-search-json-parser nil
"Incremental JSON parser for the search process filter.")
(defun notmuch-search-process-filter (proc string) (defun notmuch-search-process-filter (proc string)
"Process and filter the output of \"notmuch search\"" "Process and filter the output of \"notmuch search\""
(let ((buffer (process-buffer proc))) (let ((results-buf (process-buffer proc))
(if (buffer-live-p buffer) (parse-buf (process-get proc 'parse-buf))
(with-current-buffer buffer
(let ((line 0)
(more t)
(inhibit-read-only t) (inhibit-read-only t)
(string (concat notmuch-search-process-filter-data string))) done)
(setq notmuch-search-process-filter-data nil) (if (not (buffer-live-p results-buf))
(while more (delete-process proc)
(while (and (< line (length string)) (= (elt string line) ?\n)) (with-current-buffer parse-buf
(setq line (1+ line))) ;; Insert new data
(if (string-match "^thread:\\([0-9A-Fa-f]*\\) \\([^][]*\\) \\[\\([0-9]*\\)/\\([0-9]*\\)\\] \\([^;]*\\); \\(.*\\) (\\([^()]*\\))$" string line) (save-excursion
(let* ((thread-id (match-string 1 string)) (goto-char (point-max))
(tags-str (match-string 7 string)) (insert string)))
(result (list :thread thread-id (with-current-buffer results-buf
:date_relative (match-string 2 string) (while (not done)
:matched (string-to-number (condition-case nil
(match-string 3 string)) (case notmuch-search-process-state
:total (string-to-number ((begin)
(match-string 4 string)) ;; Enter the results list
:authors (match-string 5 string) (if (eq (notmuch-json-begin-compound
:subject (match-string 6 string) notmuch-search-json-parser) 'retry)
:tags (if tags-str (setq done t)
(save-match-data (setq notmuch-search-process-state 'result)))
(split-string tags-str)))))) ((result)
(if (/= (match-beginning 0) line) ;; Parse a result
(let ((result (notmuch-json-read notmuch-search-json-parser)))
(case result
((retry) (setq done t))
((end) (setq notmuch-search-process-state 'end))
(otherwise (notmuch-search-show-result result)))))
((end)
;; Any trailing data is unexpected
(notmuch-json-eof notmuch-search-json-parser)
(setq done t)))
(json-error
;; Do our best to resynchronize and ensure forward
;; progress
(notmuch-search-show-error (notmuch-search-show-error
(substring string line (match-beginning 0)))) "%s"
(notmuch-search-show-result result) (with-current-buffer parse-buf
(set 'line (match-end 0))) (let ((bad (buffer-substring (line-beginning-position)
(set 'more nil) (line-end-position))))
(while (and (< line (length string)) (= (elt string line) ?\n)) (forward-line)
(setq line (1+ line))) bad))))))
(if (< line (length string)) ;; Clear out what we've parsed
(setq notmuch-search-process-filter-data (substring string line))) (with-current-buffer parse-buf
)))) (delete-region (point-min) (point)))))))
(delete-process proc))))
(defun notmuch-search-tag-all (&optional tag-changes) (defun notmuch-search-tag-all (&optional tag-changes)
"Add/remove tags from all messages in current search buffer. "Add/remove tags from all messages in current search buffer.
@ -899,10 +908,19 @@ Other optional parameters are used as follows:
(let ((proc (start-process (let ((proc (start-process
"notmuch-search" buffer "notmuch-search" buffer
notmuch-command "search" notmuch-command "search"
"--format=json"
(if oldest-first (if oldest-first
"--sort=oldest-first" "--sort=oldest-first"
"--sort=newest-first") "--sort=newest-first")
query))) query))
;; Use a scratch buffer to accumulate partial output.
;; This buffer will be killed by the sentinel, which
;; should be called no matter how the process dies.
(parse-buf (generate-new-buffer " *notmuch search parse*")))
(set (make-local-variable 'notmuch-search-process-state) 'begin)
(set (make-local-variable 'notmuch-search-json-parser)
(notmuch-json-create-parser parse-buf))
(process-put proc 'parse-buf parse-buf)
(set-process-sentinel proc 'notmuch-search-process-sentinel) (set-process-sentinel proc 'notmuch-search-process-sentinel)
(set-process-filter proc 'notmuch-search-process-filter) (set-process-filter proc 'notmuch-search-process-filter)
(set-process-query-on-exit-flag proc nil)))) (set-process-query-on-exit-flag proc nil))))

View file

@ -36,7 +36,6 @@ test_emacs '(notmuch-search "tag:inbox")
test_expect_equal_file OUTPUT $EXPECTED/notmuch-search-tag-inbox test_expect_equal_file OUTPUT $EXPECTED/notmuch-search-tag-inbox
test_begin_subtest "Incremental parsing of search results" test_begin_subtest "Incremental parsing of search results"
test_subtest_known_broken
test_emacs "(ad-enable-advice 'notmuch-search-process-filter 'around 'pessimal) test_emacs "(ad-enable-advice 'notmuch-search-process-filter 'around 'pessimal)
(ad-activate 'notmuch-search-process-filter) (ad-activate 'notmuch-search-process-filter)
(notmuch-search \"tag:inbox\") (notmuch-search \"tag:inbox\")