From d4cd8ad34b39cea2566e421d9b84ae6d73553db9 Mon Sep 17 00:00:00 2001 From: Arun Isaac Date: Wed, 13 Jul 2022 17:43:03 +0530 Subject: document: Index boolean terms. Metadata that will be used in boolean filtering should be indexed as boolean terms, not as free text. This also results in the happy coincidence that we no longer need a specialized document-term-generator generic method for and . * tissue/document.scm (document-boolean-terms): New public generic function. (document-term-generator): Use document-boolean-terms. * tissue/issue.scm (document-boolean-terms): New generic method. (document-term-generator): Delete generic method. * tissue/commit.scm (document-boolean-terms): New generic method. (document-term-generator): Delete generic method. --- tissue/document.scm | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) (limited to 'tissue/document.scm') diff --git a/tissue/document.scm b/tissue/document.scm index ecdabc3..48d82cc 100644 --- a/tissue/document.scm +++ b/tissue/document.scm @@ -36,6 +36,7 @@ document-web-uri document-type document-id-term + document-boolean-terms document-text document-recency-date document-term-generator @@ -142,6 +143,10 @@ that operates on a copy of OBJECT. It does not mutate OBJECT." (string-trim-both (symbol->string (class-name (class-of document))) (char-set #\< #\>))) +(define-method (document-boolean-terms (document )) + "Return the boolean terms in DOCUMENT." + (list)) + (define-method (document-term-generator (document )) "Return a term generator for DOCUMENT. The returned term generator has indexed the type and text of the document. If further free text is to @@ -153,7 +158,9 @@ and further text, increase-termpos! must be called before indexing." #:document (make-document #:data (call-with-output-string (cut write (object->scm document) <>)) - #:terms `((,(document-id-term document) . 0)) + #:terms (map (cut cons <> 0) + (cons (document-id-term document) + (document-boolean-terms document))) ;; This serialization of the recency date gets ;; the timezone ordering wrong. TODO: Replace it ;; with sortable-serialise once it is working in -- cgit v1.2.3