unofficial mirror of notmuch@notmuchmail.org
 help / color / mirror / code / Atom feed
From: David Bremner <david@tethera.net>
To: notmuch@notmuchmail.org
Cc: David Bremner <david@tethera.net>
Subject: [PATCH 19/25] lib/parse-sexp: add support for regexp fields
Date: Sat, 17 Jul 2021 23:40:15 -0300	[thread overview]
Message-ID: <20210718024021.3850340-20-david@tethera.net> (raw)
In-Reply-To: <20210718024021.3850340-1-david@tethera.net>

This commit connects the previously added keyword / flag handling with
the regexp to query construction factored out in the previous commit.
---
 lib/parse-sexp.cc         | 35 +++++++++++++++--------
 lib/regexp-fields.h       |  8 +++---
 test/T081-sexpr-search.sh | 59 +++++++++++++++++++++++++++++++++++++++
 3 files changed, 86 insertions(+), 16 deletions(-)

diff --git a/lib/parse-sexp.cc b/lib/parse-sexp.cc
index 95ee7c99..c0d0b596 100644
--- a/lib/parse-sexp.cc
+++ b/lib/parse-sexp.cc
@@ -1,8 +1,8 @@
-#include <xapian.h>
-#include "notmuch-private.h"
+#include "database-private.h"
 #include "sexp.h"
 #include "parse-time-vrp.h"
 #include "query-fp.h"
+#include "regexp-fields.h"
 
 typedef struct  {
     const char *name;
@@ -13,6 +13,7 @@ typedef struct  {
 typedef enum {
     SEXP_FLAG_NONE	= 0,
     SEXP_FLAG_WILDCARD	= 1 << 0,
+    SEXP_FLAG_REGEXP	= 1 << 1,
 } _sexp_flag_t;
 
 /*
@@ -51,18 +52,18 @@ static _sexp_field_t fields[] =
     { "attachment",   Xapian::Query::OP_PHRASE,       SEXP_FLAG_WILDCARD },
     { "body",         Xapian::Query::OP_PHRASE,       SEXP_FLAG_NONE },
     { "date",         Xapian::Query::OP_INVALID,      SEXP_FLAG_NONE },
-    { "from",         Xapian::Query::OP_PHRASE,       SEXP_FLAG_NONE },
-    { "folder",       Xapian::Query::OP_OR,           SEXP_FLAG_NONE },
-    { "id",           Xapian::Query::OP_OR,           SEXP_FLAG_NONE },
-    { "is",           Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD },
-    { "mid",          Xapian::Query::OP_OR,           SEXP_FLAG_NONE },
+    { "from",         Xapian::Query::OP_PHRASE,       SEXP_FLAG_REGEXP },
+    { "folder",       Xapian::Query::OP_OR,           SEXP_FLAG_REGEXP },
+    { "id",           Xapian::Query::OP_OR,           SEXP_FLAG_REGEXP },
+    { "is",           Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
+    { "mid",          Xapian::Query::OP_OR,           SEXP_FLAG_REGEXP },
     { "mimetype",     Xapian::Query::OP_PHRASE,       SEXP_FLAG_NONE },
-    { "path",         Xapian::Query::OP_OR,           SEXP_FLAG_NONE },
-    { "property",     Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD },
+    { "path",         Xapian::Query::OP_OR,           SEXP_FLAG_REGEXP },
+    { "property",     Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
     { "query",        Xapian::Query::OP_INVALID,      SEXP_FLAG_NONE },
-    { "subject",      Xapian::Query::OP_PHRASE,       SEXP_FLAG_NONE },
-    { "tag",          Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD },
-    { "thread",       Xapian::Query::OP_OR,           SEXP_FLAG_NONE },
+    { "subject",      Xapian::Query::OP_PHRASE,       SEXP_FLAG_REGEXP },
+    { "tag",          Xapian::Query::OP_AND,          SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
+    { "thread",       Xapian::Query::OP_OR,           SEXP_FLAG_REGEXP },
     { "to",           Xapian::Query::OP_PHRASE,       SEXP_FLAG_NONE },
     { }
 };
@@ -76,6 +77,7 @@ static _sexp_keyword_t keywords[] =
 {
     { "any", SEXP_FLAG_WILDCARD },
     { "*", SEXP_FLAG_WILDCARD },
+    { "rx", SEXP_FLAG_REGEXP },
     { }
 };
 
@@ -305,6 +307,15 @@ _sexp_to_xapian_query (notmuch_database_t *notmuch, const sexp_t *sx, Xapian::Qu
 		}
 		output = Xapian::Query (Xapian::Query::OP_WILDCARD, term_prefix);
 		return NOTMUCH_STATUS_SUCCESS;
+	    } else if (flags & SEXP_FLAG_REGEXP) {
+		if (! rest || ! rest->val) {
+		    _notmuch_database_log (notmuch, "missing regular expression\n");
+		    return NOTMUCH_STATUS_BAD_QUERY_SYNTAX;
+		} else {
+		    std::string msg; /* ignored */
+		    return _notmuch_regexp_to_query (notmuch, Xapian::BAD_VALUENO, field->name,
+						     rest->val, output, msg);
+		}
 	    } else {
 		return _sexp_combine_field (term_prefix, field->xapian_op, rest,
 					    output);
diff --git a/lib/regexp-fields.h b/lib/regexp-fields.h
index 9c871de7..aa8fd81c 100644
--- a/lib/regexp-fields.h
+++ b/lib/regexp-fields.h
@@ -27,13 +27,13 @@
 
 #include <sys/types.h>
 #include <regex.h>
-#include "database-private.h"
 #include "notmuch-private.h"
+#include "database-private.h"
 
 notmuch_status_t
-_notmuch_regex_to_query (notmuch_database_t *notmuch, Xapian::valueno slot, std::string field,
-			 std::string regexp_str,
-			 Xapian::Query &output, std::string &msg);
+_notmuch_regexp_to_query (notmuch_database_t *notmuch, Xapian::valueno slot, std::string field,
+			  std::string regexp_str,
+			  Xapian::Query &output, std::string &msg);
 
 /* A posting source that returns documents where a value matches a
  * regexp.
diff --git a/test/T081-sexpr-search.sh b/test/T081-sexpr-search.sh
index 04eba2c0..281a9bf7 100755
--- a/test/T081-sexpr-search.sh
+++ b/test/T081-sexpr-search.sh
@@ -377,4 +377,63 @@ output=$(notmuch search --query-syntax=sexp '(subject deleted)' | notmuch_search
 test_expect_equal "$output" "thread:XXX   2001-01-05 [1/1] Notmuch Test Suite; Not deleted (inbox unread)
 thread:XXX   2001-01-05 [2/2] Notmuch Test Suite; Deleted (deleted inbox unread)"
 
+test_begin_subtest "illegal regexp search"
+test_expect_code 1 "notmuch search --query-syntax=sexp '(body :rx foo)'"
+
+notmuch search --output=messages from:cworth > cworth.msg-ids
+
+test_begin_subtest "regexp 'folder' search"
+notmuch search 'folder:/^bar$/' | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(folder :rx ^bar$)' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp from search"
+notmuch search --output=messages --query-syntax=sexp '(from :rx cworth)' > OUTPUT
+test_expect_equal_file cworth.msg-ids OUTPUT
+
+test_begin_subtest "regexp search for 'from' 2"
+notmuch search from:/cworth@cworth.org/ and subject:patch | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(and (from :rx cworth@cworth.org) (subject patch))' \
+    | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'id' search"
+notmuch search --output=messages --query-syntax=sexp '(id :rx yoom)' > OUTPUT
+test_expect_equal_file cworth.msg-ids OUTPUT
+
+test_begin_subtest "unanchored 'is' search"
+notmuch search tag:signed or tag:inbox > EXPECTED
+notmuch search --query-syntax=sexp '(is :rx i)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "anchored 'is' search"
+notmuch search tag:signed > EXPECTED
+notmuch search --query-syntax=sexp '(is :rx ^si)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "combine regexp mid and subject"
+notmuch search subject:/-C/ and mid:/y..m/ | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(and (subject :rx -C) (mid :rx y..m))' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'path' search"
+notmuch search 'path:/^bar$/' | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(path :rx ^bar$)' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'property' search"
+notmuch search property:foo=bar > EXPECTED
+notmuch search --query-syntax=sexp '(property :rx foo=.*)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "anchored 'tag' search"
+notmuch search tag:signed > EXPECTED
+notmuch search --query-syntax=sexp '(tag :rx ^si)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'thread' search"
+notmuch search --output=threads '*' | grep '7$' > EXPECTED
+notmuch search --output=threads --query-syntax=sexp '(thread :rx 7$)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
 test_done
-- 
2.30.2

  parent reply	other threads:[~2021-07-18  2:40 UTC|newest]

Thread overview: 26+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2021-07-18  2:39 v2 sexpr parser David Bremner
2021-07-18  2:39 ` [PATCH 01/25] configure: optional library sfsexp David Bremner
2021-07-18  2:39 ` [PATCH 02/25] lib: split notmuch_query_create David Bremner
2021-07-18  2:39 ` [PATCH 03/25] lib: define notmuch_query_create_sexpr David Bremner
2021-07-18  2:40 ` [PATCH 04/25] CLI/search+address: support sexpr queries David Bremner
2021-07-18  2:40 ` [PATCH 05/25] lib: add new status code for query syntax errors David Bremner
2021-07-18  2:40 ` [PATCH 06/25] lib/parse-sexp: parse 'and', 'not', 'or' David Bremner
2021-07-18  2:40 ` [PATCH 07/25] lib/parse-sexp: parse 'subject' David Bremner
2021-07-18  2:40 ` [PATCH 08/25] lib/parse-sexp: split terms in phrase mode David Bremner
2021-07-18  2:40 ` [PATCH 09/25] lib/parse-sexp: handle most fields David Bremner
2021-07-18  2:40 ` [PATCH 10/25] lib/parse-sexp: handle unprefixed terms David Bremner
2021-07-18  2:40 ` [PATCH 11/25] lib: factor out date to query conversion David Bremner
2021-07-18  2:40 ` [PATCH 12/25] lib/parse-sexp: parse date fields David Bremner
2021-07-18  2:40 ` [PATCH 13/25] lib: factor out expansion of saved queries David Bremner
2021-07-18  2:40 ` [PATCH 14/25] lib/parse-sexp: handle " David Bremner
2021-07-18  2:40 ` [PATCH 15/25] lib/parse-sexp: add keyword arguments for fields David Bremner
2021-07-18  2:40 ` [PATCH 16/25] lib/parse-sexp: initial support for wildcard queries David Bremner
2021-07-18  2:40 ` [PATCH 17/25] lib/query: generalize exclude handling to s-expression queries David Bremner
2021-07-18  2:40 ` [PATCH 18/25] lib: factor out query construction from regexp David Bremner
2021-07-18  2:40 ` David Bremner [this message]
2021-07-18  2:40 ` [PATCH 20/25] lib/thread-fp: factor out query expansion David Bremner
2021-07-18  2:40 ` [PATCH 21/25] lib: define _notmuch_query_from_sexp David Bremner
2021-07-18  2:40 ` [PATCH 22/25] lib: generate actual Xapian query for "*" and "" David Bremner
2021-07-18  2:40 ` [PATCH 23/25] lib/parse-sexp: support thread subqueries David Bremner
2021-07-18  2:40 ` [PATCH 24/25] lib/parse-sexp: support infix subqueries David Bremner
2021-07-18  2:40 ` [PATCH 25/25] lib/parse-sexp: parse user headers David Bremner

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

  List information: https://notmuchmail.org/

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20210718024021.3850340-20-david@tethera.net \
    --to=david@tethera.net \
    --cc=notmuch@notmuchmail.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link.

Be sure your reply has a Subject: header at the top and a blank line before the message body.
Code repositories for project(s) associated with this public inbox

	https://yhetil.org/notmuch.git/

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).