From: David Bremner <david@tethera.net>
To: notmuch@notmuchmail.org
Cc: David Bremner <david@tethera.net>
Subject: [PATCH 19/25] lib/parse-sexp: add support for regexp fields
Date: Sat, 17 Jul 2021 23:40:15 -0300 [thread overview]
Message-ID: <20210718024021.3850340-20-david@tethera.net> (raw)
In-Reply-To: <20210718024021.3850340-1-david@tethera.net>
This commit connects the previously added keyword / flag handling with
the regexp-to-query conversion that was factored out in the previous commit.
---
lib/parse-sexp.cc | 35 +++++++++++++++--------
lib/regexp-fields.h | 8 +++---
test/T081-sexpr-search.sh | 59 +++++++++++++++++++++++++++++++++++++++
3 files changed, 86 insertions(+), 16 deletions(-)
diff --git a/lib/parse-sexp.cc b/lib/parse-sexp.cc
index 95ee7c99..c0d0b596 100644
--- a/lib/parse-sexp.cc
+++ b/lib/parse-sexp.cc
@@ -1,8 +1,8 @@
-#include <xapian.h>
-#include "notmuch-private.h"
+#include "database-private.h"
#include "sexp.h"
#include "parse-time-vrp.h"
#include "query-fp.h"
+#include "regexp-fields.h"
typedef struct {
const char *name;
@@ -13,6 +13,7 @@ typedef struct {
typedef enum {
SEXP_FLAG_NONE = 0,
SEXP_FLAG_WILDCARD = 1 << 0,
+ SEXP_FLAG_REGEXP = 1 << 1,
} _sexp_flag_t;
/*
@@ -51,18 +52,18 @@ static _sexp_field_t fields[] =
{ "attachment", Xapian::Query::OP_PHRASE, SEXP_FLAG_WILDCARD },
{ "body", Xapian::Query::OP_PHRASE, SEXP_FLAG_NONE },
{ "date", Xapian::Query::OP_INVALID, SEXP_FLAG_NONE },
- { "from", Xapian::Query::OP_PHRASE, SEXP_FLAG_NONE },
- { "folder", Xapian::Query::OP_OR, SEXP_FLAG_NONE },
- { "id", Xapian::Query::OP_OR, SEXP_FLAG_NONE },
- { "is", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD },
- { "mid", Xapian::Query::OP_OR, SEXP_FLAG_NONE },
+ { "from", Xapian::Query::OP_PHRASE, SEXP_FLAG_REGEXP },
+ { "folder", Xapian::Query::OP_OR, SEXP_FLAG_REGEXP },
+ { "id", Xapian::Query::OP_OR, SEXP_FLAG_REGEXP },
+ { "is", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
+ { "mid", Xapian::Query::OP_OR, SEXP_FLAG_REGEXP },
{ "mimetype", Xapian::Query::OP_PHRASE, SEXP_FLAG_NONE },
- { "path", Xapian::Query::OP_OR, SEXP_FLAG_NONE },
- { "property", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD },
+ { "path", Xapian::Query::OP_OR, SEXP_FLAG_REGEXP },
+ { "property", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
{ "query", Xapian::Query::OP_INVALID, SEXP_FLAG_NONE },
- { "subject", Xapian::Query::OP_PHRASE, SEXP_FLAG_NONE },
- { "tag", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD },
- { "thread", Xapian::Query::OP_OR, SEXP_FLAG_NONE },
+ { "subject", Xapian::Query::OP_PHRASE, SEXP_FLAG_REGEXP },
+ { "tag", Xapian::Query::OP_AND, SEXP_FLAG_WILDCARD | SEXP_FLAG_REGEXP },
+ { "thread", Xapian::Query::OP_OR, SEXP_FLAG_REGEXP },
{ "to", Xapian::Query::OP_PHRASE, SEXP_FLAG_NONE },
{ }
};
@@ -76,6 +77,7 @@ static _sexp_keyword_t keywords[] =
{
{ "any", SEXP_FLAG_WILDCARD },
{ "*", SEXP_FLAG_WILDCARD },
+ { "rx", SEXP_FLAG_REGEXP },
{ }
};
@@ -305,6 +307,15 @@ _sexp_to_xapian_query (notmuch_database_t *notmuch, const sexp_t *sx, Xapian::Qu
}
output = Xapian::Query (Xapian::Query::OP_WILDCARD, term_prefix);
return NOTMUCH_STATUS_SUCCESS;
+ } else if (flags & SEXP_FLAG_REGEXP) {
+ if (! rest || ! rest->val) {
+ _notmuch_database_log (notmuch, "missing regular expression\n");
+ return NOTMUCH_STATUS_BAD_QUERY_SYNTAX;
+ } else {
+ std::string msg; /* ignored */
+ return _notmuch_regexp_to_query (notmuch, Xapian::BAD_VALUENO, field->name,
+ rest->val, output, msg);
+ }
} else {
return _sexp_combine_field (term_prefix, field->xapian_op, rest,
output);
diff --git a/lib/regexp-fields.h b/lib/regexp-fields.h
index 9c871de7..aa8fd81c 100644
--- a/lib/regexp-fields.h
+++ b/lib/regexp-fields.h
@@ -27,13 +27,13 @@
#include <sys/types.h>
#include <regex.h>
-#include "database-private.h"
#include "notmuch-private.h"
+#include "database-private.h"
notmuch_status_t
-_notmuch_regex_to_query (notmuch_database_t *notmuch, Xapian::valueno slot, std::string field,
- std::string regexp_str,
- Xapian::Query &output, std::string &msg);
+_notmuch_regexp_to_query (notmuch_database_t *notmuch, Xapian::valueno slot, std::string field,
+ std::string regexp_str,
+ Xapian::Query &output, std::string &msg);
/* A posting source that returns documents where a value matches a
* regexp.
diff --git a/test/T081-sexpr-search.sh b/test/T081-sexpr-search.sh
index 04eba2c0..281a9bf7 100755
--- a/test/T081-sexpr-search.sh
+++ b/test/T081-sexpr-search.sh
@@ -377,4 +377,63 @@ output=$(notmuch search --query-syntax=sexp '(subject deleted)' | notmuch_search
test_expect_equal "$output" "thread:XXX 2001-01-05 [1/1] Notmuch Test Suite; Not deleted (inbox unread)
thread:XXX 2001-01-05 [2/2] Notmuch Test Suite; Deleted (deleted inbox unread)"
+test_begin_subtest "illegal regexp search"
+test_expect_code 1 "notmuch search --query-syntax=sexp '(body :rx foo)'"
+
+notmuch search --output=messages from:cworth > cworth.msg-ids
+
+test_begin_subtest "regexp 'folder' search"
+notmuch search 'folder:/^bar$/' | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(folder :rx ^bar$)' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp from search"
+notmuch search --output=messages --query-syntax=sexp '(from :rx cworth)' > OUTPUT
+test_expect_equal_file cworth.msg-ids OUTPUT
+
+test_begin_subtest "regexp search for 'from' 2"
+notmuch search from:/cworth@cworth.org/ and subject:patch | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(and (from :rx cworth@cworth.org) (subject patch))' \
+ | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'id' search"
+notmuch search --output=messages --query-syntax=sexp '(id :rx yoom)' > OUTPUT
+test_expect_equal_file cworth.msg-ids OUTPUT
+
+test_begin_subtest "unanchored 'is' search"
+notmuch search tag:signed or tag:inbox > EXPECTED
+notmuch search --query-syntax=sexp '(is :rx i)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "anchored 'is' search"
+notmuch search tag:signed > EXPECTED
+notmuch search --query-syntax=sexp '(is :rx ^si)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "combine regexp mid and subject"
+notmuch search subject:/-C/ and mid:/y..m/ | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(and (subject :rx -C) (mid :rx y..m))' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'path' search"
+notmuch search 'path:/^bar$/' | notmuch_search_sanitize > EXPECTED
+notmuch search --query-syntax=sexp '(path :rx ^bar$)' | notmuch_search_sanitize > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'property' search"
+notmuch search property:foo=bar > EXPECTED
+notmuch search --query-syntax=sexp '(property :rx foo=.*)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "anchored 'tag' search"
+notmuch search tag:signed > EXPECTED
+notmuch search --query-syntax=sexp '(tag :rx ^si)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
+test_begin_subtest "regexp 'thread' search"
+notmuch search --output=threads '*' | grep '7$' > EXPECTED
+notmuch search --output=threads --query-syntax=sexp '(thread :rx 7$)' > OUTPUT
+test_expect_equal_file EXPECTED OUTPUT
+
test_done
--
2.30.2
next prev parent reply other threads:[~2021-07-18 2:40 UTC|newest]
Thread overview: 26+ messages / expand[flat|nested] mbox.gz Atom feed top
2021-07-18 2:39 v2 sexpr parser David Bremner
2021-07-18 2:39 ` [PATCH 01/25] configure: optional library sfsexp David Bremner
2021-07-18 2:39 ` [PATCH 02/25] lib: split notmuch_query_create David Bremner
2021-07-18 2:39 ` [PATCH 03/25] lib: define notmuch_query_create_sexpr David Bremner
2021-07-18 2:40 ` [PATCH 04/25] CLI/search+address: support sexpr queries David Bremner
2021-07-18 2:40 ` [PATCH 05/25] lib: add new status code for query syntax errors David Bremner
2021-07-18 2:40 ` [PATCH 06/25] lib/parse-sexp: parse 'and', 'not', 'or' David Bremner
2021-07-18 2:40 ` [PATCH 07/25] lib/parse-sexp: parse 'subject' David Bremner
2021-07-18 2:40 ` [PATCH 08/25] lib/parse-sexp: split terms in phrase mode David Bremner
2021-07-18 2:40 ` [PATCH 09/25] lib/parse-sexp: handle most fields David Bremner
2021-07-18 2:40 ` [PATCH 10/25] lib/parse-sexp: handle unprefixed terms David Bremner
2021-07-18 2:40 ` [PATCH 11/25] lib: factor out date to query conversion David Bremner
2021-07-18 2:40 ` [PATCH 12/25] lib/parse-sexp: parse date fields David Bremner
2021-07-18 2:40 ` [PATCH 13/25] lib: factor out expansion of saved queries David Bremner
2021-07-18 2:40 ` [PATCH 14/25] lib/parse-sexp: handle " David Bremner
2021-07-18 2:40 ` [PATCH 15/25] lib/parse-sexp: add keyword arguments for fields David Bremner
2021-07-18 2:40 ` [PATCH 16/25] lib/parse-sexp: initial support for wildcard queries David Bremner
2021-07-18 2:40 ` [PATCH 17/25] lib/query: generalize exclude handling to s-expression queries David Bremner
2021-07-18 2:40 ` [PATCH 18/25] lib: factor out query construction from regexp David Bremner
2021-07-18 2:40 ` David Bremner [this message]
2021-07-18 2:40 ` [PATCH 20/25] lib/thread-fp: factor out query expansion David Bremner
2021-07-18 2:40 ` [PATCH 21/25] lib: define _notmuch_query_from_sexp David Bremner
2021-07-18 2:40 ` [PATCH 22/25] lib: generate actual Xapian query for "*" and "" David Bremner
2021-07-18 2:40 ` [PATCH 23/25] lib/parse-sexp: support thread subqueries David Bremner
2021-07-18 2:40 ` [PATCH 24/25] lib/parse-sexp: support infix subqueries David Bremner
2021-07-18 2:40 ` [PATCH 25/25] lib/parse-sexp: parse user headers David Bremner
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
List information: https://notmuchmail.org/
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20210718024021.3850340-20-david@tethera.net \
--to=david@tethera.net \
--cc=notmuch@notmuchmail.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
Code repositories for project(s) associated with this public inbox
https://yhetil.org/notmuch.git/
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).