From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: from localhost (localhost [127.0.0.1]) by arlo.cworth.org (Postfix) with ESMTP id 428856DE0ABE for ; Sun, 7 May 2017 05:40:33 -0700 (PDT) X-Virus-Scanned: Debian amavisd-new at cworth.org X-Spam-Flag: NO X-Spam-Score: -0.005 X-Spam-Level: X-Spam-Status: No, score=-0.005 tagged_above=-999 required=5 tests=[AWL=0.006, SPF_PASS=-0.001, T_RP_MATCHES_RCVD=-0.01] autolearn=disabled Received: from arlo.cworth.org ([127.0.0.1]) by localhost (arlo.cworth.org [127.0.0.1]) (amavisd-new, port 10024) with ESMTP id 8JjuM5D6faRu for ; Sun, 7 May 2017 05:40:31 -0700 (PDT) Received: from fethera.tethera.net (fethera.tethera.net [198.245.60.197]) by arlo.cworth.org (Postfix) with ESMTPS id 39F786DE0350 for ; Sun, 7 May 2017 05:40:31 -0700 (PDT) Received: from remotemail by fethera.tethera.net with local (Exim 4.84_2) (envelope-from ) id 1d7LTO-0003aL-UZ; Sun, 07 May 2017 08:39:38 -0400 Received: (nullmailer pid 30337 invoked by uid 1000); Sun, 07 May 2017 12:40:26 -0000 From: David Bremner To: notmuch@freelists.org Cc: notmuch@notmuchmail.org, David Bremner Subject: [PATCH 04/12] lib: refactor notmuch_database_add_message header parsing Date: Sun, 7 May 2017 09:40:04 -0300 Message-Id: <20170507124012.30188-5-david@tethera.net> X-Mailer: git-send-email 2.11.0 In-Reply-To: <20170507124012.30188-1-david@tethera.net> References: <20170507124012.30188-1-david@tethera.net> X-BeenThere: notmuch@notmuchmail.org X-Mailman-Version: 2.1.23 Precedence: list List-Id: "Use and development of the notmuch mail system." List-Unsubscribe: , List-Archive: List-Post: List-Help: List-Subscribe: , X-List-Received-Date: Sun, 07 May 2017 12:40:33 -0000 This function is large and hard to understand and modify. Start to break it down into meaningful pieces. --- lib/add-message.cc | 54 +++----------------------------- lib/message-file.c | 86 +++++++++++++++++++++++++++++++++++++++++++++++++++ lib/notmuch-private.h | 11 +++++++ 3 files changed, 101 insertions(+), 50 deletions(-) diff --git a/lib/add-message.cc b/lib/add-message.cc index 314016a8..2922eaa9 100644 --- a/lib/add-message.cc +++ b/lib/add-message.cc @@ -468,7 +468,7 @@ notmuch_database_add_message (notmuch_database_t *notmuch, notmuch_private_status_t private_status; notmuch_bool_t is_ghost = FALSE, is_new = FALSE; - const char *date, *header; + const char *date; const char *from, *to, *subject; char *message_id = NULL; @@ -489,57 +489,12 @@ notmuch_database_add_message (notmuch_database_t *notmuch, if (ret) goto DONE; - /* Parse message up front to get better error status. */ - ret = _notmuch_message_file_parse (message_file); + ret = _notmuch_message_file_get_headers (message_file, + &from, &subject, &to, &date, + &message_id); if (ret) goto DONE; - /* Before we do any real work, (especially before doing a - * potential SHA-1 computation on the entire file's contents), - * let's make sure that what we're looking at looks like an - * actual email message. - */ - from = _notmuch_message_file_get_header (message_file, "from"); - subject = _notmuch_message_file_get_header (message_file, "subject"); - to = _notmuch_message_file_get_header (message_file, "to"); - - if ((from == NULL || *from == '\0') && - (subject == NULL || *subject == '\0') && - (to == NULL || *to == '\0')) { - ret = NOTMUCH_STATUS_FILE_NOT_EMAIL; - goto DONE; - } - - /* Now that we're sure it's mail, the first order of business - * is to find a message ID (or else create one ourselves). - */ - header = _notmuch_message_file_get_header (message_file, "message-id"); - if (header && *header != '\0') { - message_id = _parse_message_id (message_file, header, NULL); - - /* So the header value isn't RFC-compliant, but it's - * better than no message-id at all. - */ - if (message_id == NULL) - message_id = talloc_strdup (message_file, header); - } - - if (message_id == NULL ) { - /* No message-id at all, let's generate one by taking a - * hash over the file's contents. - */ - char *sha1 = _notmuch_sha1_of_file (filename); - - /* If that failed too, something is really wrong. Give up. */ - if (sha1 == NULL) { - ret = NOTMUCH_STATUS_FILE_ERROR; - goto DONE; - } - - message_id = talloc_asprintf (message_file, "notmuch-sha1-%s", sha1); - free (sha1); - } - try { /* Now that we have a message ID, we get a message object, * (which may or may not reference an existing document in the @@ -579,7 +534,6 @@ notmuch_database_add_message (notmuch_database_t *notmuch, if (ret) goto DONE; - date = _notmuch_message_file_get_header (message_file, "date"); _notmuch_message_set_header_values (message, date, from, subject); ret = _notmuch_message_index_file (message, message_file); diff --git a/lib/message-file.c b/lib/message-file.c index db18b163..70526ef0 100644 --- a/lib/message-file.c +++ b/lib/message-file.c @@ -92,6 +92,12 @@ _notmuch_message_file_open (notmuch_database_t *notmuch, return _notmuch_message_file_open_ctx (notmuch, NULL, filename); } +const char * +_notmuch_message_file_get_filename (notmuch_message_file_t *message_file) +{ + return message_file->filename; +} + void _notmuch_message_file_close (notmuch_message_file_t *message) { @@ -304,3 +310,83 @@ _notmuch_message_file_get_header (notmuch_message_file_t *message, return decoded; } + +notmuch_status_t +_notmuch_message_file_get_headers (notmuch_message_file_t *message_file, + const char **from_out, + const char **subject_out, + const char **to_out, + const char **date_out, + char **message_id_out) +{ + notmuch_status_t ret; + const char *header; + const char *from, *to, *subject, *date; + char *message_id = NULL; + + /* Parse message up front to get better error status. */ + ret = _notmuch_message_file_parse (message_file); + if (ret) + goto DONE; + + /* Before we do any real work, (especially before doing a + * potential SHA-1 computation on the entire file's contents), + * let's make sure that what we're looking at looks like an + * actual email message. + */ + from = _notmuch_message_file_get_header (message_file, "from"); + subject = _notmuch_message_file_get_header (message_file, "subject"); + to = _notmuch_message_file_get_header (message_file, "to"); + date = _notmuch_message_file_get_header (message_file, "date"); + + if ((from == NULL || *from == '\0') && + (subject == NULL || *subject == '\0') && + (to == NULL || *to == '\0')) { + ret = NOTMUCH_STATUS_FILE_NOT_EMAIL; + goto DONE; + } + + /* Now that we're sure it's mail, the first order of business + * is to find a message ID (or else create one ourselves). + */ + header = _notmuch_message_file_get_header (message_file, "message-id"); + if (header && *header != '\0') { + message_id = _notmuch_message_id_parse (message_file, header, NULL); + + /* So the header value isn't RFC-compliant, but it's + * better than no message-id at all. + */ + if (message_id == NULL) + message_id = talloc_strdup (message_file, header); + } + + if (message_id == NULL ) { + /* No message-id at all, let's generate one by taking a + * hash over the file's contents. + */ + char *sha1 = _notmuch_sha1_of_file (_notmuch_message_file_get_filename (message_file)); + + /* If that failed too, something is really wrong. Give up. */ + if (sha1 == NULL) { + ret = NOTMUCH_STATUS_FILE_ERROR; + goto DONE; + } + + message_id = talloc_asprintf (message_file, "notmuch-sha1-%s", sha1); + free (sha1); + } + DONE: + if (ret == NOTMUCH_STATUS_SUCCESS) { + if (from_out) + *from_out = from; + if (subject_out) + *subject_out = subject; + if (to_out) + *to_out = to; + if (date_out) + *date_out = date; + if (message_id_out) + *message_id_out = message_id; + } + return ret; +} diff --git a/lib/notmuch-private.h b/lib/notmuch-private.h index a1ae4bd5..f3c058ab 100644 --- a/lib/notmuch-private.h +++ b/lib/notmuch-private.h @@ -433,6 +433,17 @@ const char * _notmuch_message_file_get_header (notmuch_message_file_t *message, const char *header); +notmuch_status_t +_notmuch_message_file_get_headers (notmuch_message_file_t *message_file, + const char **from_out, + const char **subject_out, + const char **to_out, + const char **date_out, + char **message_id_out); + +const char * +_notmuch_message_file_get_filename (notmuch_message_file_t *message); + /* index.cc */ notmuch_status_t -- 2.11.0