unofficial mirror of notmuch@notmuchmail.org
 help / color / mirror / code / Atom feed
From: Jani Nikula <jani@nikula.org>
To: Austin Clements <amdragon@MIT.EDU>, notmuch@notmuchmail.org
Cc: Vladimir Marek <vlmarek@volny.cz>
Subject: Re: [PATCH v2 2/2] new: Centralize file type stat-ing logic
Date: Tue, 08 May 2012 07:58:28 +0000	[thread overview]
Message-ID: <87r4uvdryz.fsf@nikula.org> (raw)
In-Reply-To: <1336429240-1114-3-git-send-email-amdragon@mit.edu>

On Mon,  7 May 2012 18:20:40 -0400, Austin Clements <amdragon@MIT.EDU> wrote:
> This moves our logic to get a file's type into one function.  This has
> several benefits: we can support OSes and file systems that do not
> provide dirent.d_type or always return DT_UNKNOWN, complex
> symlink-handling logic has been replaced by a simple stat fall-through
> in one place, and the error message for an un-stat-able file is more
> accurate (previously, the error always mentioned directories, even
> though a broken symlink is not a directory).

LGTM.

> ---
>  notmuch-new.c |  103 +++++++++++++++++++++++++++++++++++----------------------
>  test/new      |    2 +-
>  2 files changed, 64 insertions(+), 41 deletions(-)
> 
> diff --git a/notmuch-new.c b/notmuch-new.c
> index cb720cc..8955677 100644
> --- a/notmuch-new.c
> +++ b/notmuch-new.c
> @@ -154,6 +154,48 @@ dirent_sort_strcmp_name (const struct dirent **a, const struct dirent **b)
>      return strcmp ((*a)->d_name, (*b)->d_name);
>  }
>  
> +/* Return the type of a directory entry relative to path as a stat(2)
> + * mode.  Like stat, this follows symlinks.  Returns -1 and sets errno
> + * if the file's type cannot be determined (which includes dangling
> + * symlinks).
> + */
> +static int
> +dirent_type (const char *path, const struct dirent *entry)
> +{
> +    struct stat statbuf;
> +    char *abspath;
> +    int err, saved_errno;
> +
> +#ifdef _DIRENT_HAVE_D_TYPE
> +    /* Mapping from d_type to stat mode_t.  We omit DT_LNK so that
> +     * we'll fall through to stat and get the real file type. */
> +    static const mode_t modes[] = {
> +	[DT_BLK]  = S_IFBLK,
> +	[DT_CHR]  = S_IFCHR,
> +	[DT_DIR]  = S_IFDIR,
> +	[DT_FIFO] = S_IFIFO,
> +	[DT_REG]  = S_IFREG,
> +	[DT_SOCK] = S_IFSOCK
> +    };
> +    if (entry->d_type < ARRAY_SIZE(modes) && modes[entry->d_type])
> +	return modes[entry->d_type];
> +#endif
> +
> +    abspath = talloc_asprintf (NULL, "%s/%s", path, entry->d_name);
> +    if (!abspath) {
> +	errno = ENOMEM;
> +	return -1;
> +    }
> +    err = stat(abspath, &statbuf);
> +    saved_errno = errno;
> +    talloc_free (abspath);
> +    if (err < 0) {
> +	errno = saved_errno;
> +	return -1;
> +    }
> +    return statbuf.st_mode & S_IFMT;
> +}
> +
>  /* Test if the directory looks like a Maildir directory.
>   *
>   * Search through the array of directory entries to see if we can find all
> @@ -162,12 +204,12 @@ dirent_sort_strcmp_name (const struct dirent **a, const struct dirent **b)
>   * Return 1 if the directory looks like a Maildir and 0 otherwise.
>   */
>  static int
> -_entries_resemble_maildir (struct dirent **entries, int count)
> +_entries_resemble_maildir (const char *path, struct dirent **entries, int count)
>  {
>      int i, found = 0;
>  
>      for (i = 0; i < count; i++) {
> -	if (entries[i]->d_type != DT_DIR && entries[i]->d_type != DT_UNKNOWN)
> +	if (dirent_type (path, entries[i]) != S_IFDIR)
>  	    continue;
>  
>  	if (strcmp(entries[i]->d_name, "new") == 0 ||
> @@ -250,7 +292,7 @@ add_files_recursive (notmuch_database_t *notmuch,
>      notmuch_status_t status, ret = NOTMUCH_STATUS_SUCCESS;
>      notmuch_message_t *message = NULL;
>      struct dirent **fs_entries = NULL;
> -    int i, num_fs_entries;
> +    int i, num_fs_entries, entry_type;
>      notmuch_directory_t *directory;
>      notmuch_filenames_t *db_files = NULL;
>      notmuch_filenames_t *db_subdirs = NULL;
> @@ -317,7 +359,7 @@ add_files_recursive (notmuch_database_t *notmuch,
>      }
>  
>      /* Pass 1: Recurse into all sub-directories. */
> -    is_maildir = _entries_resemble_maildir (fs_entries, num_fs_entries);
> +    is_maildir = _entries_resemble_maildir (path, fs_entries, num_fs_entries);
>  
>      for (i = 0; i < num_fs_entries; i++) {
>  	if (interrupted)
> @@ -325,17 +367,16 @@ add_files_recursive (notmuch_database_t *notmuch,
>  
>  	entry = fs_entries[i];
>  
> -	/* We only want to descend into directories.
> -	 * But symlinks can be to directories too, of course.
> -	 *
> -	 * And if the filesystem doesn't tell us the file type in the
> -	 * scandir results, then it might be a directory (and if not,
> -	 * then we'll stat and return immediately in the next level of
> -	 * recursion). */
> -	if (entry->d_type != DT_DIR &&
> -	    entry->d_type != DT_LNK &&
> -	    entry->d_type != DT_UNKNOWN)
> -	{
> +	/* We only want to descend into directories (and symlinks to
> +	 * directories). */
> +	entry_type = dirent_type (path, entry);
> +	if (entry_type == -1) {
> +	    /* Be pessimistic, e.g. so we don't lose lots of mail just
> +	     * because a user broke a symlink. */
> +	    fprintf (stderr, "Error reading file %s/%s: %s\n",
> +		     path, entry->d_name, strerror (errno));
> +	    return NOTMUCH_STATUS_FILE_ERROR;
> +	} else if (entry_type != S_IFDIR) {
>  	    continue;
>  	}
>  
> @@ -425,31 +466,13 @@ add_files_recursive (notmuch_database_t *notmuch,
>  	    notmuch_filenames_move_to_next (db_subdirs);
>  	}
>  
> -	/* If we're looking at a symlink, we only want to add it if it
> -	 * links to a regular file, (and not to a directory, say).
> -	 *
> -	 * Similarly, if the file is of unknown type (due to filesystem
> -	 * limitations), then we also need to look closer.
> -	 *
> -	 * In either case, a stat does the trick.
> -	 */
> -	if (entry->d_type == DT_LNK || entry->d_type == DT_UNKNOWN) {
> -	    int err;
> -
> -	    next = talloc_asprintf (notmuch, "%s/%s", path, entry->d_name);
> -	    err = stat (next, &st);
> -	    talloc_free (next);
> -	    next = NULL;
> -
> -	    /* Don't emit an error for a link pointing nowhere, since
> -	     * the directory-traversal pass will have already done
> -	     * that. */
> -	    if (err)
> -		continue;
> -
> -	    if (! S_ISREG (st.st_mode))
> -		continue;
> -	} else if (entry->d_type != DT_REG) {
> +	/* Only add regular files (and symlinks to regular files). */
> +	entry_type = dirent_type (path, entry);
> +	if (entry_type == -1) {
> +	    fprintf (stderr, "Error reading file %s/%s: %s\n",
> +		     path, entry->d_name, strerror (errno));
> +	    return NOTMUCH_STATUS_FILE_ERROR;
> +	} else if (entry_type != S_IFREG) {
>  	    continue;
>  	}
>  
> diff --git a/test/new b/test/new
> index 26253db..e3900f5 100755
> --- a/test/new
> +++ b/test/new
> @@ -140,7 +140,7 @@ test_begin_subtest "Broken symlink aborts"
>  ln -s does-not-exist "${MAIL_DIR}/broken"
>  output=$(NOTMUCH_NEW 2>&1)
>  test_expect_equal "$output" \
> -"Error reading directory /run/shm/nm/tmp.new/mail/broken: No such file or directory
> +"Error reading file /run/shm/nm/tmp.new/mail/broken: No such file or directory
>  Note: A fatal error was encountered: Something went wrong trying to read or write a file
>  No new mail."
>  rm "${MAIL_DIR}/broken"
> -- 
> 1.7.10
> 
> _______________________________________________
> notmuch mailing list
> notmuch@notmuchmail.org
> http://notmuchmail.org/mailman/listinfo/notmuch

  reply	other threads:[~2012-05-08  7:58 UTC|newest]

Thread overview: 29+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2012-05-07 18:09 [PATCH 0/2] Better, more portable stat-ing logic for notmuch new Austin Clements
2012-05-07 18:09 ` [PATCH 1/2] test: Test notmuch new with a broken symlink Austin Clements
2012-05-07 18:09 ` [PATCH 2/2] new: Centralize file type stat-ing logic Austin Clements
2012-05-07 21:08   ` Jani Nikula
2012-05-07 21:14     ` Jani Nikula
2012-05-07 22:18     ` Austin Clements
2012-05-07 22:20 ` [PATCH v2 0/2] Better, more portable stat-ing logic for notmuch new Austin Clements
2012-05-07 22:20   ` [PATCH v2 1/2] test: Test notmuch new with a broken symlink Austin Clements
2012-05-07 22:20   ` [PATCH v2 2/2] new: Centralize file type stat-ing logic Austin Clements
2012-05-08  7:58     ` Jani Nikula [this message]
2012-05-08  8:33       ` Jani Nikula
2012-05-09 18:27         ` Austin Clements
2012-05-09 18:45   ` [PATCH v2 0/2] Better, more portable stat-ing logic for notmuch new Austin Clements
2012-05-24 19:31   ` [PATCH v3 0/4] " Austin Clements
2012-05-24 19:31     ` [PATCH v3 1/4] test: Test notmuch new with a broken symlink Austin Clements
2012-05-24 19:32     ` [PATCH v3 2/4] new: Centralize file type stat-ing logic Austin Clements
2012-05-24 19:32     ` [PATCH v3 3/4] new: Merge error checks from add_files and add_files_recursive Austin Clements
2012-05-24 20:57       ` Jani Nikula
2012-05-24 21:57         ` Austin Clements
2012-05-24 20:57       ` Jani Nikula
2012-05-24 21:08         ` Jani Nikula
2012-05-24 21:44           ` Jameson Graef Rollins
2012-05-24 19:32     ` [PATCH v3 4/4] new: Unify " Austin Clements
2012-05-24 22:01     ` [PATCH v4 0/4] Better, more portable stat-ing logic for notmuch new Austin Clements
2012-05-24 22:01       ` [PATCH v4 1/4] test: Test notmuch new with a broken symlink Austin Clements
2012-05-25  1:03         ` David Bremner
2012-05-24 22:01       ` [PATCH v4 2/4] new: Centralize file type stat-ing logic Austin Clements
2012-05-24 22:01       ` [PATCH v4 3/4] new: Merge error checks from add_files and add_files_recursive Austin Clements
2012-05-24 22:01       ` [PATCH v4 4/4] new: Unify " Austin Clements

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

  List information: https://notmuchmail.org/

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=87r4uvdryz.fsf@nikula.org \
    --to=jani@nikula.org \
    --cc=amdragon@MIT.EDU \
    --cc=notmuch@notmuchmail.org \
    --cc=vlmarek@volny.cz \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link.

  Be sure your reply has a Subject: header at the top and a blank line
  before the message body.
Code repositories for project(s) associated with this public inbox

	https://yhetil.org/notmuch.git/

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).