1 Return-Path: <amdragon@mit.edu>
\r
2 X-Original-To: notmuch@notmuchmail.org
\r
3 Delivered-To: notmuch@notmuchmail.org
\r
4 Received: from localhost (localhost [127.0.0.1])
\r
5 by olra.theworths.org (Postfix) with ESMTP id EEEDE431FCF
\r
6 for <notmuch@notmuchmail.org>; Thu, 24 May 2012 12:32:10 -0700 (PDT)
\r
7 X-Virus-Scanned: Debian amavisd-new at olra.theworths.org
\r
11 X-Spam-Status: No, score=-0.7 tagged_above=-999 required=5
\r
12 tests=[RCVD_IN_DNSWL_LOW=-0.7] autolearn=disabled
\r
13 Received: from olra.theworths.org ([127.0.0.1])
\r
14 by localhost (olra.theworths.org [127.0.0.1]) (amavisd-new, port 10024)
\r
15 with ESMTP id yyKD29v-pYp3 for <notmuch@notmuchmail.org>;
\r
16 Thu, 24 May 2012 12:32:09 -0700 (PDT)
\r
17 Received: from dmz-mailsec-scanner-5.mit.edu (DMZ-MAILSEC-SCANNER-5.MIT.EDU
\r
19 by olra.theworths.org (Postfix) with ESMTP id 68701431FBD
\r
20 for <notmuch@notmuchmail.org>; Thu, 24 May 2012 12:32:09 -0700 (PDT)
\r
21 X-AuditID: 12074422-b7fd66d0000008f9-09-4fbe8cb8ca6f
\r
22 Received: from mailhub-auth-4.mit.edu ( [18.7.62.39])
\r
23 by dmz-mailsec-scanner-5.mit.edu (Symantec Messaging Gateway) with SMTP
\r
24 id 0E.9B.02297.8BC8EBF4; Thu, 24 May 2012 15:32:08 -0400 (EDT)
\r
25 Received: from outgoing.mit.edu (OUTGOING-AUTH.MIT.EDU [18.7.22.103])
\r
26 by mailhub-auth-4.mit.edu (8.13.8/8.9.2) with ESMTP id q4OJW7Kt031199;
\r
27 Thu, 24 May 2012 15:32:07 -0400
\r
28 Received: from drake.mit.edu (26-4-163.dynamic.csail.mit.edu [18.26.4.163])
\r
29 (authenticated bits=0)
\r
30 (User authenticated as amdragon@ATHENA.MIT.EDU)
\r
31 by outgoing.mit.edu (8.13.6/8.12.4) with ESMTP id q4OJW5w8014460
\r
32 (version=TLSv1/SSLv3 cipher=AES256-SHA bits=256 verify=NOT);
\r
33 Thu, 24 May 2012 15:32:07 -0400 (EDT)
\r
34 Received: from amthrax by drake.mit.edu with local (Exim 4.77)
\r
35 (envelope-from <amdragon@mit.edu>)
\r
36 id 1SXdlT-0003RZ-Tb; Thu, 24 May 2012 15:32:03 -0400
\r
37 From: Austin Clements <amdragon@MIT.EDU>
\r
38 To: notmuch@notmuchmail.org
\r
39 Subject: [PATCH v3 2/4] new: Centralize file type stat-ing logic
\r
40 Date: Thu, 24 May 2012 15:32:00 -0400
\r
41 Message-Id: <1337887922-13163-3-git-send-email-amdragon@mit.edu>
\r
42 X-Mailer: git-send-email 1.7.10
\r
43 In-Reply-To: <1337887922-13163-1-git-send-email-amdragon@mit.edu>
\r
44 References: <1336429240-1114-1-git-send-email-amdragon@mit.edu>
\r
45 <1337887922-13163-1-git-send-email-amdragon@mit.edu>
\r
46 X-Brightmail-Tracker:
\r
47 H4sIAAAAAAAAA+NgFtrEIsWRmVeSWpSXmKPExsUixG6nrrujZ5+/wbItPBbXb85kdmD0eLbq
\r
48 FnMAYxSXTUpqTmZZapG+XQJXxtvNX9kLLhlVNDxdwd7AuFC9i5GTQ0LARGLPjQksELaYxIV7
\r
49 69m6GLk4hAT2MUrs6DjJCOFsYJT4eaKbCcI5ziQx48ByVghnFqPEprtfGUH62QQ0JLbtXw5m
\r
50 iwhIS+y8OxuoiIODWUBN4k+XCkhYWMBBomXWFLAwi4CqxOxfeSBhXqDwnuc7WSGukJd4er+P
\r
51 DcTmFHCUuPBkMhOILSRQJnH88S6mCYz8CxgZVjHKpuRW6eYmZuYUpybrFicn5uWlFuma6uVm
\r
52 luilppRuYgQHjYvSDsafB5UOMQpwMCrx8LJE7/MXYk0sK67MPcQoycGkJMrL1w0U4kvKT6nM
\r
53 SCzOiC8qzUktPsQowcGsJMIrGAmU401JrKxKLcqHSUlzsCiJ867R3O0vJJCeWJKanZpakFoE
\r
54 k5Xh4FCS4GUBRoeQYFFqempFWmZOCUKaiYMTZDgP0PB9IIt5iwsSc4sz0yHypxgVpcR5L4Ik
\r
55 BEASGaV5cL2wqH7FKA70ijDvX5AqHmBCgOt+BTSYCWjwlsd7QQaXJCKkpBoYJRUY3O7bc9Z5
\r
56 B/pfPbT1177zN0XaN9txrZ7CEVfLWXgi7t81gSWdv+/c/h/Sk2xd0v7O0mrj5Z1zal7lt/lv
\r
57 2FG8aPUZncIZxuGPvoTc1Examb8384yOXaTHXIWW31uC/+0RORDt2JudcDiFhanounNBj/l/
\r
58 CY23Gl8uHlH/5mf8MuqQ5e4CJZbijERDLeai4kQATUuuWcUCAAA=
\r
59 X-BeenThere: notmuch@notmuchmail.org
\r
60 X-Mailman-Version: 2.1.13
\r
62 List-Id: "Use and development of the notmuch mail system."
\r
63 <notmuch.notmuchmail.org>
\r
64 List-Unsubscribe: <http://notmuchmail.org/mailman/options/notmuch>,
\r
65 <mailto:notmuch-request@notmuchmail.org?subject=unsubscribe>
\r
66 List-Archive: <http://notmuchmail.org/pipermail/notmuch>
\r
67 List-Post: <mailto:notmuch@notmuchmail.org>
\r
68 List-Help: <mailto:notmuch-request@notmuchmail.org?subject=help>
\r
69 List-Subscribe: <http://notmuchmail.org/mailman/listinfo/notmuch>,
\r
70 <mailto:notmuch-request@notmuchmail.org?subject=subscribe>
\r
71 X-List-Received-Date: Thu, 24 May 2012 19:32:11 -0000
\r
73 This moves our logic to get a file's type into one function. This has
\r
74 several benefits: we can support OSes and file systems that do not
\r
75 provide dirent.d_type or always return DT_UNKNOWN, complex
\r
76 symlink-handling logic has been replaced by a simple stat fall-through
\r
77 in one place, and the error message for an un-stat-able file is more
\r
78 accurate (previously, the error always mentioned directories, even
\r
79 though a broken symlink is not a directory).
\r
81 notmuch-new.c | 103 +++++++++++++++++++++++++++++++++++----------------------
\r
83 2 files changed, 64 insertions(+), 41 deletions(-)
\r
85 diff --git a/notmuch-new.c b/notmuch-new.c
\r
86 index 72dd558..c64f1a7 100644
\r
89 @@ -154,6 +154,48 @@ dirent_sort_strcmp_name (const struct dirent **a, const struct dirent **b)
\r
90 return strcmp ((*a)->d_name, (*b)->d_name);
\r
93 +/* Return the type of a directory entry relative to path as a stat(2)
\r
94 + * mode. Like stat, this follows symlinks. Returns -1 and sets errno
\r
95 + * if the file's type cannot be determined (which includes dangling
\r
99 +dirent_type (const char *path, const struct dirent *entry)
\r
101 + struct stat statbuf;
\r
103 + int err, saved_errno;
\r
105 +#ifdef _DIRENT_HAVE_D_TYPE
\r
106 + /* Mapping from d_type to stat mode_t. We omit DT_LNK so that
\r
107 + * we'll fall through to stat and get the real file type. */
\r
108 + static const mode_t modes[] = {
\r
109 + [DT_BLK] = S_IFBLK,
\r
110 + [DT_CHR] = S_IFCHR,
\r
111 + [DT_DIR] = S_IFDIR,
\r
112 + [DT_FIFO] = S_IFIFO,
\r
113 + [DT_REG] = S_IFREG,
\r
114 + [DT_SOCK] = S_IFSOCK
\r
116 + if (entry->d_type < ARRAY_SIZE(modes) && modes[entry->d_type])
\r
117 + return modes[entry->d_type];
\r
120 + abspath = talloc_asprintf (NULL, "%s/%s", path, entry->d_name);
\r
125 + err = stat(abspath, &statbuf);
\r
126 + saved_errno = errno;
\r
127 + talloc_free (abspath);
\r
129 + errno = saved_errno;
\r
132 + return statbuf.st_mode & S_IFMT;
\r
135 /* Test if the directory looks like a Maildir directory.
\r
137 * Search through the array of directory entries to see if we can find all
\r
138 @@ -162,12 +204,12 @@ dirent_sort_strcmp_name (const struct dirent **a, const struct dirent **b)
\r
139 * Return 1 if the directory looks like a Maildir and 0 otherwise.
\r
142 -_entries_resemble_maildir (struct dirent **entries, int count)
\r
143 +_entries_resemble_maildir (const char *path, struct dirent **entries, int count)
\r
147 for (i = 0; i < count; i++) {
\r
148 - if (entries[i]->d_type != DT_DIR && entries[i]->d_type != DT_UNKNOWN)
\r
149 + if (dirent_type (path, entries[i]) != S_IFDIR)
\r
152 if (strcmp(entries[i]->d_name, "new") == 0 ||
\r
153 @@ -250,7 +292,7 @@ add_files_recursive (notmuch_database_t *notmuch,
\r
154 notmuch_status_t status, ret = NOTMUCH_STATUS_SUCCESS;
\r
155 notmuch_message_t *message = NULL;
\r
156 struct dirent **fs_entries = NULL;
\r
157 - int i, num_fs_entries = 0;
\r
158 + int i, num_fs_entries = 0, entry_type;
\r
159 notmuch_directory_t *directory;
\r
160 notmuch_filenames_t *db_files = NULL;
\r
161 notmuch_filenames_t *db_subdirs = NULL;
\r
162 @@ -300,7 +342,7 @@ add_files_recursive (notmuch_database_t *notmuch,
\r
165 /* Pass 1: Recurse into all sub-directories. */
\r
166 - is_maildir = _entries_resemble_maildir (fs_entries, num_fs_entries);
\r
167 + is_maildir = _entries_resemble_maildir (path, fs_entries, num_fs_entries);
\r
169 for (i = 0; i < num_fs_entries; i++) {
\r
171 @@ -308,17 +350,16 @@ add_files_recursive (notmuch_database_t *notmuch,
\r
173 entry = fs_entries[i];
\r
175 - /* We only want to descend into directories.
\r
176 - * But symlinks can be to directories too, of course.
\r
178 - * And if the filesystem doesn't tell us the file type in the
\r
179 - * scandir results, then it might be a directory (and if not,
\r
180 - * then we'll stat and return immediately in the next level of
\r
182 - if (entry->d_type != DT_DIR &&
\r
183 - entry->d_type != DT_LNK &&
\r
184 - entry->d_type != DT_UNKNOWN)
\r
186 + /* We only want to descend into directories (and symlinks to
\r
187 + * directories). */
\r
188 + entry_type = dirent_type (path, entry);
\r
189 + if (entry_type == -1) {
\r
190 + /* Be pessimistic, e.g. so we don't lose lots of mail just
\r
191 + * because a user broke a symlink. */
\r
192 + fprintf (stderr, "Error reading file %s/%s: %s\n",
\r
193 + path, entry->d_name, strerror (errno));
\r
194 + return NOTMUCH_STATUS_FILE_ERROR;
\r
195 + } else if (entry_type != S_IFDIR) {
\r
199 @@ -407,31 +448,13 @@ add_files_recursive (notmuch_database_t *notmuch,
\r
200 notmuch_filenames_move_to_next (db_subdirs);
\r
203 - /* If we're looking at a symlink, we only want to add it if it
\r
204 - * links to a regular file, (and not to a directory, say).
\r
206 - * Similarly, if the file is of unknown type (due to filesystem
\r
207 - * limitations), then we also need to look closer.
\r
209 - * In either case, a stat does the trick.
\r
211 - if (entry->d_type == DT_LNK || entry->d_type == DT_UNKNOWN) {
\r
214 - next = talloc_asprintf (notmuch, "%s/%s", path, entry->d_name);
\r
215 - err = stat (next, &st);
\r
216 - talloc_free (next);
\r
219 - /* Don't emit an error for a link pointing nowhere, since
\r
220 - * the directory-traversal pass will have already done
\r
225 - if (! S_ISREG (st.st_mode))
\r
227 - } else if (entry->d_type != DT_REG) {
\r
228 + /* Only add regular files (and symlinks to regular files). */
\r
229 + entry_type = dirent_type (path, entry);
\r
230 + if (entry_type == -1) {
\r
231 + fprintf (stderr, "Error reading file %s/%s: %s\n",
\r
232 + path, entry->d_name, strerror (errno));
\r
233 + return NOTMUCH_STATUS_FILE_ERROR;
\r
234 + } else if (entry_type != S_IFREG) {
\r
238 diff --git a/test/new b/test/new
\r
239 index a7bc146..cab7c01 100755
\r
242 @@ -140,7 +140,7 @@ test_begin_subtest "Broken symlink aborts"
\r
243 ln -s does-not-exist "${MAIL_DIR}/broken"
\r
244 output=$(NOTMUCH_NEW 2>&1)
\r
245 test_expect_equal "$output" \
\r
246 -"Error reading directory ${MAIL_DIR}/broken: No such file or directory
\r
247 +"Error reading file ${MAIL_DIR}/broken: No such file or directory
\r
248 Note: A fatal error was encountered: Something went wrong trying to read or write a file
\r
250 rm "${MAIL_DIR}/broken"
\r