From: Jani Nikula Date: Sat, 30 Nov 2013 15:33:55 +0000 (+0200) Subject: [PATCH v2 6/7] lib: parse messages only once X-Git-Url: http://git.tremily.us/?a=commitdiff_plain;h=1ac5e251b9354ad5cbf4b5e318c1243ab7895a7a;p=notmuch-archives.git [PATCH v2 6/7] lib: parse messages only once --- diff --git a/79/73fe9c58986740e9416ca4fe40f2c09729e153 b/79/73fe9c58986740e9416ca4fe40f2c09729e153 new file mode 100644 index 000000000..5469668ff --- /dev/null +++ b/79/73fe9c58986740e9416ca4fe40f2c09729e153 @@ -0,0 +1,244 @@ +Return-Path: +X-Original-To: notmuch@notmuchmail.org +Delivered-To: notmuch@notmuchmail.org +Received: from localhost (localhost [127.0.0.1]) + by olra.theworths.org (Postfix) with ESMTP id 84A8C431FBC + for ; Sat, 30 Nov 2013 07:34:33 -0800 (PST) +X-Virus-Scanned: Debian amavisd-new at olra.theworths.org +X-Amavis-Alert: BAD HEADER SECTION, Duplicate header field: "References" +X-Spam-Flag: NO +X-Spam-Score: -0.7 +X-Spam-Level: +X-Spam-Status: No, score=-0.7 tagged_above=-999 required=5 + tests=[RCVD_IN_DNSWL_LOW=-0.7] autolearn=disabled +Received: from olra.theworths.org ([127.0.0.1]) + by localhost (olra.theworths.org [127.0.0.1]) (amavisd-new, port 10024) + with ESMTP id 1fT0U0XOyEFh for ; + Sat, 30 Nov 2013 07:34:28 -0800 (PST) +Received: from mail-ea0-f169.google.com (mail-ea0-f169.google.com + [209.85.215.169]) (using TLSv1 with cipher RC4-SHA (128/128 bits)) + (No client certificate requested) + by olra.theworths.org (Postfix) with ESMTPS id 942F6431FD9 + for ; Sat, 30 Nov 2013 07:34:15 -0800 (PST) +Received: by mail-ea0-f169.google.com with SMTP id l9so7787649eaj.28 + for ; Sat, 30 Nov 2013 07:34:14 -0800 (PST) +X-Google-DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/relaxed; + d=1e100.net; s=20130820; + h=x-gm-message-state:from:to:cc:subject:date:message-id:in-reply-to + :references:in-reply-to:references; + bh=ThStNBfWxPAsiQcOkE7qqDnegjbWfHa/WVixrzqyFXQ=; + b=hcrATJSawqQa3x9zqatur70fCH4dEh4vOGp7nOucGvH8cxWYGFke4H9fqenC5p4Afb + hdiLysHHBETB4qPOg+FPyXUzznfUcVxRUEoE4NTsisuzqOWnuc2JF4PwB5ZxlYJbzJSc + FuhdtwVpzBn+0QeXwBWVel2DfVb5YGireubapnJApqBmhzz9Azukkji1vgJXaX4x2FGO + x5gMxpL1D2mc/oCrn2ceHa5SOJzY5m3A6aQ9X1cfuOhSeKao4vvrh/6vLeRPLY88OAZQ + 4NmBAS5Zrcwqc/vevaIMpipX6nFBoCDjCVKAcA6EcrQ3UVFzoh/NDbn3Bb1cmS2kHv3+ + H04g== +X-Gm-Message-State: + ALoCoQlF/mz7/8ygFnuTxLHfIBGlA239gzkxRbOpMrDuFemeGVlRnm8vIgndpsVAnmUVPrL9DNdY +X-Received: by 10.15.86.75 with SMTP id h51mr1603384eez.44.1385825654569; + Sat, 30 Nov 2013 07:34:14 -0800 (PST) +Received: from localhost (dsl-hkibrasgw2-58c36f-91.dhcp.inet.fi. + [88.195.111.91]) + by mx.google.com with ESMTPSA id a45sm51848238eem.6.2013.11.30.07.34.13 + for + (version=TLSv1.2 cipher=RC4-SHA bits=128/128); + Sat, 30 Nov 2013 07:34:14 -0800 (PST) +From: Jani Nikula +To: notmuch@notmuchmail.org +Subject: [PATCH v2 6/7] lib: parse messages only once +Date: Sat, 30 Nov 2013 17:33:55 +0200 +Message-Id: + <36ef439cffa92d7889a5b1ae984016d3e944edc1.1385825425.git.jani@nikula.org> +X-Mailer: git-send-email 1.8.4.2 +In-Reply-To: +References: +In-Reply-To: +References: +X-BeenThere: notmuch@notmuchmail.org +X-Mailman-Version: 2.1.13 +Precedence: list +List-Id: "Use and development of the notmuch mail system." + +List-Unsubscribe: , + +List-Archive: +List-Post: +List-Help: +List-Subscribe: , + +X-List-Received-Date: Sat, 30 Nov 2013 15:34:33 -0000 + +Make the necessary changes to only do one gmime parse pass during +indexing. +--- + lib/database.cc | 2 +- + lib/index.cc | 59 ++++++--------------------------------------------- + lib/message-file.c | 9 ++++++++ + lib/notmuch-private.h | 16 ++++++++++++-- + 4 files changed, 30 insertions(+), 56 deletions(-) + +diff --git a/lib/database.cc b/lib/database.cc +index d1bea88..3a29fe7 100644 +--- a/lib/database.cc ++++ b/lib/database.cc +@@ -2029,7 +2029,7 @@ notmuch_database_add_message (notmuch_database_t *notmuch, + date = notmuch_message_file_get_header (message_file, "date"); + _notmuch_message_set_header_values (message, date, from, subject); + +- ret = _notmuch_message_index_file (message, filename); ++ ret = _notmuch_message_index_file (message, message_file); + if (ret) + goto DONE; + } else { +diff --git a/lib/index.cc b/lib/index.cc +index 976e49f..71397da 100644 +--- a/lib/index.cc ++++ b/lib/index.cc +@@ -425,52 +425,15 @@ _index_mime_part (notmuch_message_t *message, + + notmuch_status_t + _notmuch_message_index_file (notmuch_message_t *message, +- const char *filename) ++ notmuch_message_file_t *message_file) + { +- GMimeStream *stream = NULL; +- GMimeParser *parser = NULL; +- GMimeMessage *mime_message = NULL; ++ GMimeMessage *mime_message; + InternetAddressList *addresses; +- FILE *file = NULL; + const char *from, *subject; +- notmuch_status_t ret = NOTMUCH_STATUS_SUCCESS; +- static int initialized = 0; +- char from_buf[5]; +- bool is_mbox = false; +- +- if (! initialized) { +- g_mime_init (GMIME_ENABLE_RFC2047_WORKAROUNDS); +- initialized = 1; +- } +- +- file = fopen (filename, "r"); +- if (! file) { +- fprintf (stderr, "Error opening %s: %s\n", filename, strerror (errno)); +- ret = NOTMUCH_STATUS_FILE_ERROR; +- goto DONE; +- } +- +- /* Is this mbox? */ +- if (fread (from_buf, sizeof (from_buf), 1, file) == 1 && +- strncmp (from_buf, "From ", 5) == 0) +- is_mbox = true; +- rewind (file); +- +- /* Evil GMime steals my FILE* here so I won't fclose it. */ +- stream = g_mime_stream_file_new (file); +- +- parser = g_mime_parser_new_with_stream (stream); +- g_mime_parser_set_scan_from (parser, is_mbox); + +- mime_message = g_mime_parser_construct_message (parser); +- +- if (is_mbox) { +- if (!g_mime_parser_eos (parser)) { +- /* This is a multi-message mbox. */ +- ret = NOTMUCH_STATUS_FILE_NOT_EMAIL; +- goto DONE; +- } +- } ++ mime_message = notmuch_message_file_get_mime_message (message_file); ++ if (! mime_message) ++ return NOTMUCH_STATUS_FILE_NOT_EMAIL; /* more like internal error */ + + from = g_mime_message_get_sender (mime_message); + +@@ -491,15 +454,5 @@ _notmuch_message_index_file (notmuch_message_t *message, + + _index_mime_part (message, g_mime_message_get_mime_part (mime_message)); + +- DONE: +- if (mime_message) +- g_object_unref (mime_message); +- +- if (parser) +- g_object_unref (parser); +- +- if (stream) +- g_object_unref (stream); +- +- return ret; ++ return NOTMUCH_STATUS_SUCCESS; + } +diff --git a/lib/message-file.c b/lib/message-file.c +index 3c653d1..0bd8c2e 100644 +--- a/lib/message-file.c ++++ b/lib/message-file.c +@@ -247,6 +247,15 @@ mboxes is deprecated and may be removed in the future.\n", message->filename); + return NOTMUCH_STATUS_SUCCESS; + } + ++GMimeMessage * ++notmuch_message_file_get_mime_message (notmuch_message_file_t *message) ++{ ++ if (! message->parsed) ++ return NULL; ++ ++ return message->message; ++} ++ + /* return NULL on errors, empty string for non-existing headers */ + const char * + notmuch_message_file_get_header (notmuch_message_file_t *message, +diff --git a/lib/notmuch-private.h b/lib/notmuch-private.h +index 7277df1..7559521 100644 +--- a/lib/notmuch-private.h ++++ b/lib/notmuch-private.h +@@ -46,6 +46,8 @@ NOTMUCH_BEGIN_DECLS + + #include + ++#include ++ + #include "xutil.h" + #include "error_util.h" + +@@ -320,9 +322,11 @@ notmuch_message_get_author (notmuch_message_t *message); + + /* index.cc */ + ++typedef struct _notmuch_message_file notmuch_message_file_t; ++ + notmuch_status_t + _notmuch_message_index_file (notmuch_message_t *message, +- const char *filename); ++ notmuch_message_file_t *message_file); + + /* message-file.c */ + +@@ -330,7 +334,6 @@ _notmuch_message_index_file (notmuch_message_t *message, + * into the public interface in notmuch.h + */ + +-typedef struct _notmuch_message_file notmuch_message_file_t; + + /* Open a file containing a single email message. + * +@@ -377,6 +380,15 @@ void + notmuch_message_file_restrict_headersv (notmuch_message_file_t *message, + va_list va_headers); + ++/* Get the gmime message of a parsed message file. ++ * ++ * Returns NULL if the message file has not been parsed. ++ * ++ * XXX: Would be nice to not have to expose GMimeMessage here. ++ */ ++GMimeMessage * ++notmuch_message_file_get_mime_message (notmuch_message_file_t *message); ++ + /* Get the value of the specified header from the message as a UTF-8 string. + * + * The header name is case insensitive. +-- +1.8.4.2 +