Convert non-UTF-8 parts to UTF-8 before indexing them

This fixes a bug that didn't allow to search for non-ASCII words such parts. The code here was copied from show_text_part_content(), because the show command already does the needed conversion when showing the message.
2024-11-25 04:18:08 +01:00 · 2012-02-24 08:36:22 +01:00 · 2012-02-24 08:36:22 +01:00 · 40edc971a8
commit 40edc971a8
parent 74f8f15adc
1 changed files with 15 additions and 0 deletions
--- a/lib/index.cc
+++ b/lib/index.cc
@ -315,6 +315,7 @@ _index_mime_part (notmuch_message_t *message,
    GByteArray *byte_array;
    GMimeContentDisposition *disposition;
    char *body;
    const char *charset;
    if (! part) {
 	fprintf (stderr, "Warning: Not indexing empty mime part.\n");
@ -390,6 +391,20 @@ _index_mime_part (notmuch_message_t *message,
    g_mime_stream_filter_add (GMIME_STREAM_FILTER (filter),
 			      discard_uuencode_filter);
    charset = g_mime_object_get_content_type_parameter (part, "charset");
    if (charset) {
 	GMimeFilter *charset_filter;
 	charset_filter = g_mime_filter_charset_new (charset, "UTF-8");
 	/* This result can be NULL for things like "unknown-8bit".
 	 * Don't set a NULL filter as that makes GMime print
 	 * annoying assertion-failure messages on stderr. */
 	if (charset_filter) {
 	    g_mime_stream_filter_add (GMIME_STREAM_FILTER (filter),
 				      charset_filter);
 	    g_object_unref (charset_filter);
 	}
    }
    wrapper = g_mime_part_get_content_object (GMIME_PART (part));
    if (wrapper)
 	g_mime_data_wrapper_write_to_stream (wrapper, filter);