#!/usr/bin/env bash
# Tests exercising notmuch on messages with unusual or mislabeled encodings.
test_description="encoding issues"

# Load the shared test harness that sits next to this script; give up if it
# cannot be sourced. The path is quoted so a checkout directory containing
# whitespace does not split the argument to `.`.
. "$(dirname "$0")/test-lib.sh" || exit 1

# Subtest: a text/plain part declared with charset "unknown-8bit" must still
# be shown by `notmuch show`, with its body text intact.
test_begin_subtest "Message with text of unknown charset"
add_message '[content-type]="text/plain; charset=unknown-8bit"' \
    "[body]=irrelevant"
# gen_msg_id is presumably set by add_message (defined outside this file).
# The query is quoted so the id always reaches notmuch as a single argument.
output=$(notmuch show "id:${gen_msg_id}" 2>&1 | notmuch_show_sanitize_all)
# NOTE(review): notmuch's text format normally puts a form feed (^L) in front
# of each message{/header{/body{/part{ marker; none is visible in the expected
# text below -- confirm against real notmuch output.
test_expect_equal "$output" "message{ id:XXXXX depth:0 match:1 excluded:0 filename:XXXXX
header{
Notmuch Test Suite <test_suite@notmuchmail.org> (2001-01-05) (inbox unread)
Subject: Message with text of unknown charset
From: Notmuch Test Suite <test_suite@notmuchmail.org>
To: Notmuch Test Suite <test_suite@notmuchmail.org>
Date: GENERATED_DATE
header}
body{
part{ ID: 1, Content-type: text/plain
irrelevant
part}
body}
message}"

# Subtest: a word stored as raw 8-bit ISO-8859-2 bytes in the message body
# must be findable by searching for the same word typed in this script's own
# encoding.
test_begin_subtest "Search for ISO-8859-2 encoded message"
# The ISO-8859-2 characters are generated by the shell's $'...' octal escape
# sequences (\350 \362 \341 \350 \350 \355). The $'...' sits inside double
# quotes, so it is passed on literally and is presumably expanded later inside
# add_message -- confirm in test-lib.sh.
add_message '[content-type]="text/plain; charset=iso-8859-2"' \
    '[content-transfer-encoding]=8bit' \
    '[subject]="ISO-8859-2 encoded message"' \
    "[body]=$'Czech word tu\350\362\341\350\350\355 means pinguin\'s.'"
output=$(notmuch search tučňáččí 2>&1 | notmuch_show_sanitize_all)
test_expect_equal "$output" "thread:0000000000000002 2001-01-05 [1/1] Notmuch Test Suite; ISO-8859-2 encoded message (inbox unread)"

# Subtest: an RFC 2047 encoded word that contains literal spaces is expected
# to be decoded in the subject shown by `notmuch search`.
test_begin_subtest "RFC 2047 encoded word with spaces"
add_message '[subject]="=?utf-8?q?encoded word with spaces?="'
# Quote the query so the message id is always passed as a single argument.
output=$(notmuch search "id:${gen_msg_id}" 2>&1 | notmuch_search_sanitize)
test_expect_equal "$output" "thread:XXX 2001-01-05 [1/1] Notmuch Test Suite; encoded word with spaces (inbox unread)"

# Subtest: two RFC 2047 encoded words with nothing between them are expected
# to be decoded and joined directly in the displayed subject.
test_begin_subtest "RFC 2047 encoded words back to back"
add_message '[subject]="=?utf-8?q?encoded-words-back?==?utf-8?q?to-back?="'
# Quote the query so the message id is always passed as a single argument.
output=$(notmuch search "id:${gen_msg_id}" 2>&1 | notmuch_search_sanitize)
test_expect_equal "$output" "thread:XXX 2001-01-05 [1/1] Notmuch Test Suite; encoded-words-backto-back (inbox unread)"

# Subtest: RFC 2047 encoded words glued to plain text, with no separating
# whitespace on either side, are expected to be decoded in place.
test_begin_subtest "RFC 2047 encoded words without space before or after"
# The trailing space inside the single-quoted argument is part of the
# original test input and is kept as-is.
add_message '[subject]="=?utf-8?q?encoded?=word without=?utf-8?q?space?=" '
# Quote the query so the message id is always passed as a single argument.
output=$(notmuch search "id:${gen_msg_id}" 2>&1 | notmuch_search_sanitize)
test_expect_equal "$output" "thread:XXX 2001-01-05 [1/1] Notmuch Test Suite; encodedword withoutspace (inbox unread)"

# Subtest: a body labeled iso-8859-1 that actually carries the bytes 0x93 and
# 0x94 is expected to be shown with curly double quotes, i.e. treated as
# Windows-1252.
test_begin_subtest "Mislabeled Windows-1252 encoding"
add_message '[content-type]="text/plain; charset=iso-8859-1"' \
    "[body]=$'This text contains \x93Windows-1252\x94 character codes.'"
# NOTE(review): notmuch's text format normally puts a form feed (^L) in front
# of each message{/header{/body{/part{ marker; none is visible in the expected
# text below -- confirm against real notmuch output.
cat <<EOF > EXPECTED
message{ id:XXXXX depth:0 match:1 excluded:0 filename:XXXXX
header{
Notmuch Test Suite <test_suite@notmuchmail.org> (2001-01-05) (inbox unread)
Subject: Mislabeled Windows-1252 encoding
From: Notmuch Test Suite <test_suite@notmuchmail.org>
To: Notmuch Test Suite <test_suite@notmuchmail.org>
Date: GENERATED_DATE
header}
body{
part{ ID: 1, Content-type: text/plain
This text contains “Windows-1252” character codes.
part}
body}
message}
EOF
# Quote the query so the message id is always passed as a single argument.
notmuch show "id:${gen_msg_id}" 2>&1 | notmuch_show_sanitize_all > OUTPUT
test_expect_equal_file EXPECTED OUTPUT

# Close out the test script; test_done is presumably provided by test-lib.sh.
test_done