1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
|
# -*- coding: utf-8 -*-
import unittest
import email
from mock import Mock
from kittystore.scrub import Scrubber
from kittystore.test import get_test_file
class TestScrubber(unittest.TestCase):
def test_attachment_1(self):
with open(get_test_file("attachment-1.txt")) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertEqual(store.add_attachment.call_count, 1)
store.add_attachment.assert_called_with(
'testlist@example.com', '505E5185.5040208@libero.it', 2,
'puntogil.vcf', 'text/x-vcard', "utf-8",
'begin:vcard\r\nfn:gil\r\nn:;gil\r\nversion:2.1\r\n'
'end:vcard\r\n\r\n')
self.assertEqual(contents,
"This is a test message.\r\n\r\n"
"\n-- \ndevel mailing list\ndevel@lists.fedoraproject.org\n"
"https://admin.fedoraproject.org/mailman/listinfo/devel\n"
)
def test_attachment_2(self):
with open(get_test_file("attachment-2.txt")) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertEqual(store.add_attachment.call_count, 1)
store.add_attachment.assert_called_with(
'testlist@example.com', '50619B7A.2030404@thelounge.net', 3,
'signature.asc', 'application/pgp-signature', None,
'-----BEGIN PGP SIGNATURE-----\r\nVersion: GnuPG v1.4.12 '
'(GNU/Linux)\r\nComment: Using GnuPG with Mozilla - '
'http://www.enigmail.net/\r\n\r\niEYEARECAAYFAlBhm3oACgkQhmBj'
'z394AnmMnQCcC+6tWcqE1dPQmIdRbLXgKGVp\r\nEeUAn2OqtaXaXaQV7rx+'
'SmOldmSzcFw4\r\n=OEJv\r\n-----END PGP SIGNATURE-----\r\n')
self.assertEqual(contents,
u"This is a test message\r\nNon-ascii chars: Hofm\xfchlgasse\r\n"
u"\n-- \ndevel mailing list\ndevel@lists.fedoraproject.org\n"
u"https://admin.fedoraproject.org/mailman/listinfo/devel\n"
)
def test_attachment_3(self):
with open(get_test_file("attachment-3.txt")) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertEqual(store.add_attachment.call_count, 2)
args_1, args_2 = store.add_attachment.call_args_list
# HTML part
self.assertEqual(args_1[0][0:6], ("testlist@example.com",
"CACec3Lup8apbhUMcm_Ktn1dPxx4eWr2y1RV7ZSYhy0tzmjSrgQ@mail.gmail.com",
3, "attachment.html", "text/html", "iso-8859-1"))
self.assertEqual(len(args_1[0][6]), 3134)
# Image attachment
self.assertEqual(args_2[0][0:6], ("testlist@example.com",
"CACec3Lup8apbhUMcm_Ktn1dPxx4eWr2y1RV7ZSYhy0tzmjSrgQ@mail.gmail.com",
4, "GeoffreyRoucourt.jpg", "image/jpeg", None))
self.assertEqual(len(args_2[0][6]), 282180)
# Scrubbed content
self.assertEqual(contents, u"This is a test message\r\n")
def test_html_email_1(self):
with open(get_test_file("html-email-1.txt")) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertEqual(store.add_attachment.call_count, 1)
args = store.add_attachment.call_args[0]
# HTML part
self.assertEqual(args[0:6], ("testlist@example.com",
"016001cd9b3b$b71efed0$255cfc70$@fr",
2, "attachment.html", "text/html", "iso-8859-1"))
self.assertEqual(len(args[6]), 2723)
# Scrubbed content
self.assertEqual(contents,
u"This is a test message\r\n"
u"Non-ASCII chars: r\xe9ponse fran\xe7ais \n")
def test_non_ascii_payload(self):
"""Scrubber must handle non-ascii messages"""
for enc in ["utf8", "iso8859"]:
with open(get_test_file("payload-%s.txt" % enc)) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertTrue(isinstance(contents, unicode))
self.assertEqual(contents, u'This message contains non-ascii '
u'characters:\n\xe9 \xe8 \xe7 \xe0 \xee \xef \xeb \u20ac\n')
def test_attachment_4(self):
with open(get_test_file("attachment-4.txt")) as email_file:
msg = email.message_from_file(email_file)
store = Mock()
scrubber = Scrubber("testlist@example.com", msg, store)
contents = scrubber.scrub()
self.assertEqual(store.add_attachment.call_count, 2)
args_1, args_2 = store.add_attachment.call_args_list
# HTML part
self.assertEqual(args_1[0][0:6], ("testlist@example.com",
"CAHmoxtXXb3un1C=ZvYNtz-eYghm-GH925gDVHyjhvL2YEsZ-Yw@mail.gmail.com",
3, "attachment.html", "text/html", "iso-8859-1"))
self.assertEqual(len(args_1[0][6]), 114)
# Image attachment
self.assertEqual(args_2[0][0:6], ("testlist@example.com",
"CAHmoxtXXb3un1C=ZvYNtz-eYghm-GH925gDVHyjhvL2YEsZ-Yw@mail.gmail.com",
4, u"todo-déjeuner.txt", "text/plain", "utf-8"))
self.assertEqual(len(args_2[0][6]), 112)
# Scrubbed content
self.assertEqual(contents, u'This is a test, HTML message with '
u'accented letters : \xe9 \xe8 \xe7 \xe0.\r\nAnd an '
u'attachment with an accented filename\r\n')
|