• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1import datetime
2import textwrap
3import unittest
4from email import errors
5from email import policy
6from email.message import Message
7from test.test_email import TestEmailBase, parameterize
8from email import headerregistry
9from email.headerregistry import Address, Group
10from test.support import ALWAYS_EQ
11
12
13DITTO = object()
14
15
16class TestHeaderRegistry(TestEmailBase):
17
18    def test_arbitrary_name_unstructured(self):
19        factory = headerregistry.HeaderRegistry()
20        h = factory('foobar', 'test')
21        self.assertIsInstance(h, headerregistry.BaseHeader)
22        self.assertIsInstance(h, headerregistry.UnstructuredHeader)
23
24    def test_name_case_ignored(self):
25        factory = headerregistry.HeaderRegistry()
26        # Whitebox check that test is valid
27        self.assertNotIn('Subject', factory.registry)
28        h = factory('Subject', 'test')
29        self.assertIsInstance(h, headerregistry.BaseHeader)
30        self.assertIsInstance(h, headerregistry.UniqueUnstructuredHeader)
31
32    class FooBase:
33        def __init__(self, *args, **kw):
34            pass
35
36    def test_override_default_base_class(self):
37        factory = headerregistry.HeaderRegistry(base_class=self.FooBase)
38        h = factory('foobar', 'test')
39        self.assertIsInstance(h, self.FooBase)
40        self.assertIsInstance(h, headerregistry.UnstructuredHeader)
41
42    class FooDefault:
43        parse = headerregistry.UnstructuredHeader.parse
44
45    def test_override_default_class(self):
46        factory = headerregistry.HeaderRegistry(default_class=self.FooDefault)
47        h = factory('foobar', 'test')
48        self.assertIsInstance(h, headerregistry.BaseHeader)
49        self.assertIsInstance(h, self.FooDefault)
50
51    def test_override_default_class_only_overrides_default(self):
52        factory = headerregistry.HeaderRegistry(default_class=self.FooDefault)
53        h = factory('subject', 'test')
54        self.assertIsInstance(h, headerregistry.BaseHeader)
55        self.assertIsInstance(h, headerregistry.UniqueUnstructuredHeader)
56
57    def test_dont_use_default_map(self):
58        factory = headerregistry.HeaderRegistry(use_default_map=False)
59        h = factory('subject', 'test')
60        self.assertIsInstance(h, headerregistry.BaseHeader)
61        self.assertIsInstance(h, headerregistry.UnstructuredHeader)
62
63    def test_map_to_type(self):
64        factory = headerregistry.HeaderRegistry()
65        h1 = factory('foobar', 'test')
66        factory.map_to_type('foobar', headerregistry.UniqueUnstructuredHeader)
67        h2 = factory('foobar', 'test')
68        self.assertIsInstance(h1, headerregistry.BaseHeader)
69        self.assertIsInstance(h1, headerregistry.UnstructuredHeader)
70        self.assertIsInstance(h2, headerregistry.BaseHeader)
71        self.assertIsInstance(h2, headerregistry.UniqueUnstructuredHeader)
72
73
74class TestHeaderBase(TestEmailBase):
75
76    factory = headerregistry.HeaderRegistry()
77
78    def make_header(self, name, value):
79        return self.factory(name, value)
80
81
82class TestBaseHeaderFeatures(TestHeaderBase):
83
84    def test_str(self):
85        h = self.make_header('subject', 'this is a test')
86        self.assertIsInstance(h, str)
87        self.assertEqual(h, 'this is a test')
88        self.assertEqual(str(h), 'this is a test')
89
90    def test_substr(self):
91        h = self.make_header('subject', 'this is a test')
92        self.assertEqual(h[5:7], 'is')
93
94    def test_has_name(self):
95        h = self.make_header('subject', 'this is a test')
96        self.assertEqual(h.name, 'subject')
97
98    def _test_attr_ro(self, attr):
99        h = self.make_header('subject', 'this is a test')
100        with self.assertRaises(AttributeError):
101            setattr(h, attr, 'foo')
102
103    def test_name_read_only(self):
104        self._test_attr_ro('name')
105
106    def test_defects_read_only(self):
107        self._test_attr_ro('defects')
108
109    def test_defects_is_tuple(self):
110        h = self.make_header('subject', 'this is a test')
111        self.assertEqual(len(h.defects), 0)
112        self.assertIsInstance(h.defects, tuple)
113        # Make sure it is still true when there are defects.
114        h = self.make_header('date', '')
115        self.assertEqual(len(h.defects), 1)
116        self.assertIsInstance(h.defects, tuple)
117
118    # XXX: FIXME
119    #def test_CR_in_value(self):
120    #    # XXX: this also re-raises the issue of embedded headers,
121    #    # need test and solution for that.
122    #    value = '\r'.join(['this is', ' a test'])
123    #    h = self.make_header('subject', value)
124    #    self.assertEqual(h, value)
125    #    self.assertDefectsEqual(h.defects, [errors.ObsoleteHeaderDefect])
126
127
128@parameterize
129class TestUnstructuredHeader(TestHeaderBase):
130
131    def string_as_value(self,
132                        source,
133                        decoded,
134                        *args):
135        l = len(args)
136        defects = args[0] if l>0 else []
137        header = 'Subject:' + (' ' if source else '')
138        folded = header + (args[1] if l>1 else source) + '\n'
139        h = self.make_header('Subject', source)
140        self.assertEqual(h, decoded)
141        self.assertDefectsEqual(h.defects, defects)
142        self.assertEqual(h.fold(policy=policy.default), folded)
143
144    string_params = {
145
146        'rfc2047_simple_quopri': (
147            '=?utf-8?q?this_is_a_test?=',
148            'this is a test',
149            [],
150            'this is a test'),
151
152        'rfc2047_gb2312_base64': (
153            '=?gb2312?b?1eLKx9bQzsSy4srUo6E=?=',
154            '\u8fd9\u662f\u4e2d\u6587\u6d4b\u8bd5\uff01',
155            [],
156            '=?utf-8?b?6L+Z5piv5Lit5paH5rWL6K+V77yB?='),
157
158        'rfc2047_simple_nonascii_quopri': (
159            '=?utf-8?q?=C3=89ric?=',
160            'Éric'),
161
162        'rfc2047_quopri_with_regular_text': (
163            'The =?utf-8?q?=C3=89ric=2C?= Himself',
164            'The Éric, Himself'),
165
166    }
167
168
169@parameterize
170class TestDateHeader(TestHeaderBase):
171
172    datestring = 'Sun, 23 Sep 2001 20:10:55 -0700'
173    utcoffset = datetime.timedelta(hours=-7)
174    tz = datetime.timezone(utcoffset)
175    dt = datetime.datetime(2001, 9, 23, 20, 10, 55, tzinfo=tz)
176
177    def test_parse_date(self):
178        h = self.make_header('date', self.datestring)
179        self.assertEqual(h, self.datestring)
180        self.assertEqual(h.datetime, self.dt)
181        self.assertEqual(h.datetime.utcoffset(), self.utcoffset)
182        self.assertEqual(h.defects, ())
183
184    def test_set_from_datetime(self):
185        h = self.make_header('date', self.dt)
186        self.assertEqual(h, self.datestring)
187        self.assertEqual(h.datetime, self.dt)
188        self.assertEqual(h.defects, ())
189
190    def test_date_header_properties(self):
191        h = self.make_header('date', self.datestring)
192        self.assertIsInstance(h, headerregistry.UniqueDateHeader)
193        self.assertEqual(h.max_count, 1)
194        self.assertEqual(h.defects, ())
195
196    def test_resent_date_header_properties(self):
197        h = self.make_header('resent-date', self.datestring)
198        self.assertIsInstance(h, headerregistry.DateHeader)
199        self.assertEqual(h.max_count, None)
200        self.assertEqual(h.defects, ())
201
202    def test_no_value_is_defect(self):
203        h = self.make_header('date', '')
204        self.assertEqual(len(h.defects), 1)
205        self.assertIsInstance(h.defects[0], errors.HeaderMissingRequiredValue)
206
207    def test_datetime_read_only(self):
208        h = self.make_header('date', self.datestring)
209        with self.assertRaises(AttributeError):
210            h.datetime = 'foo'
211
212    def test_set_date_header_from_datetime(self):
213        m = Message(policy=policy.default)
214        m['Date'] = self.dt
215        self.assertEqual(m['Date'], self.datestring)
216        self.assertEqual(m['Date'].datetime, self.dt)
217
218
219@parameterize
220class TestContentTypeHeader(TestHeaderBase):
221
222    def content_type_as_value(self,
223                              source,
224                              content_type,
225                              maintype,
226                              subtype,
227                              *args):
228        l = len(args)
229        parmdict = args[0] if l>0 else {}
230        defects =  args[1] if l>1 else []
231        decoded =  args[2] if l>2 and args[2] is not DITTO else source
232        header = 'Content-Type:' + ' ' if source else ''
233        folded = args[3] if l>3 else header + decoded + '\n'
234        h = self.make_header('Content-Type', source)
235        self.assertEqual(h.content_type, content_type)
236        self.assertEqual(h.maintype, maintype)
237        self.assertEqual(h.subtype, subtype)
238        self.assertEqual(h.params, parmdict)
239        with self.assertRaises(TypeError):
240            h.params['abc'] = 'xyz'   # make sure params is read-only.
241        self.assertDefectsEqual(h.defects, defects)
242        self.assertEqual(h, decoded)
243        self.assertEqual(h.fold(policy=policy.default), folded)
244
245    content_type_params = {
246
247        # Examples from RFC 2045.
248
249        'RFC_2045_1': (
250            'text/plain; charset=us-ascii (Plain text)',
251            'text/plain',
252            'text',
253            'plain',
254            {'charset': 'us-ascii'},
255            [],
256            'text/plain; charset="us-ascii"'),
257
258        'RFC_2045_2': (
259            'text/plain; charset=us-ascii',
260            'text/plain',
261            'text',
262            'plain',
263            {'charset': 'us-ascii'},
264            [],
265            'text/plain; charset="us-ascii"'),
266
267        'RFC_2045_3': (
268            'text/plain; charset="us-ascii"',
269            'text/plain',
270            'text',
271            'plain',
272            {'charset': 'us-ascii'}),
273
274        # RFC 2045 5.2 says syntactically invalid values are to be treated as
275        # text/plain.
276
277        'no_subtype_in_content_type': (
278            'text/',
279            'text/plain',
280            'text',
281            'plain',
282            {},
283            [errors.InvalidHeaderDefect]),
284
285        'no_slash_in_content_type': (
286            'foo',
287            'text/plain',
288            'text',
289            'plain',
290            {},
291            [errors.InvalidHeaderDefect]),
292
293        'junk_text_in_content_type': (
294            '<crazy "stuff">',
295            'text/plain',
296            'text',
297            'plain',
298            {},
299            [errors.InvalidHeaderDefect]),
300
301        'too_many_slashes_in_content_type': (
302            'image/jpeg/foo',
303            'text/plain',
304            'text',
305            'plain',
306            {},
307            [errors.InvalidHeaderDefect]),
308
309        # But unknown names are OK.  We could make non-IANA names a defect, but
310        # by not doing so we make ourselves future proof.  The fact that they
311        # are unknown will be detectable by the fact that they don't appear in
312        # the mime_registry...and the application is free to extend that list
313        # to handle them even if the core library doesn't.
314
315        'unknown_content_type': (
316            'bad/names',
317            'bad/names',
318            'bad',
319            'names'),
320
321        # The content type is case insensitive, and CFWS is ignored.
322
323        'mixed_case_content_type': (
324            'ImAge/JPeg',
325            'image/jpeg',
326            'image',
327            'jpeg'),
328
329        'spaces_in_content_type': (
330            '  text  /  plain  ',
331            'text/plain',
332            'text',
333            'plain'),
334
335        'cfws_in_content_type': (
336            '(foo) text (bar)/(baz)plain(stuff)',
337            'text/plain',
338            'text',
339            'plain'),
340
341        # test some parameters (more tests could be added for parameters
342        # associated with other content types, but since parameter parsing is
343        # generic they would be redundant for the current implementation).
344
345        'charset_param': (
346            'text/plain; charset="utf-8"',
347            'text/plain',
348            'text',
349            'plain',
350            {'charset': 'utf-8'}),
351
352        'capitalized_charset': (
353            'text/plain; charset="US-ASCII"',
354            'text/plain',
355            'text',
356            'plain',
357            {'charset': 'US-ASCII'}),
358
359        'unknown_charset': (
360            'text/plain; charset="fOo"',
361            'text/plain',
362            'text',
363            'plain',
364            {'charset': 'fOo'}),
365
366        'capitalized_charset_param_name_and_comment': (
367            'text/plain; (interjection) Charset="utf-8"',
368            'text/plain',
369            'text',
370            'plain',
371            {'charset': 'utf-8'},
372            [],
373            # Should the parameter name be lowercased here?
374            'text/plain; Charset="utf-8"'),
375
376        # Since this is pretty much the ur-mimeheader, we'll put all the tests
377        # that exercise the parameter parsing and formatting here.  Note that
378        # when we refold we may canonicalize, so things like whitespace,
379        # quoting, and rfc2231 encoding may change from what was in the input
380        # header.
381
382        'unquoted_param_value': (
383            'text/plain; title=foo',
384            'text/plain',
385            'text',
386            'plain',
387            {'title': 'foo'},
388            [],
389            'text/plain; title="foo"',
390            ),
391
392        'param_value_with_tspecials': (
393            'text/plain; title="(bar)foo blue"',
394            'text/plain',
395            'text',
396            'plain',
397            {'title': '(bar)foo blue'}),
398
399        'param_with_extra_quoted_whitespace': (
400            'text/plain; title="  a     loong  way \t home   "',
401            'text/plain',
402            'text',
403            'plain',
404            {'title': '  a     loong  way \t home   '}),
405
406        'bad_params': (
407            'blarg; baz; boo',
408            'text/plain',
409            'text',
410            'plain',
411            {'baz': '', 'boo': ''},
412            [errors.InvalidHeaderDefect]*3),
413
414        'spaces_around_param_equals': (
415            'Multipart/mixed; boundary = "CPIMSSMTPC06p5f3tG"',
416            'multipart/mixed',
417            'multipart',
418            'mixed',
419            {'boundary': 'CPIMSSMTPC06p5f3tG'},
420            [],
421            'Multipart/mixed; boundary="CPIMSSMTPC06p5f3tG"',
422            ),
423
424        'spaces_around_semis': (
425            ('image/jpeg; name="wibble.JPG" ; x-mac-type="4A504547" ; '
426                'x-mac-creator="474B4F4E"'),
427            'image/jpeg',
428            'image',
429            'jpeg',
430            {'name': 'wibble.JPG',
431             'x-mac-type': '4A504547',
432             'x-mac-creator': '474B4F4E'},
433            [],
434            ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; '
435                'x-mac-creator="474B4F4E"'),
436            ('Content-Type: image/jpeg; name="wibble.JPG";'
437                ' x-mac-type="4A504547";\n'
438             ' x-mac-creator="474B4F4E"\n'),
439            ),
440
441        'lots_of_mime_params': (
442            ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; '
443                'x-mac-creator="474B4F4E"; x-extrastuff="make it longer"'),
444            'image/jpeg',
445            'image',
446            'jpeg',
447            {'name': 'wibble.JPG',
448             'x-mac-type': '4A504547',
449             'x-mac-creator': '474B4F4E',
450             'x-extrastuff': 'make it longer'},
451            [],
452            ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; '
453                'x-mac-creator="474B4F4E"; x-extrastuff="make it longer"'),
454            # In this case the whole of the MimeParameters does *not* fit
455            # one one line, so we break at a lower syntactic level.
456            ('Content-Type: image/jpeg; name="wibble.JPG";'
457                ' x-mac-type="4A504547";\n'
458             ' x-mac-creator="474B4F4E"; x-extrastuff="make it longer"\n'),
459            ),
460
461        'semis_inside_quotes': (
462            'image/jpeg; name="Jim&amp;&amp;Jill"',
463            'image/jpeg',
464            'image',
465            'jpeg',
466            {'name': 'Jim&amp;&amp;Jill'}),
467
468        'single_quotes_inside_quotes': (
469            'image/jpeg; name="Jim \'Bob\' Jill"',
470            'image/jpeg',
471            'image',
472            'jpeg',
473            {'name': "Jim 'Bob' Jill"}),
474
475        'double_quotes_inside_quotes': (
476            r'image/jpeg; name="Jim \"Bob\" Jill"',
477            'image/jpeg',
478            'image',
479            'jpeg',
480            {'name': 'Jim "Bob" Jill'},
481            [],
482            r'image/jpeg; name="Jim \"Bob\" Jill"'),
483
484        'non_ascii_in_params': (
485            ('foo\xa7/bar; b\xa7r=two; '
486                'baz=thr\xa7e'.encode('latin-1').decode('us-ascii',
487                                                        'surrogateescape')),
488            'foo\uFFFD/bar',
489            'foo\uFFFD',
490            'bar',
491            {'b\uFFFDr': 'two', 'baz': 'thr\uFFFDe'},
492            [errors.UndecodableBytesDefect]*3,
493            'foo�/bar; b�r="two"; baz="thr�e"',
494            # XXX Two bugs here: the mime type is not allowed to be an encoded
495            # word, and we shouldn't be emitting surrogates in the parameter
496            # names.  But I don't know what the behavior should be here, so I'm
497            # punting for now.  In practice this is unlikely to be encountered
498            # since headers with binary in them only come from a binary source
499            # and are almost certain to be re-emitted without refolding.
500            'Content-Type: =?unknown-8bit?q?foo=A7?=/bar; b\udca7r="two";\n'
501            " baz*=unknown-8bit''thr%A7e\n",
502            ),
503
504        # RFC 2231 parameter tests.
505
506        'rfc2231_segmented_normal_values': (
507            'image/jpeg; name*0="abc"; name*1=".html"',
508            'image/jpeg',
509            'image',
510            'jpeg',
511            {'name': "abc.html"},
512            [],
513            'image/jpeg; name="abc.html"'),
514
515        'quotes_inside_rfc2231_value': (
516            r'image/jpeg; bar*0="baz\"foobar"; bar*1="\"baz"',
517            'image/jpeg',
518            'image',
519            'jpeg',
520            {'bar': 'baz"foobar"baz'},
521            [],
522            r'image/jpeg; bar="baz\"foobar\"baz"'),
523
524        'non_ascii_rfc2231_value': (
525            ('text/plain; charset=us-ascii; '
526             "title*=us-ascii'en'This%20is%20"
527             'not%20f\xa7n').encode('latin-1').decode('us-ascii',
528                                                     'surrogateescape'),
529            'text/plain',
530            'text',
531            'plain',
532            {'charset': 'us-ascii', 'title': 'This is not f\uFFFDn'},
533             [errors.UndecodableBytesDefect],
534             'text/plain; charset="us-ascii"; title="This is not f�n"',
535            'Content-Type: text/plain; charset="us-ascii";\n'
536            " title*=unknown-8bit''This%20is%20not%20f%A7n\n",
537            ),
538
539        'rfc2231_encoded_charset': (
540            'text/plain; charset*=ansi-x3.4-1968\'\'us-ascii',
541            'text/plain',
542            'text',
543            'plain',
544            {'charset': 'us-ascii'},
545            [],
546            'text/plain; charset="us-ascii"'),
547
548        # This follows the RFC: no double quotes around encoded values.
549        'rfc2231_encoded_no_double_quotes': (
550            ("text/plain;"
551                "\tname*0*=''This%20is%20;"
552                "\tname*1*=%2A%2A%2Afun%2A%2A%2A%20;"
553                '\tname*2="is it not.pdf"'),
554            'text/plain',
555            'text',
556            'plain',
557            {'name': 'This is ***fun*** is it not.pdf'},
558            [],
559            'text/plain; name="This is ***fun*** is it not.pdf"',
560            ),
561
562        # Make sure we also handle it if there are spurious double quotes.
563        'rfc2231_encoded_with_double_quotes': (
564            ("text/plain;"
565                '\tname*0*="us-ascii\'\'This%20is%20even%20more%20";'
566                '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";'
567                '\tname*2="is it not.pdf"'),
568            'text/plain',
569            'text',
570            'plain',
571            {'name': 'This is even more ***fun*** is it not.pdf'},
572            [errors.InvalidHeaderDefect]*2,
573            'text/plain; name="This is even more ***fun*** is it not.pdf"',
574            ),
575
576        'rfc2231_single_quote_inside_double_quotes': (
577            ('text/plain; charset=us-ascii;'
578               '\ttitle*0*="us-ascii\'en\'This%20is%20really%20";'
579               '\ttitle*1*="%2A%2A%2Afun%2A%2A%2A%20";'
580               '\ttitle*2="isn\'t it!"'),
581            'text/plain',
582            'text',
583            'plain',
584            {'charset': 'us-ascii', 'title': "This is really ***fun*** isn't it!"},
585            [errors.InvalidHeaderDefect]*2,
586            ('text/plain; charset="us-ascii"; '
587               'title="This is really ***fun*** isn\'t it!"'),
588            ('Content-Type: text/plain; charset="us-ascii";\n'
589                ' title="This is really ***fun*** isn\'t it!"\n'),
590            ),
591
592        'rfc2231_single_quote_in_value_with_charset_and_lang': (
593            ('application/x-foo;'
594                "\tname*0*=\"us-ascii'en-us'Frank's\"; name*1*=\" Document\""),
595            'application/x-foo',
596            'application',
597            'x-foo',
598            {'name': "Frank's Document"},
599            [errors.InvalidHeaderDefect]*2,
600            'application/x-foo; name="Frank\'s Document"',
601            ),
602
603        'rfc2231_single_quote_in_non_encoded_value': (
604            ('application/x-foo;'
605                "\tname*0=\"us-ascii'en-us'Frank's\"; name*1=\" Document\""),
606            'application/x-foo',
607            'application',
608            'x-foo',
609            {'name': "us-ascii'en-us'Frank's Document"},
610            [],
611            'application/x-foo; name="us-ascii\'en-us\'Frank\'s Document"',
612             ),
613
614        'rfc2231_no_language_or_charset': (
615            'text/plain; NAME*0*=english_is_the_default.html',
616            'text/plain',
617            'text',
618            'plain',
619            {'name': 'english_is_the_default.html'},
620            [errors.InvalidHeaderDefect],
621            'text/plain; NAME="english_is_the_default.html"'),
622
623        'rfc2231_encoded_no_charset': (
624            ("text/plain;"
625                '\tname*0*="\'\'This%20is%20even%20more%20";'
626                '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";'
627                '\tname*2="is it.pdf"'),
628            'text/plain',
629            'text',
630            'plain',
631            {'name': 'This is even more ***fun*** is it.pdf'},
632            [errors.InvalidHeaderDefect]*2,
633            'text/plain; name="This is even more ***fun*** is it.pdf"',
634            ),
635
636        'rfc2231_partly_encoded': (
637            ("text/plain;"
638                '\tname*0*="\'\'This%20is%20even%20more%20";'
639                '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";'
640                '\tname*2="is it.pdf"'),
641            'text/plain',
642            'text',
643            'plain',
644            {'name': 'This is even more ***fun*** is it.pdf'},
645            [errors.InvalidHeaderDefect]*2,
646            'text/plain; name="This is even more ***fun*** is it.pdf"',
647            ),
648
649        'rfc2231_partly_encoded_2': (
650            ("text/plain;"
651                '\tname*0*="\'\'This%20is%20even%20more%20";'
652                '\tname*1="%2A%2A%2Afun%2A%2A%2A%20";'
653                '\tname*2="is it.pdf"'),
654            'text/plain',
655            'text',
656            'plain',
657            {'name': 'This is even more %2A%2A%2Afun%2A%2A%2A%20is it.pdf'},
658            [errors.InvalidHeaderDefect],
659            ('text/plain;'
660             ' name="This is even more %2A%2A%2Afun%2A%2A%2A%20is it.pdf"'),
661            ('Content-Type: text/plain;\n'
662             ' name="This is even more %2A%2A%2Afun%2A%2A%2A%20is'
663                ' it.pdf"\n'),
664            ),
665
666        'rfc2231_unknown_charset_treated_as_ascii': (
667            "text/plain; name*0*=bogus'xx'ascii_is_the_default",
668            'text/plain',
669            'text',
670            'plain',
671            {'name': 'ascii_is_the_default'},
672            [],
673            'text/plain; name="ascii_is_the_default"'),
674
675        'rfc2231_bad_character_in_charset_parameter_value': (
676            "text/plain; charset*=ascii''utf-8%F1%F2%F3",
677            'text/plain',
678            'text',
679            'plain',
680            {'charset': 'utf-8\uFFFD\uFFFD\uFFFD'},
681            [errors.UndecodableBytesDefect],
682            'text/plain; charset="utf-8\uFFFD\uFFFD\uFFFD"',
683            "Content-Type: text/plain;"
684            " charset*=unknown-8bit''utf-8%F1%F2%F3\n",
685            ),
686
687        'rfc2231_utf8_in_supposedly_ascii_charset_parameter_value': (
688            "text/plain; charset*=ascii''utf-8%E2%80%9D",
689            'text/plain',
690            'text',
691            'plain',
692            {'charset': 'utf-8”'},
693            [errors.UndecodableBytesDefect],
694            'text/plain; charset="utf-8”"',
695            # XXX Should folding change the charset to utf8?  Currently it just
696            # reproduces the original, which is arguably fine.
697            "Content-Type: text/plain;"
698            " charset*=unknown-8bit''utf-8%E2%80%9D\n",
699            ),
700
701        'rfc2231_encoded_then_unencoded_segments': (
702            ('application/x-foo;'
703                '\tname*0*="us-ascii\'en-us\'My";'
704                '\tname*1=" Document";'
705                '\tname*2=" For You"'),
706            'application/x-foo',
707            'application',
708            'x-foo',
709            {'name': 'My Document For You'},
710            [errors.InvalidHeaderDefect],
711            'application/x-foo; name="My Document For You"',
712            ),
713
714        # My reading of the RFC is that this is an invalid header.  The RFC
715        # says that if charset and language information is given, the first
716        # segment *must* be encoded.
717        'rfc2231_unencoded_then_encoded_segments': (
718            ('application/x-foo;'
719                '\tname*0=us-ascii\'en-us\'My;'
720                '\tname*1*=" Document";'
721                '\tname*2*=" For You"'),
722            'application/x-foo',
723            'application',
724            'x-foo',
725            {'name': 'My Document For You'},
726            [errors.InvalidHeaderDefect]*3,
727            'application/x-foo; name="My Document For You"',
728            ),
729
730        # XXX: I would say this one should default to ascii/en for the
731        # "encoded" segment, since the first segment is not encoded and is
732        # in double quotes, making the value a valid non-encoded string.  The
733        # old parser decodes this just like the previous case, which may be the
734        # better Postel rule, but could equally result in borking headers that
735        # intentionally have quoted quotes in them.  We could get this 98%
736        # right if we treat it as a quoted string *unless* it matches the
737        # charset'lang'value pattern exactly *and* there is at least one
738        # encoded segment.  Implementing that algorithm will require some
739        # refactoring, so I haven't done it (yet).
740        'rfc2231_quoted_unencoded_then_encoded_segments': (
741            ('application/x-foo;'
742                '\tname*0="us-ascii\'en-us\'My";'
743                '\tname*1*=" Document";'
744                '\tname*2*=" For You"'),
745            'application/x-foo',
746            'application',
747            'x-foo',
748            {'name': "us-ascii'en-us'My Document For You"},
749            [errors.InvalidHeaderDefect]*2,
750            'application/x-foo; name="us-ascii\'en-us\'My Document For You"',
751            ),
752
753        # Make sure our folding algorithm produces multiple sections correctly.
754        # We could mix encoded and non-encoded segments, but we don't, we just
755        # make them all encoded.  It might be worth fixing that, since the
756        # sections can get used for wrapping ascii text.
757        'rfc2231_folded_segments_correctly_formatted': (
758            ('application/x-foo;'
759                '\tname="' + "with spaces"*8 + '"'),
760            'application/x-foo',
761            'application',
762            'x-foo',
763            {'name': "with spaces"*8},
764            [],
765            'application/x-foo; name="' + "with spaces"*8 + '"',
766            "Content-Type: application/x-foo;\n"
767            " name*0*=us-ascii''with%20spaceswith%20spaceswith%20spaceswith"
768                "%20spaceswith;\n"
769            " name*1*=%20spaceswith%20spaceswith%20spaceswith%20spaces\n"
770            ),
771
772    }
773
774
775@parameterize
776class TestContentTransferEncoding(TestHeaderBase):
777
778    def cte_as_value(self,
779                     source,
780                     cte,
781                     *args):
782        l = len(args)
783        defects =  args[0] if l>0 else []
784        decoded =  args[1] if l>1 and args[1] is not DITTO else source
785        header = 'Content-Transfer-Encoding:' + ' ' if source else ''
786        folded = args[2] if l>2 else header + source + '\n'
787        h = self.make_header('Content-Transfer-Encoding', source)
788        self.assertEqual(h.cte, cte)
789        self.assertDefectsEqual(h.defects, defects)
790        self.assertEqual(h, decoded)
791        self.assertEqual(h.fold(policy=policy.default), folded)
792
793    cte_params = {
794
795        'RFC_2183_1': (
796            'base64',
797            'base64',),
798
799        'no_value': (
800            '',
801            '7bit',
802            [errors.HeaderMissingRequiredValue],
803            '',
804            'Content-Transfer-Encoding:\n',
805            ),
806
807        'junk_after_cte': (
808            '7bit and a bunch more',
809            '7bit',
810            [errors.InvalidHeaderDefect]),
811
812    }
813
814
815@parameterize
816class TestContentDisposition(TestHeaderBase):
817
818    def content_disp_as_value(self,
819                              source,
820                              content_disposition,
821                              *args):
822        l = len(args)
823        parmdict = args[0] if l>0 else {}
824        defects =  args[1] if l>1 else []
825        decoded =  args[2] if l>2 and args[2] is not DITTO else source
826        header = 'Content-Disposition:' + ' ' if source else ''
827        folded = args[3] if l>3 else header + source + '\n'
828        h = self.make_header('Content-Disposition', source)
829        self.assertEqual(h.content_disposition, content_disposition)
830        self.assertEqual(h.params, parmdict)
831        self.assertDefectsEqual(h.defects, defects)
832        self.assertEqual(h, decoded)
833        self.assertEqual(h.fold(policy=policy.default), folded)
834
835    content_disp_params = {
836
837        # Examples from RFC 2183.
838
839        'RFC_2183_1': (
840            'inline',
841            'inline',),
842
843        'RFC_2183_2': (
844            ('attachment; filename=genome.jpeg;'
845             '  modification-date="Wed, 12 Feb 1997 16:29:51 -0500";'),
846            'attachment',
847            {'filename': 'genome.jpeg',
848             'modification-date': 'Wed, 12 Feb 1997 16:29:51 -0500'},
849            [],
850            ('attachment; filename="genome.jpeg"; '
851                 'modification-date="Wed, 12 Feb 1997 16:29:51 -0500"'),
852            ('Content-Disposition: attachment; filename="genome.jpeg";\n'
853             ' modification-date="Wed, 12 Feb 1997 16:29:51 -0500"\n'),
854            ),
855
856        'no_value': (
857            '',
858            None,
859            {},
860            [errors.HeaderMissingRequiredValue],
861            '',
862            'Content-Disposition:\n'),
863
864        'invalid_value': (
865            'ab./k',
866            'ab.',
867            {},
868            [errors.InvalidHeaderDefect]),
869
870        'invalid_value_with_params': (
871            'ab./k; filename="foo"',
872            'ab.',
873            {'filename': 'foo'},
874            [errors.InvalidHeaderDefect]),
875
876        'invalid_parameter_value_with_fws_between_ew': (
877            'attachment; filename="=?UTF-8?Q?Schulbesuchsbest=C3=A4ttigung=2E?='
878            '               =?UTF-8?Q?pdf?="',
879            'attachment',
880            {'filename': 'Schulbesuchsbestättigung.pdf'},
881            [errors.InvalidHeaderDefect]*3,
882            ('attachment; filename="Schulbesuchsbestättigung.pdf"'),
883            ('Content-Disposition: attachment;\n'
884             ' filename*=utf-8\'\'Schulbesuchsbest%C3%A4ttigung.pdf\n'),
885            ),
886
887        'parameter_value_with_fws_between_tokens': (
888            'attachment; filename="File =?utf-8?q?Name?= With Spaces.pdf"',
889            'attachment',
890            {'filename': 'File Name With Spaces.pdf'},
891            [errors.InvalidHeaderDefect],
892            'attachment; filename="File Name With Spaces.pdf"',
893            ('Content-Disposition: attachment; filename="File Name With Spaces.pdf"\n'),
894            )
895    }
896
897
898@parameterize
899class TestMIMEVersionHeader(TestHeaderBase):
900
901    def version_string_as_MIME_Version(self,
902                                       source,
903                                       decoded,
904                                       version,
905                                       major,
906                                       minor,
907                                       defects):
908        h = self.make_header('MIME-Version', source)
909        self.assertEqual(h, decoded)
910        self.assertEqual(h.version, version)
911        self.assertEqual(h.major, major)
912        self.assertEqual(h.minor, minor)
913        self.assertDefectsEqual(h.defects, defects)
914        if source:
915            source = ' ' + source
916        self.assertEqual(h.fold(policy=policy.default),
917                         'MIME-Version:' + source + '\n')
918
919    version_string_params = {
920
921        # Examples from the RFC.
922
923        'RFC_2045_1': (
924            '1.0',
925            '1.0',
926            '1.0',
927            1,
928            0,
929            []),
930
931        'RFC_2045_2': (
932            '1.0 (produced by MetaSend Vx.x)',
933            '1.0 (produced by MetaSend Vx.x)',
934            '1.0',
935            1,
936            0,
937            []),
938
939        'RFC_2045_3': (
940            '(produced by MetaSend Vx.x) 1.0',
941            '(produced by MetaSend Vx.x) 1.0',
942            '1.0',
943            1,
944            0,
945            []),
946
947        'RFC_2045_4': (
948            '1.(produced by MetaSend Vx.x)0',
949            '1.(produced by MetaSend Vx.x)0',
950            '1.0',
951            1,
952            0,
953            []),
954
955        # Other valid values.
956
957        '1_1': (
958            '1.1',
959            '1.1',
960            '1.1',
961            1,
962            1,
963            []),
964
965        '2_1': (
966            '2.1',
967            '2.1',
968            '2.1',
969            2,
970            1,
971            []),
972
973        'whitespace': (
974            '1 .0',
975            '1 .0',
976            '1.0',
977            1,
978            0,
979            []),
980
981        'leading_trailing_whitespace_ignored': (
982            '  1.0  ',
983            '  1.0  ',
984            '1.0',
985            1,
986            0,
987            []),
988
989        # Recoverable invalid values.  We can recover here only because we
990        # already have a valid value by the time we encounter the garbage.
991        # Anywhere else, and we don't know where the garbage ends.
992
993        'non_comment_garbage_after': (
994            '1.0 <abc>',
995            '1.0 <abc>',
996            '1.0',
997            1,
998            0,
999            [errors.InvalidHeaderDefect]),
1000
1001        # Unrecoverable invalid values.  We *could* apply more heuristics to
1002        # get something out of the first two, but doing so is not worth the
1003        # effort.
1004
1005        'non_comment_garbage_before': (
1006            '<abc> 1.0',
1007            '<abc> 1.0',
1008            None,
1009            None,
1010            None,
1011            [errors.InvalidHeaderDefect]),
1012
1013        'non_comment_garbage_inside': (
1014            '1.<abc>0',
1015            '1.<abc>0',
1016            None,
1017            None,
1018            None,
1019            [errors.InvalidHeaderDefect]),
1020
1021        'two_periods': (
1022            '1..0',
1023            '1..0',
1024            None,
1025            None,
1026            None,
1027            [errors.InvalidHeaderDefect]),
1028
1029        '2_x': (
1030            '2.x',
1031            '2.x',
1032            None,  # This could be 2, but it seems safer to make it None.
1033            None,
1034            None,
1035            [errors.InvalidHeaderDefect]),
1036
1037        'foo': (
1038            'foo',
1039            'foo',
1040            None,
1041            None,
1042            None,
1043            [errors.InvalidHeaderDefect]),
1044
1045        'missing': (
1046            '',
1047            '',
1048            None,
1049            None,
1050            None,
1051            [errors.HeaderMissingRequiredValue]),
1052
1053        }
1054
1055
1056@parameterize
1057class TestAddressHeader(TestHeaderBase):
1058
1059    example_params = {
1060
1061        'empty':
1062            ('<>',
1063             [errors.InvalidHeaderDefect],
1064             '<>',
1065             '',
1066             '<>',
1067             '',
1068             '',
1069             None),
1070
1071        'address_only':
1072            ('zippy@pinhead.com',
1073             [],
1074             'zippy@pinhead.com',
1075             '',
1076             'zippy@pinhead.com',
1077             'zippy',
1078             'pinhead.com',
1079             None),
1080
1081        'name_and_address':
1082            ('Zaphrod Beblebrux <zippy@pinhead.com>',
1083             [],
1084             'Zaphrod Beblebrux <zippy@pinhead.com>',
1085             'Zaphrod Beblebrux',
1086             'zippy@pinhead.com',
1087             'zippy',
1088             'pinhead.com',
1089             None),
1090
1091        'quoted_local_part':
1092            ('Zaphrod Beblebrux <"foo bar"@pinhead.com>',
1093             [],
1094             'Zaphrod Beblebrux <"foo bar"@pinhead.com>',
1095             'Zaphrod Beblebrux',
1096             '"foo bar"@pinhead.com',
1097             'foo bar',
1098             'pinhead.com',
1099             None),
1100
1101        'quoted_parens_in_name':
1102            (r'"A \(Special\) Person" <person@dom.ain>',
1103             [],
1104             '"A (Special) Person" <person@dom.ain>',
1105             'A (Special) Person',
1106             'person@dom.ain',
1107             'person',
1108             'dom.ain',
1109             None),
1110
1111        'quoted_backslashes_in_name':
1112            (r'"Arthur \\Backslash\\ Foobar" <person@dom.ain>',
1113             [],
1114             r'"Arthur \\Backslash\\ Foobar" <person@dom.ain>',
1115             r'Arthur \Backslash\ Foobar',
1116             'person@dom.ain',
1117             'person',
1118             'dom.ain',
1119             None),
1120
1121        'name_with_dot':
1122            ('John X. Doe <jxd@example.com>',
1123             [errors.ObsoleteHeaderDefect],
1124             '"John X. Doe" <jxd@example.com>',
1125             'John X. Doe',
1126             'jxd@example.com',
1127             'jxd',
1128             'example.com',
1129             None),
1130
1131        'quoted_strings_in_local_part':
1132            ('""example" example"@example.com',
1133             [errors.InvalidHeaderDefect]*3,
1134             '"example example"@example.com',
1135             '',
1136             '"example example"@example.com',
1137             'example example',
1138             'example.com',
1139             None),
1140
1141        'escaped_quoted_strings_in_local_part':
1142            (r'"\"example\" example"@example.com',
1143             [],
1144             r'"\"example\" example"@example.com',
1145             '',
1146             r'"\"example\" example"@example.com',
1147             r'"example" example',
1148             'example.com',
1149            None),
1150
1151        'escaped_escapes_in_local_part':
1152            (r'"\\"example\\" example"@example.com',
1153             [errors.InvalidHeaderDefect]*5,
1154             r'"\\example\\\\ example"@example.com',
1155             '',
1156             r'"\\example\\\\ example"@example.com',
1157             r'\example\\ example',
1158             'example.com',
1159            None),
1160
1161        'spaces_in_unquoted_local_part_collapsed':
1162            ('merwok  wok  @example.com',
1163             [errors.InvalidHeaderDefect]*2,
1164             '"merwok wok"@example.com',
1165             '',
1166             '"merwok wok"@example.com',
1167             'merwok wok',
1168             'example.com',
1169             None),
1170
1171        'spaces_around_dots_in_local_part_removed':
1172            ('merwok. wok .  wok@example.com',
1173             [errors.ObsoleteHeaderDefect],
1174             'merwok.wok.wok@example.com',
1175             '',
1176             'merwok.wok.wok@example.com',
1177             'merwok.wok.wok',
1178             'example.com',
1179             None),
1180
1181        'rfc2047_atom_is_decoded':
1182            ('=?utf-8?q?=C3=89ric?= <foo@example.com>',
1183            [],
1184            'Éric <foo@example.com>',
1185            'Éric',
1186            'foo@example.com',
1187            'foo',
1188            'example.com',
1189            None),
1190
1191        'rfc2047_atom_in_phrase_is_decoded':
1192            ('The =?utf-8?q?=C3=89ric=2C?= Himself <foo@example.com>',
1193            [],
1194            '"The Éric, Himself" <foo@example.com>',
1195            'The Éric, Himself',
1196            'foo@example.com',
1197            'foo',
1198            'example.com',
1199            None),
1200
1201        'rfc2047_atom_in_quoted_string_is_decoded':
1202            ('"=?utf-8?q?=C3=89ric?=" <foo@example.com>',
1203            [errors.InvalidHeaderDefect,
1204            errors.InvalidHeaderDefect],
1205            'Éric <foo@example.com>',
1206            'Éric',
1207            'foo@example.com',
1208            'foo',
1209            'example.com',
1210            None),
1211
1212        }
1213
1214        # XXX: Need many more examples, and in particular some with names in
1215        # trailing comments, which aren't currently handled.  comments in
1216        # general are not handled yet.
1217
1218    def example_as_address(self, source, defects, decoded, display_name,
1219                           addr_spec, username, domain, comment):
1220        h = self.make_header('sender', source)
1221        self.assertEqual(h, decoded)
1222        self.assertDefectsEqual(h.defects, defects)
1223        a = h.address
1224        self.assertEqual(str(a), decoded)
1225        self.assertEqual(len(h.groups), 1)
1226        self.assertEqual([a], list(h.groups[0].addresses))
1227        self.assertEqual([a], list(h.addresses))
1228        self.assertEqual(a.display_name, display_name)
1229        self.assertEqual(a.addr_spec, addr_spec)
1230        self.assertEqual(a.username, username)
1231        self.assertEqual(a.domain, domain)
1232        # XXX: we have no comment support yet.
1233        #self.assertEqual(a.comment, comment)
1234
1235    def example_as_group(self, source, defects, decoded, display_name,
1236                         addr_spec, username, domain, comment):
1237        source = 'foo: {};'.format(source)
1238        gdecoded = 'foo: {};'.format(decoded) if decoded else 'foo:;'
1239        h = self.make_header('to', source)
1240        self.assertEqual(h, gdecoded)
1241        self.assertDefectsEqual(h.defects, defects)
1242        self.assertEqual(h.groups[0].addresses, h.addresses)
1243        self.assertEqual(len(h.groups), 1)
1244        self.assertEqual(len(h.addresses), 1)
1245        a = h.addresses[0]
1246        self.assertEqual(str(a), decoded)
1247        self.assertEqual(a.display_name, display_name)
1248        self.assertEqual(a.addr_spec, addr_spec)
1249        self.assertEqual(a.username, username)
1250        self.assertEqual(a.domain, domain)
1251
1252    def test_simple_address_list(self):
1253        value = ('Fred <dinsdale@python.org>, foo@example.com, '
1254                    '"Harry W. Hastings" <hasty@example.com>')
1255        h = self.make_header('to', value)
1256        self.assertEqual(h, value)
1257        self.assertEqual(len(h.groups), 3)
1258        self.assertEqual(len(h.addresses), 3)
1259        for i in range(3):
1260            self.assertEqual(h.groups[i].addresses[0], h.addresses[i])
1261        self.assertEqual(str(h.addresses[0]), 'Fred <dinsdale@python.org>')
1262        self.assertEqual(str(h.addresses[1]), 'foo@example.com')
1263        self.assertEqual(str(h.addresses[2]),
1264            '"Harry W. Hastings" <hasty@example.com>')
1265        self.assertEqual(h.addresses[2].display_name,
1266            'Harry W. Hastings')
1267
1268    def test_complex_address_list(self):
1269        examples = list(self.example_params.values())
1270        source = ('dummy list:;, another: (empty);,' +
1271                 ', '.join([x[0] for x in examples[:4]]) + ', ' +
1272                 r'"A \"list\"": ' +
1273                    ', '.join([x[0] for x in examples[4:6]]) + ';,' +
1274                 ', '.join([x[0] for x in examples[6:]])
1275            )
1276        # XXX: the fact that (empty) disappears here is a potential API design
1277        # bug.  We don't currently have a way to preserve comments.
1278        expected = ('dummy list:;, another:;, ' +
1279                 ', '.join([x[2] for x in examples[:4]]) + ', ' +
1280                 r'"A \"list\"": ' +
1281                    ', '.join([x[2] for x in examples[4:6]]) + ';, ' +
1282                 ', '.join([x[2] for x in examples[6:]])
1283            )
1284
1285        h = self.make_header('to', source)
1286        self.assertEqual(h.split(','), expected.split(','))
1287        self.assertEqual(h, expected)
1288        self.assertEqual(len(h.groups), 7 + len(examples) - 6)
1289        self.assertEqual(h.groups[0].display_name, 'dummy list')
1290        self.assertEqual(h.groups[1].display_name, 'another')
1291        self.assertEqual(h.groups[6].display_name, 'A "list"')
1292        self.assertEqual(len(h.addresses), len(examples))
1293        for i in range(4):
1294            self.assertIsNone(h.groups[i+2].display_name)
1295            self.assertEqual(str(h.groups[i+2].addresses[0]), examples[i][2])
1296        for i in range(7, 7 + len(examples) - 6):
1297            self.assertIsNone(h.groups[i].display_name)
1298            self.assertEqual(str(h.groups[i].addresses[0]), examples[i-1][2])
1299        for i in range(len(examples)):
1300            self.assertEqual(str(h.addresses[i]), examples[i][2])
1301            self.assertEqual(h.addresses[i].addr_spec, examples[i][4])
1302
1303    def test_address_read_only(self):
1304        h = self.make_header('sender', 'abc@xyz.com')
1305        with self.assertRaises(AttributeError):
1306            h.address = 'foo'
1307
1308    def test_addresses_read_only(self):
1309        h = self.make_header('sender', 'abc@xyz.com')
1310        with self.assertRaises(AttributeError):
1311            h.addresses = 'foo'
1312
1313    def test_groups_read_only(self):
1314        h = self.make_header('sender', 'abc@xyz.com')
1315        with self.assertRaises(AttributeError):
1316            h.groups = 'foo'
1317
1318    def test_addresses_types(self):
1319        source = 'me <who@example.com>'
1320        h = self.make_header('to', source)
1321        self.assertIsInstance(h.addresses, tuple)
1322        self.assertIsInstance(h.addresses[0], Address)
1323
1324    def test_groups_types(self):
1325        source = 'me <who@example.com>'
1326        h = self.make_header('to', source)
1327        self.assertIsInstance(h.groups, tuple)
1328        self.assertIsInstance(h.groups[0], Group)
1329
1330    def test_set_from_Address(self):
1331        h = self.make_header('to', Address('me', 'foo', 'example.com'))
1332        self.assertEqual(h, 'me <foo@example.com>')
1333
1334    def test_set_from_Address_list(self):
1335        h = self.make_header('to', [Address('me', 'foo', 'example.com'),
1336                                    Address('you', 'bar', 'example.com')])
1337        self.assertEqual(h, 'me <foo@example.com>, you <bar@example.com>')
1338
1339    def test_set_from_Address_and_Group_list(self):
1340        h = self.make_header('to', [Address('me', 'foo', 'example.com'),
1341                                    Group('bing', [Address('fiz', 'z', 'b.com'),
1342                                                   Address('zif', 'f', 'c.com')]),
1343                                    Address('you', 'bar', 'example.com')])
1344        self.assertEqual(h, 'me <foo@example.com>, bing: fiz <z@b.com>, '
1345                            'zif <f@c.com>;, you <bar@example.com>')
1346        self.assertEqual(h.fold(policy=policy.default.clone(max_line_length=40)),
1347                        'to: me <foo@example.com>,\n'
1348                        ' bing: fiz <z@b.com>, zif <f@c.com>;,\n'
1349                        ' you <bar@example.com>\n')
1350
1351    def test_set_from_Group_list(self):
1352        h = self.make_header('to', [Group('bing', [Address('fiz', 'z', 'b.com'),
1353                                                   Address('zif', 'f', 'c.com')])])
1354        self.assertEqual(h, 'bing: fiz <z@b.com>, zif <f@c.com>;')
1355
1356
1357class TestAddressAndGroup(TestEmailBase):
1358
1359    def _test_attr_ro(self, obj, attr):
1360        with self.assertRaises(AttributeError):
1361            setattr(obj, attr, 'foo')
1362
1363    def test_address_display_name_ro(self):
1364        self._test_attr_ro(Address('foo', 'bar', 'baz'), 'display_name')
1365
1366    def test_address_username_ro(self):
1367        self._test_attr_ro(Address('foo', 'bar', 'baz'), 'username')
1368
1369    def test_address_domain_ro(self):
1370        self._test_attr_ro(Address('foo', 'bar', 'baz'), 'domain')
1371
1372    def test_group_display_name_ro(self):
1373        self._test_attr_ro(Group('foo'), 'display_name')
1374
1375    def test_group_addresses_ro(self):
1376        self._test_attr_ro(Group('foo'), 'addresses')
1377
1378    def test_address_from_username_domain(self):
1379        a = Address('foo', 'bar', 'baz')
1380        self.assertEqual(a.display_name, 'foo')
1381        self.assertEqual(a.username, 'bar')
1382        self.assertEqual(a.domain, 'baz')
1383        self.assertEqual(a.addr_spec, 'bar@baz')
1384        self.assertEqual(str(a), 'foo <bar@baz>')
1385
1386    def test_address_from_addr_spec(self):
1387        a = Address('foo', addr_spec='bar@baz')
1388        self.assertEqual(a.display_name, 'foo')
1389        self.assertEqual(a.username, 'bar')
1390        self.assertEqual(a.domain, 'baz')
1391        self.assertEqual(a.addr_spec, 'bar@baz')
1392        self.assertEqual(str(a), 'foo <bar@baz>')
1393
1394    def test_address_with_no_display_name(self):
1395        a = Address(addr_spec='bar@baz')
1396        self.assertEqual(a.display_name, '')
1397        self.assertEqual(a.username, 'bar')
1398        self.assertEqual(a.domain, 'baz')
1399        self.assertEqual(a.addr_spec, 'bar@baz')
1400        self.assertEqual(str(a), 'bar@baz')
1401
1402    def test_null_address(self):
1403        a = Address()
1404        self.assertEqual(a.display_name, '')
1405        self.assertEqual(a.username, '')
1406        self.assertEqual(a.domain, '')
1407        self.assertEqual(a.addr_spec, '<>')
1408        self.assertEqual(str(a), '<>')
1409
1410    def test_domain_only(self):
1411        # This isn't really a valid address.
1412        a = Address(domain='buzz')
1413        self.assertEqual(a.display_name, '')
1414        self.assertEqual(a.username, '')
1415        self.assertEqual(a.domain, 'buzz')
1416        self.assertEqual(a.addr_spec, '@buzz')
1417        self.assertEqual(str(a), '@buzz')
1418
1419    def test_username_only(self):
1420        # This isn't really a valid address.
1421        a = Address(username='buzz')
1422        self.assertEqual(a.display_name, '')
1423        self.assertEqual(a.username, 'buzz')
1424        self.assertEqual(a.domain, '')
1425        self.assertEqual(a.addr_spec, 'buzz')
1426        self.assertEqual(str(a), 'buzz')
1427
1428    def test_display_name_only(self):
1429        a = Address('buzz')
1430        self.assertEqual(a.display_name, 'buzz')
1431        self.assertEqual(a.username, '')
1432        self.assertEqual(a.domain, '')
1433        self.assertEqual(a.addr_spec, '<>')
1434        self.assertEqual(str(a), 'buzz <>')
1435
1436    def test_quoting(self):
1437        # Ideally we'd check every special individually, but I'm not up for
1438        # writing that many tests.
1439        a = Address('Sara J.', 'bad name', 'example.com')
1440        self.assertEqual(a.display_name, 'Sara J.')
1441        self.assertEqual(a.username, 'bad name')
1442        self.assertEqual(a.domain, 'example.com')
1443        self.assertEqual(a.addr_spec, '"bad name"@example.com')
1444        self.assertEqual(str(a), '"Sara J." <"bad name"@example.com>')
1445
1446    def test_il8n(self):
1447        a = Address('Éric', 'wok', 'exàmple.com')
1448        self.assertEqual(a.display_name, 'Éric')
1449        self.assertEqual(a.username, 'wok')
1450        self.assertEqual(a.domain, 'exàmple.com')
1451        self.assertEqual(a.addr_spec, 'wok@exàmple.com')
1452        self.assertEqual(str(a), 'Éric <wok@exàmple.com>')
1453
1454    # XXX: there is an API design issue that needs to be solved here.
1455    #def test_non_ascii_username_raises(self):
1456    #    with self.assertRaises(ValueError):
1457    #        Address('foo', 'wők', 'example.com')
1458
1459    def test_crlf_in_constructor_args_raises(self):
1460        cases = (
1461            dict(display_name='foo\r'),
1462            dict(display_name='foo\n'),
1463            dict(display_name='foo\r\n'),
1464            dict(domain='example.com\r'),
1465            dict(domain='example.com\n'),
1466            dict(domain='example.com\r\n'),
1467            dict(username='wok\r'),
1468            dict(username='wok\n'),
1469            dict(username='wok\r\n'),
1470            dict(addr_spec='wok@example.com\r'),
1471            dict(addr_spec='wok@example.com\n'),
1472            dict(addr_spec='wok@example.com\r\n')
1473        )
1474        for kwargs in cases:
1475            with self.subTest(kwargs=kwargs), self.assertRaisesRegex(ValueError, "invalid arguments"):
1476                Address(**kwargs)
1477
1478    def test_non_ascii_username_in_addr_spec_raises(self):
1479        with self.assertRaises(ValueError):
1480            Address('foo', addr_spec='wők@example.com')
1481
1482    def test_address_addr_spec_and_username_raises(self):
1483        with self.assertRaises(TypeError):
1484            Address('foo', username='bing', addr_spec='bar@baz')
1485
1486    def test_address_addr_spec_and_domain_raises(self):
1487        with self.assertRaises(TypeError):
1488            Address('foo', domain='bing', addr_spec='bar@baz')
1489
1490    def test_address_addr_spec_and_username_and_domain_raises(self):
1491        with self.assertRaises(TypeError):
1492            Address('foo', username='bong', domain='bing', addr_spec='bar@baz')
1493
1494    def test_space_in_addr_spec_username_raises(self):
1495        with self.assertRaises(ValueError):
1496            Address('foo', addr_spec="bad name@example.com")
1497
1498    def test_bad_addr_sepc_raises(self):
1499        with self.assertRaises(ValueError):
1500            Address('foo', addr_spec="name@ex[]ample.com")
1501
1502    def test_empty_group(self):
1503        g = Group('foo')
1504        self.assertEqual(g.display_name, 'foo')
1505        self.assertEqual(g.addresses, tuple())
1506        self.assertEqual(str(g), 'foo:;')
1507
1508    def test_empty_group_list(self):
1509        g = Group('foo', addresses=[])
1510        self.assertEqual(g.display_name, 'foo')
1511        self.assertEqual(g.addresses, tuple())
1512        self.assertEqual(str(g), 'foo:;')
1513
1514    def test_null_group(self):
1515        g = Group()
1516        self.assertIsNone(g.display_name)
1517        self.assertEqual(g.addresses, tuple())
1518        self.assertEqual(str(g), 'None:;')
1519
1520    def test_group_with_addresses(self):
1521        addrs = [Address('b', 'b', 'c'), Address('a', 'b','c')]
1522        g = Group('foo', addrs)
1523        self.assertEqual(g.display_name, 'foo')
1524        self.assertEqual(g.addresses, tuple(addrs))
1525        self.assertEqual(str(g), 'foo: b <b@c>, a <b@c>;')
1526
1527    def test_group_with_addresses_no_display_name(self):
1528        addrs = [Address('b', 'b', 'c'), Address('a', 'b','c')]
1529        g = Group(addresses=addrs)
1530        self.assertIsNone(g.display_name)
1531        self.assertEqual(g.addresses, tuple(addrs))
1532        self.assertEqual(str(g), 'None: b <b@c>, a <b@c>;')
1533
1534    def test_group_with_one_address_no_display_name(self):
1535        addrs = [Address('b', 'b', 'c')]
1536        g = Group(addresses=addrs)
1537        self.assertIsNone(g.display_name)
1538        self.assertEqual(g.addresses, tuple(addrs))
1539        self.assertEqual(str(g), 'b <b@c>')
1540
1541    def test_display_name_quoting(self):
1542        g = Group('foo.bar')
1543        self.assertEqual(g.display_name, 'foo.bar')
1544        self.assertEqual(g.addresses, tuple())
1545        self.assertEqual(str(g), '"foo.bar":;')
1546
1547    def test_display_name_blanks_not_quoted(self):
1548        g = Group('foo bar')
1549        self.assertEqual(g.display_name, 'foo bar')
1550        self.assertEqual(g.addresses, tuple())
1551        self.assertEqual(str(g), 'foo bar:;')
1552
1553    def test_set_message_header_from_address(self):
1554        a = Address('foo', 'bar', 'example.com')
1555        m = Message(policy=policy.default)
1556        m['To'] = a
1557        self.assertEqual(m['to'], 'foo <bar@example.com>')
1558        self.assertEqual(m['to'].addresses, (a,))
1559
1560    def test_set_message_header_from_group(self):
1561        g = Group('foo bar')
1562        m = Message(policy=policy.default)
1563        m['To'] = g
1564        self.assertEqual(m['to'], 'foo bar:;')
1565        self.assertEqual(m['to'].addresses, g.addresses)
1566
1567    def test_address_comparison(self):
1568        a = Address('foo', 'bar', 'example.com')
1569        self.assertEqual(Address('foo', 'bar', 'example.com'), a)
1570        self.assertNotEqual(Address('baz', 'bar', 'example.com'), a)
1571        self.assertNotEqual(Address('foo', 'baz', 'example.com'), a)
1572        self.assertNotEqual(Address('foo', 'bar', 'baz'), a)
1573        self.assertFalse(a == object())
1574        self.assertTrue(a == ALWAYS_EQ)
1575
1576    def test_group_comparison(self):
1577        a = Address('foo', 'bar', 'example.com')
1578        g = Group('foo bar', [a])
1579        self.assertEqual(Group('foo bar', (a,)), g)
1580        self.assertNotEqual(Group('baz', [a]), g)
1581        self.assertNotEqual(Group('foo bar', []), g)
1582        self.assertFalse(g == object())
1583        self.assertTrue(g == ALWAYS_EQ)
1584
1585
1586class TestFolding(TestHeaderBase):
1587
1588    def test_address_display_names(self):
1589        """Test the folding and encoding of address headers."""
1590        for name, result in (
1591                ('Foo Bar, France', '"Foo Bar, France"'),
1592                ('Foo Bar (France)', '"Foo Bar (France)"'),
1593                ('Foo Bar, España', 'Foo =?utf-8?q?Bar=2C_Espa=C3=B1a?='),
1594                ('Foo Bar (España)', 'Foo Bar =?utf-8?b?KEVzcGHDsWEp?='),
1595                ('Foo, Bar España', '=?utf-8?q?Foo=2C_Bar_Espa=C3=B1a?='),
1596                ('Foo, Bar [España]', '=?utf-8?q?Foo=2C_Bar_=5BEspa=C3=B1a=5D?='),
1597                ('Foo Bär, France', 'Foo =?utf-8?q?B=C3=A4r=2C?= France'),
1598                ('Foo Bär <France>', 'Foo =?utf-8?q?B=C3=A4r_=3CFrance=3E?='),
1599                (
1600                    'Lôrem ipsum dôlôr sit amet, cônsectetuer adipiscing. '
1601                    'Suspendisse pôtenti. Aliquam nibh. Suspendisse pôtenti.',
1602                    '=?utf-8?q?L=C3=B4rem_ipsum_d=C3=B4l=C3=B4r_sit_amet=2C_c'
1603                    '=C3=B4nsectetuer?=\n =?utf-8?q?adipiscing=2E_Suspendisse'
1604                    '_p=C3=B4tenti=2E_Aliquam_nibh=2E?=\n Suspendisse =?utf-8'
1605                    '?q?p=C3=B4tenti=2E?=',
1606                    ),
1607                ):
1608            h = self.make_header('To', Address(name, addr_spec='a@b.com'))
1609            self.assertEqual(h.fold(policy=policy.default),
1610                                    'To: %s <a@b.com>\n' % result)
1611
1612    def test_short_unstructured(self):
1613        h = self.make_header('subject', 'this is a test')
1614        self.assertEqual(h.fold(policy=policy.default),
1615                         'subject: this is a test\n')
1616
1617    def test_long_unstructured(self):
1618        h = self.make_header('Subject', 'This is a long header '
1619            'line that will need to be folded into two lines '
1620            'and will demonstrate basic folding')
1621        self.assertEqual(h.fold(policy=policy.default),
1622                        'Subject: This is a long header line that will '
1623                            'need to be folded into two lines\n'
1624                        ' and will demonstrate basic folding\n')
1625
1626    def test_unstructured_short_max_line_length(self):
1627        h = self.make_header('Subject', 'this is a short header '
1628            'that will be folded anyway')
1629        self.assertEqual(
1630            h.fold(policy=policy.default.clone(max_line_length=20)),
1631            textwrap.dedent("""\
1632                Subject: this is a
1633                 short header that
1634                 will be folded
1635                 anyway
1636                """))
1637
1638    def test_fold_unstructured_single_word(self):
1639        h = self.make_header('Subject', 'test')
1640        self.assertEqual(h.fold(policy=policy.default), 'Subject: test\n')
1641
1642    def test_fold_unstructured_short(self):
1643        h = self.make_header('Subject', 'test test test')
1644        self.assertEqual(h.fold(policy=policy.default),
1645                        'Subject: test test test\n')
1646
1647    def test_fold_unstructured_with_overlong_word(self):
1648        h = self.make_header('Subject', 'thisisaverylonglineconsistingofa'
1649            'singlewordthatwontfit')
1650        self.assertEqual(
1651            h.fold(policy=policy.default.clone(max_line_length=20)),
1652            'Subject: \n'
1653            ' =?utf-8?q?thisisa?=\n'
1654            ' =?utf-8?q?verylon?=\n'
1655            ' =?utf-8?q?glineco?=\n'
1656            ' =?utf-8?q?nsistin?=\n'
1657            ' =?utf-8?q?gofasin?=\n'
1658            ' =?utf-8?q?gleword?=\n'
1659            ' =?utf-8?q?thatwon?=\n'
1660            ' =?utf-8?q?tfit?=\n'
1661            )
1662
1663    def test_fold_unstructured_with_two_overlong_words(self):
1664        h = self.make_header('Subject', 'thisisaverylonglineconsistingofa'
1665            'singlewordthatwontfit plusanotherverylongwordthatwontfit')
1666        self.assertEqual(
1667            h.fold(policy=policy.default.clone(max_line_length=20)),
1668            'Subject: \n'
1669            ' =?utf-8?q?thisisa?=\n'
1670            ' =?utf-8?q?verylon?=\n'
1671            ' =?utf-8?q?glineco?=\n'
1672            ' =?utf-8?q?nsistin?=\n'
1673            ' =?utf-8?q?gofasin?=\n'
1674            ' =?utf-8?q?gleword?=\n'
1675            ' =?utf-8?q?thatwon?=\n'
1676            ' =?utf-8?q?tfit_pl?=\n'
1677            ' =?utf-8?q?usanoth?=\n'
1678            ' =?utf-8?q?erveryl?=\n'
1679            ' =?utf-8?q?ongword?=\n'
1680            ' =?utf-8?q?thatwon?=\n'
1681            ' =?utf-8?q?tfit?=\n'
1682            )
1683
1684    # XXX Need test for when max_line_length is less than the chrome size.
1685
1686    def test_fold_unstructured_with_slightly_long_word(self):
1687        h = self.make_header('Subject', 'thislongwordislessthanmaxlinelen')
1688        self.assertEqual(
1689            h.fold(policy=policy.default.clone(max_line_length=35)),
1690            'Subject:\n thislongwordislessthanmaxlinelen\n')
1691
1692    def test_fold_unstructured_with_commas(self):
1693        # The old wrapper would fold this at the commas.
1694        h = self.make_header('Subject', "This header is intended to "
1695            "demonstrate, in a fairly succinct way, that we now do "
1696            "not give a , special treatment in unstructured headers.")
1697        self.assertEqual(
1698            h.fold(policy=policy.default.clone(max_line_length=60)),
1699            textwrap.dedent("""\
1700                Subject: This header is intended to demonstrate, in a fairly
1701                 succinct way, that we now do not give a , special treatment
1702                 in unstructured headers.
1703                 """))
1704
1705    def test_fold_address_list(self):
1706        h = self.make_header('To', '"Theodore H. Perfect" <yes@man.com>, '
1707            '"My address is very long because my name is long" <foo@bar.com>, '
1708            '"Only A. Friend" <no@yes.com>')
1709        self.assertEqual(h.fold(policy=policy.default), textwrap.dedent("""\
1710            To: "Theodore H. Perfect" <yes@man.com>,
1711             "My address is very long because my name is long" <foo@bar.com>,
1712             "Only A. Friend" <no@yes.com>
1713             """))
1714
1715    def test_fold_date_header(self):
1716        h = self.make_header('Date', 'Sat, 2 Feb 2002 17:00:06 -0800')
1717        self.assertEqual(h.fold(policy=policy.default),
1718                        'Date: Sat, 02 Feb 2002 17:00:06 -0800\n')
1719
1720    def test_fold_overlong_words_using_RFC2047(self):
1721        h = self.make_header(
1722            'X-Report-Abuse',
1723            '<https://www.mailitapp.com/report_abuse.php?'
1724              'mid=xxx-xxx-xxxxxxxxxxxxxxxxxxxxxxxx==-xxx-xx-xx>')
1725        self.assertEqual(
1726            h.fold(policy=policy.default),
1727            'X-Report-Abuse: =?utf-8?q?=3Chttps=3A//www=2Emailitapp=2E'
1728                'com/report=5Fabuse?=\n'
1729            ' =?utf-8?q?=2Ephp=3Fmid=3Dxxx-xxx-xxxx'
1730                'xxxxxxxxxxxxxxxxxxxx=3D=3D-xxx-xx-xx?=\n'
1731            ' =?utf-8?q?=3E?=\n')
1732
1733    def test_message_id_header_is_not_folded(self):
1734        h = self.make_header(
1735            'Message-ID',
1736            '<somemessageidlongerthan@maxlinelength.com>')
1737        self.assertEqual(
1738            h.fold(policy=policy.default.clone(max_line_length=20)),
1739            'Message-ID: <somemessageidlongerthan@maxlinelength.com>\n')
1740
1741        # Test message-id isn't folded when id-right is no-fold-literal.
1742        h = self.make_header(
1743            'Message-ID',
1744            '<somemessageidlongerthan@[127.0.0.0.0.0.0.0.0.1]>')
1745        self.assertEqual(
1746            h.fold(policy=policy.default.clone(max_line_length=20)),
1747            'Message-ID: <somemessageidlongerthan@[127.0.0.0.0.0.0.0.0.1]>\n')
1748
1749        # Test message-id isn't folded when id-right is non-ascii characters.
1750        h = self.make_header('Message-ID', '<ईमेल@wők.com>')
1751        self.assertEqual(
1752            h.fold(policy=policy.default.clone(max_line_length=30)),
1753            'Message-ID: <ईमेल@wők.com>\n')
1754
1755        # Test message-id is folded without breaking the msg-id token into
1756        # encoded words, *even* if they don't fit into max_line_length.
1757        h = self.make_header('Message-ID', '<ईमेलfromMessage@wők.com>')
1758        self.assertEqual(
1759            h.fold(policy=policy.default.clone(max_line_length=20)),
1760            'Message-ID:\n <ईमेलfromMessage@wők.com>\n')
1761
1762if __name__ == '__main__':
1763    unittest.main()
1764