1import datetime 2import textwrap 3import unittest 4from email import errors 5from email import policy 6from email.message import Message 7from test.test_email import TestEmailBase, parameterize 8from email import headerregistry 9from email.headerregistry import Address, Group 10from test.support import ALWAYS_EQ 11 12 13DITTO = object() 14 15 16class TestHeaderRegistry(TestEmailBase): 17 18 def test_arbitrary_name_unstructured(self): 19 factory = headerregistry.HeaderRegistry() 20 h = factory('foobar', 'test') 21 self.assertIsInstance(h, headerregistry.BaseHeader) 22 self.assertIsInstance(h, headerregistry.UnstructuredHeader) 23 24 def test_name_case_ignored(self): 25 factory = headerregistry.HeaderRegistry() 26 # Whitebox check that test is valid 27 self.assertNotIn('Subject', factory.registry) 28 h = factory('Subject', 'test') 29 self.assertIsInstance(h, headerregistry.BaseHeader) 30 self.assertIsInstance(h, headerregistry.UniqueUnstructuredHeader) 31 32 class FooBase: 33 def __init__(self, *args, **kw): 34 pass 35 36 def test_override_default_base_class(self): 37 factory = headerregistry.HeaderRegistry(base_class=self.FooBase) 38 h = factory('foobar', 'test') 39 self.assertIsInstance(h, self.FooBase) 40 self.assertIsInstance(h, headerregistry.UnstructuredHeader) 41 42 class FooDefault: 43 parse = headerregistry.UnstructuredHeader.parse 44 45 def test_override_default_class(self): 46 factory = headerregistry.HeaderRegistry(default_class=self.FooDefault) 47 h = factory('foobar', 'test') 48 self.assertIsInstance(h, headerregistry.BaseHeader) 49 self.assertIsInstance(h, self.FooDefault) 50 51 def test_override_default_class_only_overrides_default(self): 52 factory = headerregistry.HeaderRegistry(default_class=self.FooDefault) 53 h = factory('subject', 'test') 54 self.assertIsInstance(h, headerregistry.BaseHeader) 55 self.assertIsInstance(h, headerregistry.UniqueUnstructuredHeader) 56 57 def test_dont_use_default_map(self): 58 factory = headerregistry.HeaderRegistry(use_default_map=False) 59 h = factory('subject', 'test') 60 self.assertIsInstance(h, headerregistry.BaseHeader) 61 self.assertIsInstance(h, headerregistry.UnstructuredHeader) 62 63 def test_map_to_type(self): 64 factory = headerregistry.HeaderRegistry() 65 h1 = factory('foobar', 'test') 66 factory.map_to_type('foobar', headerregistry.UniqueUnstructuredHeader) 67 h2 = factory('foobar', 'test') 68 self.assertIsInstance(h1, headerregistry.BaseHeader) 69 self.assertIsInstance(h1, headerregistry.UnstructuredHeader) 70 self.assertIsInstance(h2, headerregistry.BaseHeader) 71 self.assertIsInstance(h2, headerregistry.UniqueUnstructuredHeader) 72 73 74class TestHeaderBase(TestEmailBase): 75 76 factory = headerregistry.HeaderRegistry() 77 78 def make_header(self, name, value): 79 return self.factory(name, value) 80 81 82class TestBaseHeaderFeatures(TestHeaderBase): 83 84 def test_str(self): 85 h = self.make_header('subject', 'this is a test') 86 self.assertIsInstance(h, str) 87 self.assertEqual(h, 'this is a test') 88 self.assertEqual(str(h), 'this is a test') 89 90 def test_substr(self): 91 h = self.make_header('subject', 'this is a test') 92 self.assertEqual(h[5:7], 'is') 93 94 def test_has_name(self): 95 h = self.make_header('subject', 'this is a test') 96 self.assertEqual(h.name, 'subject') 97 98 def _test_attr_ro(self, attr): 99 h = self.make_header('subject', 'this is a test') 100 with self.assertRaises(AttributeError): 101 setattr(h, attr, 'foo') 102 103 def test_name_read_only(self): 104 self._test_attr_ro('name') 105 106 def test_defects_read_only(self): 107 self._test_attr_ro('defects') 108 109 def test_defects_is_tuple(self): 110 h = self.make_header('subject', 'this is a test') 111 self.assertEqual(len(h.defects), 0) 112 self.assertIsInstance(h.defects, tuple) 113 # Make sure it is still true when there are defects. 114 h = self.make_header('date', '') 115 self.assertEqual(len(h.defects), 1) 116 self.assertIsInstance(h.defects, tuple) 117 118 # XXX: FIXME 119 #def test_CR_in_value(self): 120 # # XXX: this also re-raises the issue of embedded headers, 121 # # need test and solution for that. 122 # value = '\r'.join(['this is', ' a test']) 123 # h = self.make_header('subject', value) 124 # self.assertEqual(h, value) 125 # self.assertDefectsEqual(h.defects, [errors.ObsoleteHeaderDefect]) 126 127 128@parameterize 129class TestUnstructuredHeader(TestHeaderBase): 130 131 def string_as_value(self, 132 source, 133 decoded, 134 *args): 135 l = len(args) 136 defects = args[0] if l>0 else [] 137 header = 'Subject:' + (' ' if source else '') 138 folded = header + (args[1] if l>1 else source) + '\n' 139 h = self.make_header('Subject', source) 140 self.assertEqual(h, decoded) 141 self.assertDefectsEqual(h.defects, defects) 142 self.assertEqual(h.fold(policy=policy.default), folded) 143 144 string_params = { 145 146 'rfc2047_simple_quopri': ( 147 '=?utf-8?q?this_is_a_test?=', 148 'this is a test', 149 [], 150 'this is a test'), 151 152 'rfc2047_gb2312_base64': ( 153 '=?gb2312?b?1eLKx9bQzsSy4srUo6E=?=', 154 '\u8fd9\u662f\u4e2d\u6587\u6d4b\u8bd5\uff01', 155 [], 156 '=?utf-8?b?6L+Z5piv5Lit5paH5rWL6K+V77yB?='), 157 158 'rfc2047_simple_nonascii_quopri': ( 159 '=?utf-8?q?=C3=89ric?=', 160 'Éric'), 161 162 'rfc2047_quopri_with_regular_text': ( 163 'The =?utf-8?q?=C3=89ric=2C?= Himself', 164 'The Éric, Himself'), 165 166 } 167 168 169@parameterize 170class TestDateHeader(TestHeaderBase): 171 172 datestring = 'Sun, 23 Sep 2001 20:10:55 -0700' 173 utcoffset = datetime.timedelta(hours=-7) 174 tz = datetime.timezone(utcoffset) 175 dt = datetime.datetime(2001, 9, 23, 20, 10, 55, tzinfo=tz) 176 177 def test_parse_date(self): 178 h = self.make_header('date', self.datestring) 179 self.assertEqual(h, self.datestring) 180 self.assertEqual(h.datetime, self.dt) 181 self.assertEqual(h.datetime.utcoffset(), self.utcoffset) 182 self.assertEqual(h.defects, ()) 183 184 def test_set_from_datetime(self): 185 h = self.make_header('date', self.dt) 186 self.assertEqual(h, self.datestring) 187 self.assertEqual(h.datetime, self.dt) 188 self.assertEqual(h.defects, ()) 189 190 def test_date_header_properties(self): 191 h = self.make_header('date', self.datestring) 192 self.assertIsInstance(h, headerregistry.UniqueDateHeader) 193 self.assertEqual(h.max_count, 1) 194 self.assertEqual(h.defects, ()) 195 196 def test_resent_date_header_properties(self): 197 h = self.make_header('resent-date', self.datestring) 198 self.assertIsInstance(h, headerregistry.DateHeader) 199 self.assertEqual(h.max_count, None) 200 self.assertEqual(h.defects, ()) 201 202 def test_no_value_is_defect(self): 203 h = self.make_header('date', '') 204 self.assertEqual(len(h.defects), 1) 205 self.assertIsInstance(h.defects[0], errors.HeaderMissingRequiredValue) 206 207 def test_datetime_read_only(self): 208 h = self.make_header('date', self.datestring) 209 with self.assertRaises(AttributeError): 210 h.datetime = 'foo' 211 212 def test_set_date_header_from_datetime(self): 213 m = Message(policy=policy.default) 214 m['Date'] = self.dt 215 self.assertEqual(m['Date'], self.datestring) 216 self.assertEqual(m['Date'].datetime, self.dt) 217 218 219@parameterize 220class TestContentTypeHeader(TestHeaderBase): 221 222 def content_type_as_value(self, 223 source, 224 content_type, 225 maintype, 226 subtype, 227 *args): 228 l = len(args) 229 parmdict = args[0] if l>0 else {} 230 defects = args[1] if l>1 else [] 231 decoded = args[2] if l>2 and args[2] is not DITTO else source 232 header = 'Content-Type:' + ' ' if source else '' 233 folded = args[3] if l>3 else header + decoded + '\n' 234 h = self.make_header('Content-Type', source) 235 self.assertEqual(h.content_type, content_type) 236 self.assertEqual(h.maintype, maintype) 237 self.assertEqual(h.subtype, subtype) 238 self.assertEqual(h.params, parmdict) 239 with self.assertRaises(TypeError): 240 h.params['abc'] = 'xyz' # make sure params is read-only. 241 self.assertDefectsEqual(h.defects, defects) 242 self.assertEqual(h, decoded) 243 self.assertEqual(h.fold(policy=policy.default), folded) 244 245 content_type_params = { 246 247 # Examples from RFC 2045. 248 249 'RFC_2045_1': ( 250 'text/plain; charset=us-ascii (Plain text)', 251 'text/plain', 252 'text', 253 'plain', 254 {'charset': 'us-ascii'}, 255 [], 256 'text/plain; charset="us-ascii"'), 257 258 'RFC_2045_2': ( 259 'text/plain; charset=us-ascii', 260 'text/plain', 261 'text', 262 'plain', 263 {'charset': 'us-ascii'}, 264 [], 265 'text/plain; charset="us-ascii"'), 266 267 'RFC_2045_3': ( 268 'text/plain; charset="us-ascii"', 269 'text/plain', 270 'text', 271 'plain', 272 {'charset': 'us-ascii'}), 273 274 # RFC 2045 5.2 says syntactically invalid values are to be treated as 275 # text/plain. 276 277 'no_subtype_in_content_type': ( 278 'text/', 279 'text/plain', 280 'text', 281 'plain', 282 {}, 283 [errors.InvalidHeaderDefect]), 284 285 'no_slash_in_content_type': ( 286 'foo', 287 'text/plain', 288 'text', 289 'plain', 290 {}, 291 [errors.InvalidHeaderDefect]), 292 293 'junk_text_in_content_type': ( 294 '<crazy "stuff">', 295 'text/plain', 296 'text', 297 'plain', 298 {}, 299 [errors.InvalidHeaderDefect]), 300 301 'too_many_slashes_in_content_type': ( 302 'image/jpeg/foo', 303 'text/plain', 304 'text', 305 'plain', 306 {}, 307 [errors.InvalidHeaderDefect]), 308 309 # But unknown names are OK. We could make non-IANA names a defect, but 310 # by not doing so we make ourselves future proof. The fact that they 311 # are unknown will be detectable by the fact that they don't appear in 312 # the mime_registry...and the application is free to extend that list 313 # to handle them even if the core library doesn't. 314 315 'unknown_content_type': ( 316 'bad/names', 317 'bad/names', 318 'bad', 319 'names'), 320 321 # The content type is case insensitive, and CFWS is ignored. 322 323 'mixed_case_content_type': ( 324 'ImAge/JPeg', 325 'image/jpeg', 326 'image', 327 'jpeg'), 328 329 'spaces_in_content_type': ( 330 ' text / plain ', 331 'text/plain', 332 'text', 333 'plain'), 334 335 'cfws_in_content_type': ( 336 '(foo) text (bar)/(baz)plain(stuff)', 337 'text/plain', 338 'text', 339 'plain'), 340 341 # test some parameters (more tests could be added for parameters 342 # associated with other content types, but since parameter parsing is 343 # generic they would be redundant for the current implementation). 344 345 'charset_param': ( 346 'text/plain; charset="utf-8"', 347 'text/plain', 348 'text', 349 'plain', 350 {'charset': 'utf-8'}), 351 352 'capitalized_charset': ( 353 'text/plain; charset="US-ASCII"', 354 'text/plain', 355 'text', 356 'plain', 357 {'charset': 'US-ASCII'}), 358 359 'unknown_charset': ( 360 'text/plain; charset="fOo"', 361 'text/plain', 362 'text', 363 'plain', 364 {'charset': 'fOo'}), 365 366 'capitalized_charset_param_name_and_comment': ( 367 'text/plain; (interjection) Charset="utf-8"', 368 'text/plain', 369 'text', 370 'plain', 371 {'charset': 'utf-8'}, 372 [], 373 # Should the parameter name be lowercased here? 374 'text/plain; Charset="utf-8"'), 375 376 # Since this is pretty much the ur-mimeheader, we'll put all the tests 377 # that exercise the parameter parsing and formatting here. Note that 378 # when we refold we may canonicalize, so things like whitespace, 379 # quoting, and rfc2231 encoding may change from what was in the input 380 # header. 381 382 'unquoted_param_value': ( 383 'text/plain; title=foo', 384 'text/plain', 385 'text', 386 'plain', 387 {'title': 'foo'}, 388 [], 389 'text/plain; title="foo"', 390 ), 391 392 'param_value_with_tspecials': ( 393 'text/plain; title="(bar)foo blue"', 394 'text/plain', 395 'text', 396 'plain', 397 {'title': '(bar)foo blue'}), 398 399 'param_with_extra_quoted_whitespace': ( 400 'text/plain; title=" a loong way \t home "', 401 'text/plain', 402 'text', 403 'plain', 404 {'title': ' a loong way \t home '}), 405 406 'bad_params': ( 407 'blarg; baz; boo', 408 'text/plain', 409 'text', 410 'plain', 411 {'baz': '', 'boo': ''}, 412 [errors.InvalidHeaderDefect]*3), 413 414 'spaces_around_param_equals': ( 415 'Multipart/mixed; boundary = "CPIMSSMTPC06p5f3tG"', 416 'multipart/mixed', 417 'multipart', 418 'mixed', 419 {'boundary': 'CPIMSSMTPC06p5f3tG'}, 420 [], 421 'Multipart/mixed; boundary="CPIMSSMTPC06p5f3tG"', 422 ), 423 424 'spaces_around_semis': ( 425 ('image/jpeg; name="wibble.JPG" ; x-mac-type="4A504547" ; ' 426 'x-mac-creator="474B4F4E"'), 427 'image/jpeg', 428 'image', 429 'jpeg', 430 {'name': 'wibble.JPG', 431 'x-mac-type': '4A504547', 432 'x-mac-creator': '474B4F4E'}, 433 [], 434 ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; ' 435 'x-mac-creator="474B4F4E"'), 436 ('Content-Type: image/jpeg; name="wibble.JPG";' 437 ' x-mac-type="4A504547";\n' 438 ' x-mac-creator="474B4F4E"\n'), 439 ), 440 441 'lots_of_mime_params': ( 442 ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; ' 443 'x-mac-creator="474B4F4E"; x-extrastuff="make it longer"'), 444 'image/jpeg', 445 'image', 446 'jpeg', 447 {'name': 'wibble.JPG', 448 'x-mac-type': '4A504547', 449 'x-mac-creator': '474B4F4E', 450 'x-extrastuff': 'make it longer'}, 451 [], 452 ('image/jpeg; name="wibble.JPG"; x-mac-type="4A504547"; ' 453 'x-mac-creator="474B4F4E"; x-extrastuff="make it longer"'), 454 # In this case the whole of the MimeParameters does *not* fit 455 # one one line, so we break at a lower syntactic level. 456 ('Content-Type: image/jpeg; name="wibble.JPG";' 457 ' x-mac-type="4A504547";\n' 458 ' x-mac-creator="474B4F4E"; x-extrastuff="make it longer"\n'), 459 ), 460 461 'semis_inside_quotes': ( 462 'image/jpeg; name="Jim&&Jill"', 463 'image/jpeg', 464 'image', 465 'jpeg', 466 {'name': 'Jim&&Jill'}), 467 468 'single_quotes_inside_quotes': ( 469 'image/jpeg; name="Jim \'Bob\' Jill"', 470 'image/jpeg', 471 'image', 472 'jpeg', 473 {'name': "Jim 'Bob' Jill"}), 474 475 'double_quotes_inside_quotes': ( 476 r'image/jpeg; name="Jim \"Bob\" Jill"', 477 'image/jpeg', 478 'image', 479 'jpeg', 480 {'name': 'Jim "Bob" Jill'}, 481 [], 482 r'image/jpeg; name="Jim \"Bob\" Jill"'), 483 484 'non_ascii_in_params': ( 485 ('foo\xa7/bar; b\xa7r=two; ' 486 'baz=thr\xa7e'.encode('latin-1').decode('us-ascii', 487 'surrogateescape')), 488 'foo\uFFFD/bar', 489 'foo\uFFFD', 490 'bar', 491 {'b\uFFFDr': 'two', 'baz': 'thr\uFFFDe'}, 492 [errors.UndecodableBytesDefect]*3, 493 'foo�/bar; b�r="two"; baz="thr�e"', 494 # XXX Two bugs here: the mime type is not allowed to be an encoded 495 # word, and we shouldn't be emitting surrogates in the parameter 496 # names. But I don't know what the behavior should be here, so I'm 497 # punting for now. In practice this is unlikely to be encountered 498 # since headers with binary in them only come from a binary source 499 # and are almost certain to be re-emitted without refolding. 500 'Content-Type: =?unknown-8bit?q?foo=A7?=/bar; b\udca7r="two";\n' 501 " baz*=unknown-8bit''thr%A7e\n", 502 ), 503 504 # RFC 2231 parameter tests. 505 506 'rfc2231_segmented_normal_values': ( 507 'image/jpeg; name*0="abc"; name*1=".html"', 508 'image/jpeg', 509 'image', 510 'jpeg', 511 {'name': "abc.html"}, 512 [], 513 'image/jpeg; name="abc.html"'), 514 515 'quotes_inside_rfc2231_value': ( 516 r'image/jpeg; bar*0="baz\"foobar"; bar*1="\"baz"', 517 'image/jpeg', 518 'image', 519 'jpeg', 520 {'bar': 'baz"foobar"baz'}, 521 [], 522 r'image/jpeg; bar="baz\"foobar\"baz"'), 523 524 'non_ascii_rfc2231_value': ( 525 ('text/plain; charset=us-ascii; ' 526 "title*=us-ascii'en'This%20is%20" 527 'not%20f\xa7n').encode('latin-1').decode('us-ascii', 528 'surrogateescape'), 529 'text/plain', 530 'text', 531 'plain', 532 {'charset': 'us-ascii', 'title': 'This is not f\uFFFDn'}, 533 [errors.UndecodableBytesDefect], 534 'text/plain; charset="us-ascii"; title="This is not f�n"', 535 'Content-Type: text/plain; charset="us-ascii";\n' 536 " title*=unknown-8bit''This%20is%20not%20f%A7n\n", 537 ), 538 539 'rfc2231_encoded_charset': ( 540 'text/plain; charset*=ansi-x3.4-1968\'\'us-ascii', 541 'text/plain', 542 'text', 543 'plain', 544 {'charset': 'us-ascii'}, 545 [], 546 'text/plain; charset="us-ascii"'), 547 548 # This follows the RFC: no double quotes around encoded values. 549 'rfc2231_encoded_no_double_quotes': ( 550 ("text/plain;" 551 "\tname*0*=''This%20is%20;" 552 "\tname*1*=%2A%2A%2Afun%2A%2A%2A%20;" 553 '\tname*2="is it not.pdf"'), 554 'text/plain', 555 'text', 556 'plain', 557 {'name': 'This is ***fun*** is it not.pdf'}, 558 [], 559 'text/plain; name="This is ***fun*** is it not.pdf"', 560 ), 561 562 # Make sure we also handle it if there are spurious double quotes. 563 'rfc2231_encoded_with_double_quotes': ( 564 ("text/plain;" 565 '\tname*0*="us-ascii\'\'This%20is%20even%20more%20";' 566 '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";' 567 '\tname*2="is it not.pdf"'), 568 'text/plain', 569 'text', 570 'plain', 571 {'name': 'This is even more ***fun*** is it not.pdf'}, 572 [errors.InvalidHeaderDefect]*2, 573 'text/plain; name="This is even more ***fun*** is it not.pdf"', 574 ), 575 576 'rfc2231_single_quote_inside_double_quotes': ( 577 ('text/plain; charset=us-ascii;' 578 '\ttitle*0*="us-ascii\'en\'This%20is%20really%20";' 579 '\ttitle*1*="%2A%2A%2Afun%2A%2A%2A%20";' 580 '\ttitle*2="isn\'t it!"'), 581 'text/plain', 582 'text', 583 'plain', 584 {'charset': 'us-ascii', 'title': "This is really ***fun*** isn't it!"}, 585 [errors.InvalidHeaderDefect]*2, 586 ('text/plain; charset="us-ascii"; ' 587 'title="This is really ***fun*** isn\'t it!"'), 588 ('Content-Type: text/plain; charset="us-ascii";\n' 589 ' title="This is really ***fun*** isn\'t it!"\n'), 590 ), 591 592 'rfc2231_single_quote_in_value_with_charset_and_lang': ( 593 ('application/x-foo;' 594 "\tname*0*=\"us-ascii'en-us'Frank's\"; name*1*=\" Document\""), 595 'application/x-foo', 596 'application', 597 'x-foo', 598 {'name': "Frank's Document"}, 599 [errors.InvalidHeaderDefect]*2, 600 'application/x-foo; name="Frank\'s Document"', 601 ), 602 603 'rfc2231_single_quote_in_non_encoded_value': ( 604 ('application/x-foo;' 605 "\tname*0=\"us-ascii'en-us'Frank's\"; name*1=\" Document\""), 606 'application/x-foo', 607 'application', 608 'x-foo', 609 {'name': "us-ascii'en-us'Frank's Document"}, 610 [], 611 'application/x-foo; name="us-ascii\'en-us\'Frank\'s Document"', 612 ), 613 614 'rfc2231_no_language_or_charset': ( 615 'text/plain; NAME*0*=english_is_the_default.html', 616 'text/plain', 617 'text', 618 'plain', 619 {'name': 'english_is_the_default.html'}, 620 [errors.InvalidHeaderDefect], 621 'text/plain; NAME="english_is_the_default.html"'), 622 623 'rfc2231_encoded_no_charset': ( 624 ("text/plain;" 625 '\tname*0*="\'\'This%20is%20even%20more%20";' 626 '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";' 627 '\tname*2="is it.pdf"'), 628 'text/plain', 629 'text', 630 'plain', 631 {'name': 'This is even more ***fun*** is it.pdf'}, 632 [errors.InvalidHeaderDefect]*2, 633 'text/plain; name="This is even more ***fun*** is it.pdf"', 634 ), 635 636 'rfc2231_partly_encoded': ( 637 ("text/plain;" 638 '\tname*0*="\'\'This%20is%20even%20more%20";' 639 '\tname*1*="%2A%2A%2Afun%2A%2A%2A%20";' 640 '\tname*2="is it.pdf"'), 641 'text/plain', 642 'text', 643 'plain', 644 {'name': 'This is even more ***fun*** is it.pdf'}, 645 [errors.InvalidHeaderDefect]*2, 646 'text/plain; name="This is even more ***fun*** is it.pdf"', 647 ), 648 649 'rfc2231_partly_encoded_2': ( 650 ("text/plain;" 651 '\tname*0*="\'\'This%20is%20even%20more%20";' 652 '\tname*1="%2A%2A%2Afun%2A%2A%2A%20";' 653 '\tname*2="is it.pdf"'), 654 'text/plain', 655 'text', 656 'plain', 657 {'name': 'This is even more %2A%2A%2Afun%2A%2A%2A%20is it.pdf'}, 658 [errors.InvalidHeaderDefect], 659 ('text/plain;' 660 ' name="This is even more %2A%2A%2Afun%2A%2A%2A%20is it.pdf"'), 661 ('Content-Type: text/plain;\n' 662 ' name="This is even more %2A%2A%2Afun%2A%2A%2A%20is' 663 ' it.pdf"\n'), 664 ), 665 666 'rfc2231_unknown_charset_treated_as_ascii': ( 667 "text/plain; name*0*=bogus'xx'ascii_is_the_default", 668 'text/plain', 669 'text', 670 'plain', 671 {'name': 'ascii_is_the_default'}, 672 [], 673 'text/plain; name="ascii_is_the_default"'), 674 675 'rfc2231_bad_character_in_charset_parameter_value': ( 676 "text/plain; charset*=ascii''utf-8%F1%F2%F3", 677 'text/plain', 678 'text', 679 'plain', 680 {'charset': 'utf-8\uFFFD\uFFFD\uFFFD'}, 681 [errors.UndecodableBytesDefect], 682 'text/plain; charset="utf-8\uFFFD\uFFFD\uFFFD"', 683 "Content-Type: text/plain;" 684 " charset*=unknown-8bit''utf-8%F1%F2%F3\n", 685 ), 686 687 'rfc2231_utf8_in_supposedly_ascii_charset_parameter_value': ( 688 "text/plain; charset*=ascii''utf-8%E2%80%9D", 689 'text/plain', 690 'text', 691 'plain', 692 {'charset': 'utf-8”'}, 693 [errors.UndecodableBytesDefect], 694 'text/plain; charset="utf-8”"', 695 # XXX Should folding change the charset to utf8? Currently it just 696 # reproduces the original, which is arguably fine. 697 "Content-Type: text/plain;" 698 " charset*=unknown-8bit''utf-8%E2%80%9D\n", 699 ), 700 701 'rfc2231_encoded_then_unencoded_segments': ( 702 ('application/x-foo;' 703 '\tname*0*="us-ascii\'en-us\'My";' 704 '\tname*1=" Document";' 705 '\tname*2=" For You"'), 706 'application/x-foo', 707 'application', 708 'x-foo', 709 {'name': 'My Document For You'}, 710 [errors.InvalidHeaderDefect], 711 'application/x-foo; name="My Document For You"', 712 ), 713 714 # My reading of the RFC is that this is an invalid header. The RFC 715 # says that if charset and language information is given, the first 716 # segment *must* be encoded. 717 'rfc2231_unencoded_then_encoded_segments': ( 718 ('application/x-foo;' 719 '\tname*0=us-ascii\'en-us\'My;' 720 '\tname*1*=" Document";' 721 '\tname*2*=" For You"'), 722 'application/x-foo', 723 'application', 724 'x-foo', 725 {'name': 'My Document For You'}, 726 [errors.InvalidHeaderDefect]*3, 727 'application/x-foo; name="My Document For You"', 728 ), 729 730 # XXX: I would say this one should default to ascii/en for the 731 # "encoded" segment, since the first segment is not encoded and is 732 # in double quotes, making the value a valid non-encoded string. The 733 # old parser decodes this just like the previous case, which may be the 734 # better Postel rule, but could equally result in borking headers that 735 # intentionally have quoted quotes in them. We could get this 98% 736 # right if we treat it as a quoted string *unless* it matches the 737 # charset'lang'value pattern exactly *and* there is at least one 738 # encoded segment. Implementing that algorithm will require some 739 # refactoring, so I haven't done it (yet). 740 'rfc2231_quoted_unencoded_then_encoded_segments': ( 741 ('application/x-foo;' 742 '\tname*0="us-ascii\'en-us\'My";' 743 '\tname*1*=" Document";' 744 '\tname*2*=" For You"'), 745 'application/x-foo', 746 'application', 747 'x-foo', 748 {'name': "us-ascii'en-us'My Document For You"}, 749 [errors.InvalidHeaderDefect]*2, 750 'application/x-foo; name="us-ascii\'en-us\'My Document For You"', 751 ), 752 753 # Make sure our folding algorithm produces multiple sections correctly. 754 # We could mix encoded and non-encoded segments, but we don't, we just 755 # make them all encoded. It might be worth fixing that, since the 756 # sections can get used for wrapping ascii text. 757 'rfc2231_folded_segments_correctly_formatted': ( 758 ('application/x-foo;' 759 '\tname="' + "with spaces"*8 + '"'), 760 'application/x-foo', 761 'application', 762 'x-foo', 763 {'name': "with spaces"*8}, 764 [], 765 'application/x-foo; name="' + "with spaces"*8 + '"', 766 "Content-Type: application/x-foo;\n" 767 " name*0*=us-ascii''with%20spaceswith%20spaceswith%20spaceswith" 768 "%20spaceswith;\n" 769 " name*1*=%20spaceswith%20spaceswith%20spaceswith%20spaces\n" 770 ), 771 772 } 773 774 775@parameterize 776class TestContentTransferEncoding(TestHeaderBase): 777 778 def cte_as_value(self, 779 source, 780 cte, 781 *args): 782 l = len(args) 783 defects = args[0] if l>0 else [] 784 decoded = args[1] if l>1 and args[1] is not DITTO else source 785 header = 'Content-Transfer-Encoding:' + ' ' if source else '' 786 folded = args[2] if l>2 else header + source + '\n' 787 h = self.make_header('Content-Transfer-Encoding', source) 788 self.assertEqual(h.cte, cte) 789 self.assertDefectsEqual(h.defects, defects) 790 self.assertEqual(h, decoded) 791 self.assertEqual(h.fold(policy=policy.default), folded) 792 793 cte_params = { 794 795 'RFC_2183_1': ( 796 'base64', 797 'base64',), 798 799 'no_value': ( 800 '', 801 '7bit', 802 [errors.HeaderMissingRequiredValue], 803 '', 804 'Content-Transfer-Encoding:\n', 805 ), 806 807 'junk_after_cte': ( 808 '7bit and a bunch more', 809 '7bit', 810 [errors.InvalidHeaderDefect]), 811 812 } 813 814 815@parameterize 816class TestContentDisposition(TestHeaderBase): 817 818 def content_disp_as_value(self, 819 source, 820 content_disposition, 821 *args): 822 l = len(args) 823 parmdict = args[0] if l>0 else {} 824 defects = args[1] if l>1 else [] 825 decoded = args[2] if l>2 and args[2] is not DITTO else source 826 header = 'Content-Disposition:' + ' ' if source else '' 827 folded = args[3] if l>3 else header + source + '\n' 828 h = self.make_header('Content-Disposition', source) 829 self.assertEqual(h.content_disposition, content_disposition) 830 self.assertEqual(h.params, parmdict) 831 self.assertDefectsEqual(h.defects, defects) 832 self.assertEqual(h, decoded) 833 self.assertEqual(h.fold(policy=policy.default), folded) 834 835 content_disp_params = { 836 837 # Examples from RFC 2183. 838 839 'RFC_2183_1': ( 840 'inline', 841 'inline',), 842 843 'RFC_2183_2': ( 844 ('attachment; filename=genome.jpeg;' 845 ' modification-date="Wed, 12 Feb 1997 16:29:51 -0500";'), 846 'attachment', 847 {'filename': 'genome.jpeg', 848 'modification-date': 'Wed, 12 Feb 1997 16:29:51 -0500'}, 849 [], 850 ('attachment; filename="genome.jpeg"; ' 851 'modification-date="Wed, 12 Feb 1997 16:29:51 -0500"'), 852 ('Content-Disposition: attachment; filename="genome.jpeg";\n' 853 ' modification-date="Wed, 12 Feb 1997 16:29:51 -0500"\n'), 854 ), 855 856 'no_value': ( 857 '', 858 None, 859 {}, 860 [errors.HeaderMissingRequiredValue], 861 '', 862 'Content-Disposition:\n'), 863 864 'invalid_value': ( 865 'ab./k', 866 'ab.', 867 {}, 868 [errors.InvalidHeaderDefect]), 869 870 'invalid_value_with_params': ( 871 'ab./k; filename="foo"', 872 'ab.', 873 {'filename': 'foo'}, 874 [errors.InvalidHeaderDefect]), 875 876 'invalid_parameter_value_with_fws_between_ew': ( 877 'attachment; filename="=?UTF-8?Q?Schulbesuchsbest=C3=A4ttigung=2E?=' 878 ' =?UTF-8?Q?pdf?="', 879 'attachment', 880 {'filename': 'Schulbesuchsbestättigung.pdf'}, 881 [errors.InvalidHeaderDefect]*3, 882 ('attachment; filename="Schulbesuchsbestättigung.pdf"'), 883 ('Content-Disposition: attachment;\n' 884 ' filename*=utf-8\'\'Schulbesuchsbest%C3%A4ttigung.pdf\n'), 885 ), 886 887 'parameter_value_with_fws_between_tokens': ( 888 'attachment; filename="File =?utf-8?q?Name?= With Spaces.pdf"', 889 'attachment', 890 {'filename': 'File Name With Spaces.pdf'}, 891 [errors.InvalidHeaderDefect], 892 'attachment; filename="File Name With Spaces.pdf"', 893 ('Content-Disposition: attachment; filename="File Name With Spaces.pdf"\n'), 894 ) 895 } 896 897 898@parameterize 899class TestMIMEVersionHeader(TestHeaderBase): 900 901 def version_string_as_MIME_Version(self, 902 source, 903 decoded, 904 version, 905 major, 906 minor, 907 defects): 908 h = self.make_header('MIME-Version', source) 909 self.assertEqual(h, decoded) 910 self.assertEqual(h.version, version) 911 self.assertEqual(h.major, major) 912 self.assertEqual(h.minor, minor) 913 self.assertDefectsEqual(h.defects, defects) 914 if source: 915 source = ' ' + source 916 self.assertEqual(h.fold(policy=policy.default), 917 'MIME-Version:' + source + '\n') 918 919 version_string_params = { 920 921 # Examples from the RFC. 922 923 'RFC_2045_1': ( 924 '1.0', 925 '1.0', 926 '1.0', 927 1, 928 0, 929 []), 930 931 'RFC_2045_2': ( 932 '1.0 (produced by MetaSend Vx.x)', 933 '1.0 (produced by MetaSend Vx.x)', 934 '1.0', 935 1, 936 0, 937 []), 938 939 'RFC_2045_3': ( 940 '(produced by MetaSend Vx.x) 1.0', 941 '(produced by MetaSend Vx.x) 1.0', 942 '1.0', 943 1, 944 0, 945 []), 946 947 'RFC_2045_4': ( 948 '1.(produced by MetaSend Vx.x)0', 949 '1.(produced by MetaSend Vx.x)0', 950 '1.0', 951 1, 952 0, 953 []), 954 955 # Other valid values. 956 957 '1_1': ( 958 '1.1', 959 '1.1', 960 '1.1', 961 1, 962 1, 963 []), 964 965 '2_1': ( 966 '2.1', 967 '2.1', 968 '2.1', 969 2, 970 1, 971 []), 972 973 'whitespace': ( 974 '1 .0', 975 '1 .0', 976 '1.0', 977 1, 978 0, 979 []), 980 981 'leading_trailing_whitespace_ignored': ( 982 ' 1.0 ', 983 ' 1.0 ', 984 '1.0', 985 1, 986 0, 987 []), 988 989 # Recoverable invalid values. We can recover here only because we 990 # already have a valid value by the time we encounter the garbage. 991 # Anywhere else, and we don't know where the garbage ends. 992 993 'non_comment_garbage_after': ( 994 '1.0 <abc>', 995 '1.0 <abc>', 996 '1.0', 997 1, 998 0, 999 [errors.InvalidHeaderDefect]), 1000 1001 # Unrecoverable invalid values. We *could* apply more heuristics to 1002 # get something out of the first two, but doing so is not worth the 1003 # effort. 1004 1005 'non_comment_garbage_before': ( 1006 '<abc> 1.0', 1007 '<abc> 1.0', 1008 None, 1009 None, 1010 None, 1011 [errors.InvalidHeaderDefect]), 1012 1013 'non_comment_garbage_inside': ( 1014 '1.<abc>0', 1015 '1.<abc>0', 1016 None, 1017 None, 1018 None, 1019 [errors.InvalidHeaderDefect]), 1020 1021 'two_periods': ( 1022 '1..0', 1023 '1..0', 1024 None, 1025 None, 1026 None, 1027 [errors.InvalidHeaderDefect]), 1028 1029 '2_x': ( 1030 '2.x', 1031 '2.x', 1032 None, # This could be 2, but it seems safer to make it None. 1033 None, 1034 None, 1035 [errors.InvalidHeaderDefect]), 1036 1037 'foo': ( 1038 'foo', 1039 'foo', 1040 None, 1041 None, 1042 None, 1043 [errors.InvalidHeaderDefect]), 1044 1045 'missing': ( 1046 '', 1047 '', 1048 None, 1049 None, 1050 None, 1051 [errors.HeaderMissingRequiredValue]), 1052 1053 } 1054 1055 1056@parameterize 1057class TestAddressHeader(TestHeaderBase): 1058 1059 example_params = { 1060 1061 'empty': 1062 ('<>', 1063 [errors.InvalidHeaderDefect], 1064 '<>', 1065 '', 1066 '<>', 1067 '', 1068 '', 1069 None), 1070 1071 'address_only': 1072 ('zippy@pinhead.com', 1073 [], 1074 'zippy@pinhead.com', 1075 '', 1076 'zippy@pinhead.com', 1077 'zippy', 1078 'pinhead.com', 1079 None), 1080 1081 'name_and_address': 1082 ('Zaphrod Beblebrux <zippy@pinhead.com>', 1083 [], 1084 'Zaphrod Beblebrux <zippy@pinhead.com>', 1085 'Zaphrod Beblebrux', 1086 'zippy@pinhead.com', 1087 'zippy', 1088 'pinhead.com', 1089 None), 1090 1091 'quoted_local_part': 1092 ('Zaphrod Beblebrux <"foo bar"@pinhead.com>', 1093 [], 1094 'Zaphrod Beblebrux <"foo bar"@pinhead.com>', 1095 'Zaphrod Beblebrux', 1096 '"foo bar"@pinhead.com', 1097 'foo bar', 1098 'pinhead.com', 1099 None), 1100 1101 'quoted_parens_in_name': 1102 (r'"A \(Special\) Person" <person@dom.ain>', 1103 [], 1104 '"A (Special) Person" <person@dom.ain>', 1105 'A (Special) Person', 1106 'person@dom.ain', 1107 'person', 1108 'dom.ain', 1109 None), 1110 1111 'quoted_backslashes_in_name': 1112 (r'"Arthur \\Backslash\\ Foobar" <person@dom.ain>', 1113 [], 1114 r'"Arthur \\Backslash\\ Foobar" <person@dom.ain>', 1115 r'Arthur \Backslash\ Foobar', 1116 'person@dom.ain', 1117 'person', 1118 'dom.ain', 1119 None), 1120 1121 'name_with_dot': 1122 ('John X. Doe <jxd@example.com>', 1123 [errors.ObsoleteHeaderDefect], 1124 '"John X. Doe" <jxd@example.com>', 1125 'John X. Doe', 1126 'jxd@example.com', 1127 'jxd', 1128 'example.com', 1129 None), 1130 1131 'quoted_strings_in_local_part': 1132 ('""example" example"@example.com', 1133 [errors.InvalidHeaderDefect]*3, 1134 '"example example"@example.com', 1135 '', 1136 '"example example"@example.com', 1137 'example example', 1138 'example.com', 1139 None), 1140 1141 'escaped_quoted_strings_in_local_part': 1142 (r'"\"example\" example"@example.com', 1143 [], 1144 r'"\"example\" example"@example.com', 1145 '', 1146 r'"\"example\" example"@example.com', 1147 r'"example" example', 1148 'example.com', 1149 None), 1150 1151 'escaped_escapes_in_local_part': 1152 (r'"\\"example\\" example"@example.com', 1153 [errors.InvalidHeaderDefect]*5, 1154 r'"\\example\\\\ example"@example.com', 1155 '', 1156 r'"\\example\\\\ example"@example.com', 1157 r'\example\\ example', 1158 'example.com', 1159 None), 1160 1161 'spaces_in_unquoted_local_part_collapsed': 1162 ('merwok wok @example.com', 1163 [errors.InvalidHeaderDefect]*2, 1164 '"merwok wok"@example.com', 1165 '', 1166 '"merwok wok"@example.com', 1167 'merwok wok', 1168 'example.com', 1169 None), 1170 1171 'spaces_around_dots_in_local_part_removed': 1172 ('merwok. wok . wok@example.com', 1173 [errors.ObsoleteHeaderDefect], 1174 'merwok.wok.wok@example.com', 1175 '', 1176 'merwok.wok.wok@example.com', 1177 'merwok.wok.wok', 1178 'example.com', 1179 None), 1180 1181 'rfc2047_atom_is_decoded': 1182 ('=?utf-8?q?=C3=89ric?= <foo@example.com>', 1183 [], 1184 'Éric <foo@example.com>', 1185 'Éric', 1186 'foo@example.com', 1187 'foo', 1188 'example.com', 1189 None), 1190 1191 'rfc2047_atom_in_phrase_is_decoded': 1192 ('The =?utf-8?q?=C3=89ric=2C?= Himself <foo@example.com>', 1193 [], 1194 '"The Éric, Himself" <foo@example.com>', 1195 'The Éric, Himself', 1196 'foo@example.com', 1197 'foo', 1198 'example.com', 1199 None), 1200 1201 'rfc2047_atom_in_quoted_string_is_decoded': 1202 ('"=?utf-8?q?=C3=89ric?=" <foo@example.com>', 1203 [errors.InvalidHeaderDefect, 1204 errors.InvalidHeaderDefect], 1205 'Éric <foo@example.com>', 1206 'Éric', 1207 'foo@example.com', 1208 'foo', 1209 'example.com', 1210 None), 1211 1212 } 1213 1214 # XXX: Need many more examples, and in particular some with names in 1215 # trailing comments, which aren't currently handled. comments in 1216 # general are not handled yet. 1217 1218 def example_as_address(self, source, defects, decoded, display_name, 1219 addr_spec, username, domain, comment): 1220 h = self.make_header('sender', source) 1221 self.assertEqual(h, decoded) 1222 self.assertDefectsEqual(h.defects, defects) 1223 a = h.address 1224 self.assertEqual(str(a), decoded) 1225 self.assertEqual(len(h.groups), 1) 1226 self.assertEqual([a], list(h.groups[0].addresses)) 1227 self.assertEqual([a], list(h.addresses)) 1228 self.assertEqual(a.display_name, display_name) 1229 self.assertEqual(a.addr_spec, addr_spec) 1230 self.assertEqual(a.username, username) 1231 self.assertEqual(a.domain, domain) 1232 # XXX: we have no comment support yet. 1233 #self.assertEqual(a.comment, comment) 1234 1235 def example_as_group(self, source, defects, decoded, display_name, 1236 addr_spec, username, domain, comment): 1237 source = 'foo: {};'.format(source) 1238 gdecoded = 'foo: {};'.format(decoded) if decoded else 'foo:;' 1239 h = self.make_header('to', source) 1240 self.assertEqual(h, gdecoded) 1241 self.assertDefectsEqual(h.defects, defects) 1242 self.assertEqual(h.groups[0].addresses, h.addresses) 1243 self.assertEqual(len(h.groups), 1) 1244 self.assertEqual(len(h.addresses), 1) 1245 a = h.addresses[0] 1246 self.assertEqual(str(a), decoded) 1247 self.assertEqual(a.display_name, display_name) 1248 self.assertEqual(a.addr_spec, addr_spec) 1249 self.assertEqual(a.username, username) 1250 self.assertEqual(a.domain, domain) 1251 1252 def test_simple_address_list(self): 1253 value = ('Fred <dinsdale@python.org>, foo@example.com, ' 1254 '"Harry W. Hastings" <hasty@example.com>') 1255 h = self.make_header('to', value) 1256 self.assertEqual(h, value) 1257 self.assertEqual(len(h.groups), 3) 1258 self.assertEqual(len(h.addresses), 3) 1259 for i in range(3): 1260 self.assertEqual(h.groups[i].addresses[0], h.addresses[i]) 1261 self.assertEqual(str(h.addresses[0]), 'Fred <dinsdale@python.org>') 1262 self.assertEqual(str(h.addresses[1]), 'foo@example.com') 1263 self.assertEqual(str(h.addresses[2]), 1264 '"Harry W. Hastings" <hasty@example.com>') 1265 self.assertEqual(h.addresses[2].display_name, 1266 'Harry W. Hastings') 1267 1268 def test_complex_address_list(self): 1269 examples = list(self.example_params.values()) 1270 source = ('dummy list:;, another: (empty);,' + 1271 ', '.join([x[0] for x in examples[:4]]) + ', ' + 1272 r'"A \"list\"": ' + 1273 ', '.join([x[0] for x in examples[4:6]]) + ';,' + 1274 ', '.join([x[0] for x in examples[6:]]) 1275 ) 1276 # XXX: the fact that (empty) disappears here is a potential API design 1277 # bug. We don't currently have a way to preserve comments. 1278 expected = ('dummy list:;, another:;, ' + 1279 ', '.join([x[2] for x in examples[:4]]) + ', ' + 1280 r'"A \"list\"": ' + 1281 ', '.join([x[2] for x in examples[4:6]]) + ';, ' + 1282 ', '.join([x[2] for x in examples[6:]]) 1283 ) 1284 1285 h = self.make_header('to', source) 1286 self.assertEqual(h.split(','), expected.split(',')) 1287 self.assertEqual(h, expected) 1288 self.assertEqual(len(h.groups), 7 + len(examples) - 6) 1289 self.assertEqual(h.groups[0].display_name, 'dummy list') 1290 self.assertEqual(h.groups[1].display_name, 'another') 1291 self.assertEqual(h.groups[6].display_name, 'A "list"') 1292 self.assertEqual(len(h.addresses), len(examples)) 1293 for i in range(4): 1294 self.assertIsNone(h.groups[i+2].display_name) 1295 self.assertEqual(str(h.groups[i+2].addresses[0]), examples[i][2]) 1296 for i in range(7, 7 + len(examples) - 6): 1297 self.assertIsNone(h.groups[i].display_name) 1298 self.assertEqual(str(h.groups[i].addresses[0]), examples[i-1][2]) 1299 for i in range(len(examples)): 1300 self.assertEqual(str(h.addresses[i]), examples[i][2]) 1301 self.assertEqual(h.addresses[i].addr_spec, examples[i][4]) 1302 1303 def test_address_read_only(self): 1304 h = self.make_header('sender', 'abc@xyz.com') 1305 with self.assertRaises(AttributeError): 1306 h.address = 'foo' 1307 1308 def test_addresses_read_only(self): 1309 h = self.make_header('sender', 'abc@xyz.com') 1310 with self.assertRaises(AttributeError): 1311 h.addresses = 'foo' 1312 1313 def test_groups_read_only(self): 1314 h = self.make_header('sender', 'abc@xyz.com') 1315 with self.assertRaises(AttributeError): 1316 h.groups = 'foo' 1317 1318 def test_addresses_types(self): 1319 source = 'me <who@example.com>' 1320 h = self.make_header('to', source) 1321 self.assertIsInstance(h.addresses, tuple) 1322 self.assertIsInstance(h.addresses[0], Address) 1323 1324 def test_groups_types(self): 1325 source = 'me <who@example.com>' 1326 h = self.make_header('to', source) 1327 self.assertIsInstance(h.groups, tuple) 1328 self.assertIsInstance(h.groups[0], Group) 1329 1330 def test_set_from_Address(self): 1331 h = self.make_header('to', Address('me', 'foo', 'example.com')) 1332 self.assertEqual(h, 'me <foo@example.com>') 1333 1334 def test_set_from_Address_list(self): 1335 h = self.make_header('to', [Address('me', 'foo', 'example.com'), 1336 Address('you', 'bar', 'example.com')]) 1337 self.assertEqual(h, 'me <foo@example.com>, you <bar@example.com>') 1338 1339 def test_set_from_Address_and_Group_list(self): 1340 h = self.make_header('to', [Address('me', 'foo', 'example.com'), 1341 Group('bing', [Address('fiz', 'z', 'b.com'), 1342 Address('zif', 'f', 'c.com')]), 1343 Address('you', 'bar', 'example.com')]) 1344 self.assertEqual(h, 'me <foo@example.com>, bing: fiz <z@b.com>, ' 1345 'zif <f@c.com>;, you <bar@example.com>') 1346 self.assertEqual(h.fold(policy=policy.default.clone(max_line_length=40)), 1347 'to: me <foo@example.com>,\n' 1348 ' bing: fiz <z@b.com>, zif <f@c.com>;,\n' 1349 ' you <bar@example.com>\n') 1350 1351 def test_set_from_Group_list(self): 1352 h = self.make_header('to', [Group('bing', [Address('fiz', 'z', 'b.com'), 1353 Address('zif', 'f', 'c.com')])]) 1354 self.assertEqual(h, 'bing: fiz <z@b.com>, zif <f@c.com>;') 1355 1356 1357class TestAddressAndGroup(TestEmailBase): 1358 1359 def _test_attr_ro(self, obj, attr): 1360 with self.assertRaises(AttributeError): 1361 setattr(obj, attr, 'foo') 1362 1363 def test_address_display_name_ro(self): 1364 self._test_attr_ro(Address('foo', 'bar', 'baz'), 'display_name') 1365 1366 def test_address_username_ro(self): 1367 self._test_attr_ro(Address('foo', 'bar', 'baz'), 'username') 1368 1369 def test_address_domain_ro(self): 1370 self._test_attr_ro(Address('foo', 'bar', 'baz'), 'domain') 1371 1372 def test_group_display_name_ro(self): 1373 self._test_attr_ro(Group('foo'), 'display_name') 1374 1375 def test_group_addresses_ro(self): 1376 self._test_attr_ro(Group('foo'), 'addresses') 1377 1378 def test_address_from_username_domain(self): 1379 a = Address('foo', 'bar', 'baz') 1380 self.assertEqual(a.display_name, 'foo') 1381 self.assertEqual(a.username, 'bar') 1382 self.assertEqual(a.domain, 'baz') 1383 self.assertEqual(a.addr_spec, 'bar@baz') 1384 self.assertEqual(str(a), 'foo <bar@baz>') 1385 1386 def test_address_from_addr_spec(self): 1387 a = Address('foo', addr_spec='bar@baz') 1388 self.assertEqual(a.display_name, 'foo') 1389 self.assertEqual(a.username, 'bar') 1390 self.assertEqual(a.domain, 'baz') 1391 self.assertEqual(a.addr_spec, 'bar@baz') 1392 self.assertEqual(str(a), 'foo <bar@baz>') 1393 1394 def test_address_with_no_display_name(self): 1395 a = Address(addr_spec='bar@baz') 1396 self.assertEqual(a.display_name, '') 1397 self.assertEqual(a.username, 'bar') 1398 self.assertEqual(a.domain, 'baz') 1399 self.assertEqual(a.addr_spec, 'bar@baz') 1400 self.assertEqual(str(a), 'bar@baz') 1401 1402 def test_null_address(self): 1403 a = Address() 1404 self.assertEqual(a.display_name, '') 1405 self.assertEqual(a.username, '') 1406 self.assertEqual(a.domain, '') 1407 self.assertEqual(a.addr_spec, '<>') 1408 self.assertEqual(str(a), '<>') 1409 1410 def test_domain_only(self): 1411 # This isn't really a valid address. 1412 a = Address(domain='buzz') 1413 self.assertEqual(a.display_name, '') 1414 self.assertEqual(a.username, '') 1415 self.assertEqual(a.domain, 'buzz') 1416 self.assertEqual(a.addr_spec, '@buzz') 1417 self.assertEqual(str(a), '@buzz') 1418 1419 def test_username_only(self): 1420 # This isn't really a valid address. 1421 a = Address(username='buzz') 1422 self.assertEqual(a.display_name, '') 1423 self.assertEqual(a.username, 'buzz') 1424 self.assertEqual(a.domain, '') 1425 self.assertEqual(a.addr_spec, 'buzz') 1426 self.assertEqual(str(a), 'buzz') 1427 1428 def test_display_name_only(self): 1429 a = Address('buzz') 1430 self.assertEqual(a.display_name, 'buzz') 1431 self.assertEqual(a.username, '') 1432 self.assertEqual(a.domain, '') 1433 self.assertEqual(a.addr_spec, '<>') 1434 self.assertEqual(str(a), 'buzz <>') 1435 1436 def test_quoting(self): 1437 # Ideally we'd check every special individually, but I'm not up for 1438 # writing that many tests. 1439 a = Address('Sara J.', 'bad name', 'example.com') 1440 self.assertEqual(a.display_name, 'Sara J.') 1441 self.assertEqual(a.username, 'bad name') 1442 self.assertEqual(a.domain, 'example.com') 1443 self.assertEqual(a.addr_spec, '"bad name"@example.com') 1444 self.assertEqual(str(a), '"Sara J." <"bad name"@example.com>') 1445 1446 def test_il8n(self): 1447 a = Address('Éric', 'wok', 'exàmple.com') 1448 self.assertEqual(a.display_name, 'Éric') 1449 self.assertEqual(a.username, 'wok') 1450 self.assertEqual(a.domain, 'exàmple.com') 1451 self.assertEqual(a.addr_spec, 'wok@exàmple.com') 1452 self.assertEqual(str(a), 'Éric <wok@exàmple.com>') 1453 1454 # XXX: there is an API design issue that needs to be solved here. 1455 #def test_non_ascii_username_raises(self): 1456 # with self.assertRaises(ValueError): 1457 # Address('foo', 'wők', 'example.com') 1458 1459 def test_crlf_in_constructor_args_raises(self): 1460 cases = ( 1461 dict(display_name='foo\r'), 1462 dict(display_name='foo\n'), 1463 dict(display_name='foo\r\n'), 1464 dict(domain='example.com\r'), 1465 dict(domain='example.com\n'), 1466 dict(domain='example.com\r\n'), 1467 dict(username='wok\r'), 1468 dict(username='wok\n'), 1469 dict(username='wok\r\n'), 1470 dict(addr_spec='wok@example.com\r'), 1471 dict(addr_spec='wok@example.com\n'), 1472 dict(addr_spec='wok@example.com\r\n') 1473 ) 1474 for kwargs in cases: 1475 with self.subTest(kwargs=kwargs), self.assertRaisesRegex(ValueError, "invalid arguments"): 1476 Address(**kwargs) 1477 1478 def test_non_ascii_username_in_addr_spec_raises(self): 1479 with self.assertRaises(ValueError): 1480 Address('foo', addr_spec='wők@example.com') 1481 1482 def test_address_addr_spec_and_username_raises(self): 1483 with self.assertRaises(TypeError): 1484 Address('foo', username='bing', addr_spec='bar@baz') 1485 1486 def test_address_addr_spec_and_domain_raises(self): 1487 with self.assertRaises(TypeError): 1488 Address('foo', domain='bing', addr_spec='bar@baz') 1489 1490 def test_address_addr_spec_and_username_and_domain_raises(self): 1491 with self.assertRaises(TypeError): 1492 Address('foo', username='bong', domain='bing', addr_spec='bar@baz') 1493 1494 def test_space_in_addr_spec_username_raises(self): 1495 with self.assertRaises(ValueError): 1496 Address('foo', addr_spec="bad name@example.com") 1497 1498 def test_bad_addr_sepc_raises(self): 1499 with self.assertRaises(ValueError): 1500 Address('foo', addr_spec="name@ex[]ample.com") 1501 1502 def test_empty_group(self): 1503 g = Group('foo') 1504 self.assertEqual(g.display_name, 'foo') 1505 self.assertEqual(g.addresses, tuple()) 1506 self.assertEqual(str(g), 'foo:;') 1507 1508 def test_empty_group_list(self): 1509 g = Group('foo', addresses=[]) 1510 self.assertEqual(g.display_name, 'foo') 1511 self.assertEqual(g.addresses, tuple()) 1512 self.assertEqual(str(g), 'foo:;') 1513 1514 def test_null_group(self): 1515 g = Group() 1516 self.assertIsNone(g.display_name) 1517 self.assertEqual(g.addresses, tuple()) 1518 self.assertEqual(str(g), 'None:;') 1519 1520 def test_group_with_addresses(self): 1521 addrs = [Address('b', 'b', 'c'), Address('a', 'b','c')] 1522 g = Group('foo', addrs) 1523 self.assertEqual(g.display_name, 'foo') 1524 self.assertEqual(g.addresses, tuple(addrs)) 1525 self.assertEqual(str(g), 'foo: b <b@c>, a <b@c>;') 1526 1527 def test_group_with_addresses_no_display_name(self): 1528 addrs = [Address('b', 'b', 'c'), Address('a', 'b','c')] 1529 g = Group(addresses=addrs) 1530 self.assertIsNone(g.display_name) 1531 self.assertEqual(g.addresses, tuple(addrs)) 1532 self.assertEqual(str(g), 'None: b <b@c>, a <b@c>;') 1533 1534 def test_group_with_one_address_no_display_name(self): 1535 addrs = [Address('b', 'b', 'c')] 1536 g = Group(addresses=addrs) 1537 self.assertIsNone(g.display_name) 1538 self.assertEqual(g.addresses, tuple(addrs)) 1539 self.assertEqual(str(g), 'b <b@c>') 1540 1541 def test_display_name_quoting(self): 1542 g = Group('foo.bar') 1543 self.assertEqual(g.display_name, 'foo.bar') 1544 self.assertEqual(g.addresses, tuple()) 1545 self.assertEqual(str(g), '"foo.bar":;') 1546 1547 def test_display_name_blanks_not_quoted(self): 1548 g = Group('foo bar') 1549 self.assertEqual(g.display_name, 'foo bar') 1550 self.assertEqual(g.addresses, tuple()) 1551 self.assertEqual(str(g), 'foo bar:;') 1552 1553 def test_set_message_header_from_address(self): 1554 a = Address('foo', 'bar', 'example.com') 1555 m = Message(policy=policy.default) 1556 m['To'] = a 1557 self.assertEqual(m['to'], 'foo <bar@example.com>') 1558 self.assertEqual(m['to'].addresses, (a,)) 1559 1560 def test_set_message_header_from_group(self): 1561 g = Group('foo bar') 1562 m = Message(policy=policy.default) 1563 m['To'] = g 1564 self.assertEqual(m['to'], 'foo bar:;') 1565 self.assertEqual(m['to'].addresses, g.addresses) 1566 1567 def test_address_comparison(self): 1568 a = Address('foo', 'bar', 'example.com') 1569 self.assertEqual(Address('foo', 'bar', 'example.com'), a) 1570 self.assertNotEqual(Address('baz', 'bar', 'example.com'), a) 1571 self.assertNotEqual(Address('foo', 'baz', 'example.com'), a) 1572 self.assertNotEqual(Address('foo', 'bar', 'baz'), a) 1573 self.assertFalse(a == object()) 1574 self.assertTrue(a == ALWAYS_EQ) 1575 1576 def test_group_comparison(self): 1577 a = Address('foo', 'bar', 'example.com') 1578 g = Group('foo bar', [a]) 1579 self.assertEqual(Group('foo bar', (a,)), g) 1580 self.assertNotEqual(Group('baz', [a]), g) 1581 self.assertNotEqual(Group('foo bar', []), g) 1582 self.assertFalse(g == object()) 1583 self.assertTrue(g == ALWAYS_EQ) 1584 1585 1586class TestFolding(TestHeaderBase): 1587 1588 def test_address_display_names(self): 1589 """Test the folding and encoding of address headers.""" 1590 for name, result in ( 1591 ('Foo Bar, France', '"Foo Bar, France"'), 1592 ('Foo Bar (France)', '"Foo Bar (France)"'), 1593 ('Foo Bar, España', 'Foo =?utf-8?q?Bar=2C_Espa=C3=B1a?='), 1594 ('Foo Bar (España)', 'Foo Bar =?utf-8?b?KEVzcGHDsWEp?='), 1595 ('Foo, Bar España', '=?utf-8?q?Foo=2C_Bar_Espa=C3=B1a?='), 1596 ('Foo, Bar [España]', '=?utf-8?q?Foo=2C_Bar_=5BEspa=C3=B1a=5D?='), 1597 ('Foo Bär, France', 'Foo =?utf-8?q?B=C3=A4r=2C?= France'), 1598 ('Foo Bär <France>', 'Foo =?utf-8?q?B=C3=A4r_=3CFrance=3E?='), 1599 ( 1600 'Lôrem ipsum dôlôr sit amet, cônsectetuer adipiscing. ' 1601 'Suspendisse pôtenti. Aliquam nibh. Suspendisse pôtenti.', 1602 '=?utf-8?q?L=C3=B4rem_ipsum_d=C3=B4l=C3=B4r_sit_amet=2C_c' 1603 '=C3=B4nsectetuer?=\n =?utf-8?q?adipiscing=2E_Suspendisse' 1604 '_p=C3=B4tenti=2E_Aliquam_nibh=2E?=\n Suspendisse =?utf-8' 1605 '?q?p=C3=B4tenti=2E?=', 1606 ), 1607 ): 1608 h = self.make_header('To', Address(name, addr_spec='a@b.com')) 1609 self.assertEqual(h.fold(policy=policy.default), 1610 'To: %s <a@b.com>\n' % result) 1611 1612 def test_short_unstructured(self): 1613 h = self.make_header('subject', 'this is a test') 1614 self.assertEqual(h.fold(policy=policy.default), 1615 'subject: this is a test\n') 1616 1617 def test_long_unstructured(self): 1618 h = self.make_header('Subject', 'This is a long header ' 1619 'line that will need to be folded into two lines ' 1620 'and will demonstrate basic folding') 1621 self.assertEqual(h.fold(policy=policy.default), 1622 'Subject: This is a long header line that will ' 1623 'need to be folded into two lines\n' 1624 ' and will demonstrate basic folding\n') 1625 1626 def test_unstructured_short_max_line_length(self): 1627 h = self.make_header('Subject', 'this is a short header ' 1628 'that will be folded anyway') 1629 self.assertEqual( 1630 h.fold(policy=policy.default.clone(max_line_length=20)), 1631 textwrap.dedent("""\ 1632 Subject: this is a 1633 short header that 1634 will be folded 1635 anyway 1636 """)) 1637 1638 def test_fold_unstructured_single_word(self): 1639 h = self.make_header('Subject', 'test') 1640 self.assertEqual(h.fold(policy=policy.default), 'Subject: test\n') 1641 1642 def test_fold_unstructured_short(self): 1643 h = self.make_header('Subject', 'test test test') 1644 self.assertEqual(h.fold(policy=policy.default), 1645 'Subject: test test test\n') 1646 1647 def test_fold_unstructured_with_overlong_word(self): 1648 h = self.make_header('Subject', 'thisisaverylonglineconsistingofa' 1649 'singlewordthatwontfit') 1650 self.assertEqual( 1651 h.fold(policy=policy.default.clone(max_line_length=20)), 1652 'Subject: \n' 1653 ' =?utf-8?q?thisisa?=\n' 1654 ' =?utf-8?q?verylon?=\n' 1655 ' =?utf-8?q?glineco?=\n' 1656 ' =?utf-8?q?nsistin?=\n' 1657 ' =?utf-8?q?gofasin?=\n' 1658 ' =?utf-8?q?gleword?=\n' 1659 ' =?utf-8?q?thatwon?=\n' 1660 ' =?utf-8?q?tfit?=\n' 1661 ) 1662 1663 def test_fold_unstructured_with_two_overlong_words(self): 1664 h = self.make_header('Subject', 'thisisaverylonglineconsistingofa' 1665 'singlewordthatwontfit plusanotherverylongwordthatwontfit') 1666 self.assertEqual( 1667 h.fold(policy=policy.default.clone(max_line_length=20)), 1668 'Subject: \n' 1669 ' =?utf-8?q?thisisa?=\n' 1670 ' =?utf-8?q?verylon?=\n' 1671 ' =?utf-8?q?glineco?=\n' 1672 ' =?utf-8?q?nsistin?=\n' 1673 ' =?utf-8?q?gofasin?=\n' 1674 ' =?utf-8?q?gleword?=\n' 1675 ' =?utf-8?q?thatwon?=\n' 1676 ' =?utf-8?q?tfit_pl?=\n' 1677 ' =?utf-8?q?usanoth?=\n' 1678 ' =?utf-8?q?erveryl?=\n' 1679 ' =?utf-8?q?ongword?=\n' 1680 ' =?utf-8?q?thatwon?=\n' 1681 ' =?utf-8?q?tfit?=\n' 1682 ) 1683 1684 # XXX Need test for when max_line_length is less than the chrome size. 1685 1686 def test_fold_unstructured_with_slightly_long_word(self): 1687 h = self.make_header('Subject', 'thislongwordislessthanmaxlinelen') 1688 self.assertEqual( 1689 h.fold(policy=policy.default.clone(max_line_length=35)), 1690 'Subject:\n thislongwordislessthanmaxlinelen\n') 1691 1692 def test_fold_unstructured_with_commas(self): 1693 # The old wrapper would fold this at the commas. 1694 h = self.make_header('Subject', "This header is intended to " 1695 "demonstrate, in a fairly succinct way, that we now do " 1696 "not give a , special treatment in unstructured headers.") 1697 self.assertEqual( 1698 h.fold(policy=policy.default.clone(max_line_length=60)), 1699 textwrap.dedent("""\ 1700 Subject: This header is intended to demonstrate, in a fairly 1701 succinct way, that we now do not give a , special treatment 1702 in unstructured headers. 1703 """)) 1704 1705 def test_fold_address_list(self): 1706 h = self.make_header('To', '"Theodore H. Perfect" <yes@man.com>, ' 1707 '"My address is very long because my name is long" <foo@bar.com>, ' 1708 '"Only A. Friend" <no@yes.com>') 1709 self.assertEqual(h.fold(policy=policy.default), textwrap.dedent("""\ 1710 To: "Theodore H. Perfect" <yes@man.com>, 1711 "My address is very long because my name is long" <foo@bar.com>, 1712 "Only A. Friend" <no@yes.com> 1713 """)) 1714 1715 def test_fold_date_header(self): 1716 h = self.make_header('Date', 'Sat, 2 Feb 2002 17:00:06 -0800') 1717 self.assertEqual(h.fold(policy=policy.default), 1718 'Date: Sat, 02 Feb 2002 17:00:06 -0800\n') 1719 1720 def test_fold_overlong_words_using_RFC2047(self): 1721 h = self.make_header( 1722 'X-Report-Abuse', 1723 '<https://www.mailitapp.com/report_abuse.php?' 1724 'mid=xxx-xxx-xxxxxxxxxxxxxxxxxxxxxxxx==-xxx-xx-xx>') 1725 self.assertEqual( 1726 h.fold(policy=policy.default), 1727 'X-Report-Abuse: =?utf-8?q?=3Chttps=3A//www=2Emailitapp=2E' 1728 'com/report=5Fabuse?=\n' 1729 ' =?utf-8?q?=2Ephp=3Fmid=3Dxxx-xxx-xxxx' 1730 'xxxxxxxxxxxxxxxxxxxx=3D=3D-xxx-xx-xx?=\n' 1731 ' =?utf-8?q?=3E?=\n') 1732 1733 def test_message_id_header_is_not_folded(self): 1734 h = self.make_header( 1735 'Message-ID', 1736 '<somemessageidlongerthan@maxlinelength.com>') 1737 self.assertEqual( 1738 h.fold(policy=policy.default.clone(max_line_length=20)), 1739 'Message-ID: <somemessageidlongerthan@maxlinelength.com>\n') 1740 1741 # Test message-id isn't folded when id-right is no-fold-literal. 1742 h = self.make_header( 1743 'Message-ID', 1744 '<somemessageidlongerthan@[127.0.0.0.0.0.0.0.0.1]>') 1745 self.assertEqual( 1746 h.fold(policy=policy.default.clone(max_line_length=20)), 1747 'Message-ID: <somemessageidlongerthan@[127.0.0.0.0.0.0.0.0.1]>\n') 1748 1749 # Test message-id isn't folded when id-right is non-ascii characters. 1750 h = self.make_header('Message-ID', '<ईमेल@wők.com>') 1751 self.assertEqual( 1752 h.fold(policy=policy.default.clone(max_line_length=30)), 1753 'Message-ID: <ईमेल@wők.com>\n') 1754 1755 # Test message-id is folded without breaking the msg-id token into 1756 # encoded words, *even* if they don't fit into max_line_length. 1757 h = self.make_header('Message-ID', '<ईमेलfromMessage@wők.com>') 1758 self.assertEqual( 1759 h.fold(policy=policy.default.clone(max_line_length=20)), 1760 'Message-ID:\n <ईमेलfromMessage@wők.com>\n') 1761 1762if __name__ == '__main__': 1763 unittest.main() 1764