#!/usr/bin/env python3 import difflib import email.parser import email.policy import itertools import mailbox import sys def flexible_eq(expected, got): """Compare two strings, supporting wildcards. This functions compares two strings, but supports wildcards on the expected string. The following characters have special meaning: - ? matches any character. - * matches anything until the end of the line. Returns True if equal (considering wildcards), False otherwise. """ posG = 0 for c in expected: if posG >= len(got): return False if c == "?": posG += 1 continue if c == "*": while posG < len(got) and got[posG] != "\t": posG += 1 continue continue if c != got[posG]: return False posG += 1 if posG != len(got): # We got more than we expected. return False return True def msg_equals(expected, msg): """Compare two messages recursively, using flexible_eq().""" diff = False for h, val in expected.items(): if h not in msg: print("Header missing: %r" % h) diff = True continue if expected[h] == "*": continue msg_hdr_vals = msg.get_all(h, []) if len(msg_hdr_vals) == 1: if not flexible_eq(val, msg[h]): print("Header %r differs:" % h) print("Exp: %r" % val) print("Got: %r" % msg[h]) diff = True else: # We have multiple values for this header, so we need to check each # one, and only return a diff if none of them match. # Note this will result in a false positive if two headers match # the same expected one, but this is good enough for now. for msg_hdr_val in msg_hdr_vals: if flexible_eq(val, msg_hdr_val): break else: print("Header %r differs, no matching header found" % h) print("Exp: %r" % val) for i, msg_hdr_val in enumerate(msg_hdr_vals): print("Got %d: %r" % (i, msg_hdr_val)) diff = True if diff: return False if expected.is_multipart() != msg.is_multipart(): print( "Multipart differs, expected %s, got %s" % (expected.is_multipart(), msg.is_multipart()) ) return False if expected.is_multipart(): for exp, got in itertools.zip_longest( expected.get_payload(), msg.get_payload() ): if not msg_equals(exp, got): return False else: if not flexible_eq(expected.get_payload(), msg.get_payload()): exp = expected.get_payload().splitlines() got = msg.get_payload().splitlines() print("Payload differs:") for l in difflib.ndiff(exp, got): print(l) return False return True if __name__ == "__main__": f1, f2 = sys.argv[1:3] # We use a custom strict policy to do more strict content validation. policy = email.policy.EmailPolicy( utf8=True, linesep="\r\n", refold_source="none", raise_on_defect=True ) expected = email.parser.Parser(policy=policy).parse(open(f1)) msg = email.parser.Parser(policy=policy).parse(open(f2)) sys.exit(0 if msg_equals(expected, msg) else 1)