ref: c6b681c48e27d4d5d258c393567878b55d1a43e2
dir: /sys/src/cmd/python/Tools/unicode/comparecodecs.py/
#!/usr/bin/env python
""" Compare the output of two codecs.
(c) Copyright 2005, Marc-Andre Lemburg (mal@lemburg.com).
    Licensed to PSF under a Contributor Agreement.
"""
import sys
def compare_codecs(encoding1, encoding2):
    print 'Comparing encoding/decoding of   %r and   %r' % (encoding1, encoding2)
    mismatch = 0
    # Check encoding
    for i in range(sys.maxunicode):
        u = unichr(i)
        try:
            c1 = u.encode(encoding1)
        except UnicodeError, reason:
            c1 = '<undefined>'
        try:
            c2 = u.encode(encoding2)
        except UnicodeError, reason:
            c2 = '<undefined>'
        if c1 != c2:
            print ' * encoding mismatch for 0x%04X: %-14r != %r' % \
                  (i, c1, c2)
            mismatch += 1
    # Check decoding
    for i in range(256):
        c = chr(i)
        try:
            u1 = c.decode(encoding1)
        except UnicodeError:
            u1 = u'<undefined>'
        try:
            u2 = c.decode(encoding2)
        except UnicodeError:
            u2 = u'<undefined>'
        if u1 != u2:
            print ' * decoding mismatch for 0x%04X: %-14r != %r' % \
                  (i, u1, u2)
            mismatch += 1
    if mismatch:
        print
        print 'Found %i mismatches' % mismatch
    else:
        print '-> Codecs are identical.'
if __name__ == '__main__':
    compare_codecs(sys.argv[1], sys.argv[2])