File: test_md5_extra.py

package info (click to toggle)
pypy3 7.3.19%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 212,236 kB
  • sloc: python: 2,098,316; ansic: 540,565; sh: 21,462; asm: 14,419; cpp: 4,451; makefile: 4,209; objc: 761; xml: 530; exp: 499; javascript: 314; pascal: 244; lisp: 45; csh: 12; awk: 4
file content (225 lines) | stat: -rw-r--r-- 7,452 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
"""A test script to compare MD5 implementations.

A note about performance: the pure Python MD5 takes roughly 160 sec. per
MB of data on a 233 MHz Intel Pentium CPU.
"""
import md5

from pypy.module.test_lib_pypy.support import import_lib_pypy


def compare_host(message, d2, d2h):
    """Check a digest pair against the host Python's own md5 module.

    ``message`` is hashed with the host's ``md5`` module and the resulting
    binary and hex digests are compared with ``d2`` and ``d2h``.

    Returns None when both forms match.  Otherwise returns the tuple
    ``(host_digest, d2)`` holding the two binary digests.
    """
    # Hash the message with the host Python's standard library md5.
    host_hash = md5.md5()
    host_hash.update(message)
    host_digest = host_hash.digest()
    host_hexdigest = host_hash.hexdigest()

    # Any disagreement, binary or hex, is reported via the binary digests.
    if host_digest != d2 or host_hexdigest != d2h:
        return (host_digest, d2)
    return None


class TestMD5Update:
    """Check that copied md5 objects keep agreeing while being updated.

    The host Python's ``md5`` module and the ``_md5`` module obtained through
    ``import_lib_pypy`` are fed identical data and their hex digests compared.
    """

    spaceconfig = {'usemodules': ('struct',)}

    def setup_class(cls):
        """Skip the whole class when running under runappdirect."""
        if not cls.runappdirect:
            return
        # XXX:
        import py
        py.test.skip('Unavailable under py3 runappdirect')

    def test_update(self):
        """Test updating cloned objects."""
        messages = (
            b"123",
            b"1234",
            b"12345",
            b"123456",
            b"1234567",
            b"12345678",
            b"123456789 123456789 123456789 ",
            b"123456789 123456789 ",
            b"123456789 123456789 1",
            b"123456789 123456789 12",
            b"123456789 123456789 123",
            b"123456789 123456789 1234",
            b"123456789 123456789 123456789 1",
            b"123456789 123456789 123456789 12",
            b"123456789 123456789 123456789 123",
            b"123456789 123456789 123456789 1234",
            b"123456789 123456789 123456789 12345",
            b"123456789 123456789 123456789 123456",
            b"123456789 123456789 123456789 1234567",
            b"123456789 123456789 123456789 12345678",
        )
        space = self.space
        w_module = import_lib_pypy(space, '_md5')

        # Both hash objects start from the same 1024-byte prefix.
        shared_prefix = b'a' * 2**10

        # Host side: hash the prefix, then work on a copy.
        host_hash = md5.md5()
        host_hash.update(shared_prefix)
        host_clone = host_hash.copy()

        # App-level _md5 side: same steps, driven through the object space.
        w_hash = space.call_method(w_module, 'md5')
        space.call_method(w_hash, 'update', space.newbytes(shared_prefix))
        w_clone = space.call_method(w_hash, 'copy')

        # Feed every message into both copies (cumulatively) and compare the
        # hex digests after each step.
        for chunk in messages:
            host_clone.update(chunk)
            expected = host_clone.hexdigest()

            space.call_method(w_clone, 'update', space.newbytes(chunk))
            actual = space.text_w(space.call_method(w_clone, 'hexdigest'))

            assert expected == actual


class AppTestMD5Compare:
    """Compare pure Python MD5 against Python's std. lib. version.

    Attributes and methods whose names start with ``w_`` are used by the
    tests under the name without that prefix (``self.compare``,
    ``self.print_diff``, ``self._md5``, ...).
    """

    spaceconfig = dict(usemodules=('struct',))

    def setup_class(cls):
        """Skip under runappdirect, else expose ``_md5`` and ``compare_host``."""
        if cls.runappdirect:
            # XXX: skip before doing any setup work, as TestMD5Update does.
            import py
            py.test.skip('Unavailable under py3 runappdirect')
        else:
            from pypy.interpreter import gateway
            space = cls.space
            cls.w__md5 = import_lib_pypy(space, '_md5')
            compare_host.unwrap_spec = ['bytes', 'bytes', 'text']
            cls.w_compare_host = space.wrap(gateway.interp2app(compare_host))

    def w_compare(self, message):
        """Hash *message* with ``_md5`` and compare against the host md5.

        Returns whatever ``compare_host`` returns: None when the digests
        agree, otherwise the pair of differing digests.
        """
        # Generate results against the app-level pure Python MD5 and
        # pass them off for comparison against the host Python's MD5
        m2 = self._md5.md5()
        m2.update(message)
        return self.compare_host(message, m2.digest(), m2.hexdigest())

    def w_check(self, message, expectedResult=None):
        """Assert that both MD5 implementations agree on *message*.

        On a mismatch the differing digests (and *expectedResult*, when
        given) are printed before the assertion fails.
        """
        res = self.compare(message)
        if res is not None:
            d1, d2 = res
            self.print_diff(message, d1, d2, expectedResult)
        assert res is None

    def w__format_hex(self, string):
        """Return a string's HEX code in groups of two digits.

        Accepts byte strings (items are already integers on Python 3) as
        well as text/Python 2 strings (items are single characters).
        """
        # The previous map(None, ...)/ord() chain only worked on Python 2.
        codes = (item if isinstance(item, int) else ord(item)
                 for item in string)
        return ' '.join("%02x" % code for code in codes)

    def w__format(self, string):
        """Return a string as-is in groups of two characters.

        A trailing unpaired character is dropped.
        """
        return ' '.join(string[i:i + 2]
                        for i in range(0, len(string) - 1, 2))

    def w_print_diff(self, message, d1, d2, expectedResult=None):
        """Print different outputs for same message."""
        print("Message: '%s'" % message)
        print("Message length: %d" % len(message))
        if expectedResult:
            print("%-48s (expected)" % self._format(expectedResult))
        print("%-48s (Std. lib. MD5)" % self._format_hex(d1))
        print("%-48s (Pure Python MD5)" % self._format_hex(d2))
        print()

    def test1(self):
        """Test cases with known digest result."""
        cases = (
            (b"",
             "d41d8cd98f00b204e9800998ecf8427e"),
            (b"a",
             "0cc175b9c0f1b6a831c399e269772661"),
            (b"abc",
             "900150983cd24fb0d6963f7d28e17f72"),
            (b"message digest",
             "f96b697d7cb7938d525a2f31aaf161d0"),
            (b"abcdefghijklmnopqrstuvwxyz",
             "c3fcd3d76192e4007dfb496cca67e13b"),
            (b"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789",
             "d174ab98d277d9f5a5611c2c9f419d9f"),
            (b"1234567890"*8,
             "57edf4a22be3c955ac49da2e2107b67a"),
            )

        for message, expectedResult in cases:
            self.check(message, expectedResult)

    def test2(self):
        """Test cases without known digest result."""
        cases = (
            b"123",
            b"1234",
            b"12345",
            b"123456",
            b"1234567",
            b"12345678",
            b"123456789 123456789 123456789 ",
            b"123456789 123456789 ",
            b"123456789 123456789 1",
            b"123456789 123456789 12",
            b"123456789 123456789 123",
            b"123456789 123456789 1234",
            b"123456789 123456789 123456789 1",
            b"123456789 123456789 123456789 12",
            b"123456789 123456789 123456789 123",
            b"123456789 123456789 123456789 1234",
            b"123456789 123456789 123456789 12345",
            b"123456789 123456789 123456789 123456",
            b"123456789 123456789 123456789 1234567",
            b"123456789 123456789 123456789 12345678",
            )

        for message in cases:
            self.check(message)

    def test3(self):
        """Test cases with long messages (can take a while)."""
        cases = (
            2**10*b'a',
            2**10*b'abcd',
            #2**20*b'a',  # 1 MB, takes about 160 sec. on a 233 MHz Pentium.
            )

        for message in cases:
            self.check(message)

    def test4(self):
        """Test cases with increasingly growing message lengths."""
        # Messages of 0 through 31 bytes.
        for length in range(2**5):
            self.check(length * b'a')

    def test_attributes(self):
        """Check the size attributes exposed by md5 objects."""
        _md5 = self._md5
        assert _md5.md5().digest_size == 16
        assert _md5.md5().digestsize == 16
        assert _md5.md5().block_size == 64