File: test_bson_binary_vector.py

package info (click to toggle)
pymongo 4.15.5-1
  • links: PTS, VCS
  • area: main
  • in suites: forky
  • size: 23,376 kB
  • sloc: python: 107,945; ansic: 4,601; javascript: 137; makefile: 38; sh: 10
file content (122 lines) | stat: -rw-r--r-- 5,119 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
# Copyright 2024-present MongoDB, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import annotations

import binascii
import struct
from pathlib import Path
from test import unittest

from bson import decode, encode, json_util
from bson.binary import Binary, BinaryVectorDtype

_TEST_PATH = Path(__file__).parent / "bson_binary_vector"


class TestBSONBinaryVector(unittest.TestCase):
    """Runs Binary Vector subtype tests.

    Follows the style of the BSON corpus specification tests.
    Tests are automatically generated on import
    from json files in _TEST_PATH via `create_tests`.
    The actual tests are defined in the inner function `run_test`
    of the test generator `create_test`."""


def create_test(case_spec):
    """Create standard test given specification in json.

    We use the naming convention expected (exp) and observed (obj)
    to differentiate what is in the json (expected or suffix _exp)
    from what is produced by the API (observed or suffix _obs)
    """
    test_key = case_spec.get("test_key")

    def run_test(self):
        for test_case in case_spec.get("tests", []):
            description = test_case["description"]
            vector_exp = test_case.get("vector")
            dtype_hex_exp = test_case["dtype_hex"]
            dtype_alias_exp = test_case.get("dtype_alias")
            padding_exp = test_case.get("padding", 0)
            canonical_bson_exp = test_case.get("canonical_bson")
            # Convert dtype hex string into bytes
            dtype_exp = BinaryVectorDtype(int(dtype_hex_exp, 16).to_bytes(1, byteorder="little"))

            if test_case["valid"]:
                # Convert bson string to bytes
                cB_exp = binascii.unhexlify(canonical_bson_exp.encode("utf8"))
                decoded_doc = decode(cB_exp)
                binary_obs = decoded_doc[test_key]

                # Test round-tripping canonical bson.
                self.assertEqual(encode(decoded_doc), cB_exp, description)

                # Test BSON to Binary Vector
                vector_obs = binary_obs.as_vector()
                self.assertEqual(vector_obs.dtype, dtype_exp, description)
                if dtype_alias_exp:
                    self.assertEqual(
                        vector_obs.dtype, BinaryVectorDtype[dtype_alias_exp], description
                    )
                if dtype_exp in [BinaryVectorDtype.FLOAT32]:
                    [
                        self.assertAlmostEqual(vector_obs.data[i], vector_exp[i], delta=1e-5)
                        for i in range(len(vector_exp))
                    ]
                else:
                    self.assertEqual(vector_obs.data, vector_exp, description)
                # Test Binary Vector to BSON
                vector_exp = Binary.from_vector(vector_exp, dtype_exp, padding_exp)
                cB_obs = binascii.hexlify(encode({test_key: vector_exp})).decode().upper()
                self.assertEqual(cB_obs, canonical_bson_exp, description)

            else:
                """
                #### To prove correct in an invalid case (`valid:false`), one MUST
                - (encoding case) if the vector field is present, raise an exception
                when attempting to encode a document from the numeric values,dtype, and padding.
                - (decoding case) if the canonical_bson field is present, raise an exception
                when attempting to deserialize it into the corresponding
                numeric values, as the field contains corrupted data.
                """
                # Tests Binary.from_vector()
                if vector_exp is not None:
                    with self.assertRaises((struct.error, ValueError), msg=description):
                        Binary.from_vector(vector_exp, dtype_exp, padding_exp)

                # Tests Binary.as_vector()
                if canonical_bson_exp is not None:
                    with self.assertRaises((struct.error, ValueError), msg=description):
                        cB_exp = binascii.unhexlify(canonical_bson_exp.encode("utf8"))
                        decoded_doc = decode(cB_exp)
                        binary_obs = decoded_doc[test_key]
                        binary_obs.as_vector()

    return run_test


def create_tests():
    for filename in _TEST_PATH.glob("*.json"):
        with open(str(filename), encoding="utf-8") as test_file:
            test_method = create_test(json_util.loads(test_file.read()))
        setattr(TestBSONBinaryVector, "test_" + filename.stem, test_method)


create_tests()


if __name__ == "__main__":
    unittest.main()