File: test_match.py

package info (click to toggle)
pfzy 0.3.4-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 224 kB
  • sloc: python: 311; makefile: 17; sh: 5
file content (64 lines) | stat: -rw-r--r-- 1,888 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
import pytest

from pfzy.match import _rank_task, fuzzy_match
from pfzy.score import fzy_scorer, substr_scorer


@pytest.mark.asyncio
async def test_rank_task() -> None:
    assert await _rank_task(substr_scorer, "abc", [{"val": "wzawbc"}], "val") == []
    assert await _rank_task(
        substr_scorer, "abc", [{"val": "wabco"}, {"val": "abcabc"}], "val"
    ) == [
        {
            "haystack": {"val": "abcabc"},
            "indices": [0, 1, 2],
            "score": -0.6666666666666667,
        },
        {"haystack": {"val": "wabco"}, "indices": [1, 2, 3], "score": -1.75},
    ]

    assert await _rank_task(
        fzy_scorer,
        "abc",
        [{"val": "acbabc"}, {"val": "abcABC"}, {"val": "bwd abc"}],
        "val",
    ) == [
        {
            "haystack": {"val": "abcABC"},
            "indices": [0, 1, 2],
            "score": 2.8850000000000002,
        },
        {
            "haystack": {"val": "bwd abc"},
            "indices": [4, 5, 6],
            "score": 2.7800000000000002,
        },
        {
            "haystack": {"val": "acbabc"},
            "indices": [3, 4, 5],
            "score": 1.9849999999999999,
        },
    ]

    assert await _rank_task(
        fzy_scorer, "ab", [{"val": "acb"}, {"val": "acbabc"}], "val"
    ) == [
        {"score": 0.98, "indices": [3, 4], "haystack": {"val": "acbabc"}},
        {"score": 0.89, "indices": [0, 2], "haystack": {"val": "acb"}},
    ]


@pytest.mark.asyncio
async def test_fuzzy_match() -> None:
    await fuzzy_match("a", ["abca"]) == [{"value": "abca", "indices": [0]}]
    await fuzzy_match(
        "a",
        [{"val": "abca"}, {"val": "aAbc"}],
        key="val",
        scorer=substr_scorer,
        batch_size=1,
    ) == [{"val": "abca", "indices": [0]}, {"val": "aAbc", "indices": [0]}]

    with pytest.raises(TypeError):
        await fuzzy_match("a", [{"val": "abc"}])