File: fuzz.hpp

package info (click to toggle)
rapidfuzz-cpp 3.3.2-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,480 kB
  • sloc: cpp: 30,893; python: 63; makefile: 26; sh: 8
file content (63 lines) | stat: -rw-r--r-- 2,395 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
/* SPDX-License-Identifier: MIT */
/* Copyright © 2022-present Max Bachmann */

#pragma once

#include "Indel.hpp"

namespace rapidfuzz_reference {

template <typename InputIt1, typename InputIt2>
double ratio(InputIt1 first1, InputIt1 last1, InputIt2 first2, InputIt2 last2, double score_cutoff = 0.0)
{
    return indel_similarity(first1, last1, first2, last2, score_cutoff / 100.0) * 100;
}

template <typename Sentence1, typename Sentence2>
double ratio(const Sentence1& s1, const Sentence2& s2, double score_cutoff = 0.0)
{
    return indel_similarity(s1, s2, score_cutoff / 100.0) * 100;
}

template <typename InputIt1, typename InputIt2>
double partial_ratio_impl(InputIt1 first1, InputIt1 last1, InputIt2 first2, InputIt2 last2,
                          double score_cutoff = 0.0)
{
    size_t len1 = static_cast<size_t>(std::distance(first1, last1));
    size_t len2 = static_cast<size_t>(std::distance(first2, last2));
    if (len1 == 0 && len2 == 0) return 100.0;

    if (len1 == 0 || len2 == 0) return 0.0;

    if (len1 > len2) return partial_ratio_impl(first2, last2, first1, last1, score_cutoff);

    double res = 0.0;
    for (ptrdiff_t i = -1 * (ptrdiff_t)len1; i < (ptrdiff_t)len2; i++) {
        ptrdiff_t start = std::max(ptrdiff_t(0), i);
        ptrdiff_t end = std::min(ptrdiff_t(len2), i + ptrdiff_t(len1));
        InputIt2 first2_ = first2 + start;
        InputIt2 last2_ = first2 + end;
        res = std::max(res, ratio(first1, last1, first2_, last2_, score_cutoff));
    }
    return res;
}

template <typename InputIt1, typename InputIt2>
double partial_ratio(InputIt1 first1, InputIt1 last1, InputIt2 first2, InputIt2 last2,
                     double score_cutoff = 0.0)
{
    size_t len1 = static_cast<size_t>(std::distance(first1, last1));
    size_t len2 = static_cast<size_t>(std::distance(first2, last2));
    if (len1 != len2) return partial_ratio_impl(first1, last1, first2, last2, score_cutoff);

    return std::max(partial_ratio_impl(first1, last1, first2, last2, score_cutoff),
                    partial_ratio_impl(first2, last2, first1, last1, score_cutoff));
}

template <typename Sentence1, typename Sentence2>
double partial_ratio(const Sentence1& s1, const Sentence2& s2, double score_cutoff = 0.0)
{
    return partial_ratio(std::begin(s1), std::end(s1), std::begin(s2), std::end(s2), score_cutoff);
}

} // namespace rapidfuzz_reference