File: trie_builder.py

package info (click to toggle)
chromium 138.0.7204.183-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 6,071,908 kB
  • sloc: cpp: 34,937,088; ansic: 7,176,967; javascript: 4,110,704; python: 1,419,953; asm: 946,768; xml: 739,971; pascal: 187,324; sh: 89,623; perl: 88,663; objc: 79,944; sql: 50,304; cs: 41,786; fortran: 24,137; makefile: 21,806; php: 13,980; tcl: 13,166; yacc: 8,925; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (57 lines) | stat: -rw-r--r-- 1,630 bytes parent folder | download | duplicates (8)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
# Copyright 2016 The Chromium Authors
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

from collections import defaultdict


def _single_trie(string_to_value_pairs, index):
    """Build a single trie from a dict of input string to output values.

    This function assumes that all of the strings in
    string_to_value_pairs have the same length.
    The input
    {'abcd': 'ABCD', 'adef': 'ADEF', 'adeg': 'ADEG'}
    creates a trie like this:
    {
     'a' : {
      'b': {'cd' : "ABCD"},
      'd' : {
       'e' : {
        'f' : {'': "ADEF"},
        'g' : {'': "ADEG"},
       },
      },
     },
    }
    """
    dicts_by_indexed_letter = defaultdict(list)
    for string, value in string_to_value_pairs:
        dicts_by_indexed_letter[string[index]].append((string, value))

    output = {}
    for char, d in dicts_by_indexed_letter.items():
        if len(d) == 1:
            string = d[0][0]
            value = d[0][1]
            output[char] = {string[index + 1:]: value}
        else:
            output[char] = _single_trie(d, index + 1)

    return output


def trie_list_by_str_length(str_to_return_value_dict):
    """Split a string-to-value dict into one trie per string length.

    The entries are bucketed by the length of their key, and each bucket
    is sorted and turned into a trie via _single_trie starting at
    character 0.

    Callers are expected to pass all-lower-case strings; nothing here
    checks or converts case.

    Args:
        str_to_return_value_dict: dict mapping input strings to the
            values they should resolve to.

    Returns:
        A list of (length, trie) tuples in ascending order of length.
    """
    buckets = defaultdict(list)
    for key, result in str_to_return_value_dict.items():
        buckets[len(key)].append((key, result))

    # Sorting both the lengths and the pairs within each bucket keeps the
    # output independent of the input dict's iteration order.
    return [(size, _single_trie(sorted(buckets[size]), 0))
            for size in sorted(buckets)]