File: collation_loader-t.cc

package info (click to toggle)
mysql-8.0 8.0.43-3
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 1,273,924 kB
  • sloc: cpp: 4,684,605; ansic: 412,450; pascal: 108,398; java: 83,641; perl: 30,221; cs: 27,067; sql: 26,594; sh: 24,181; python: 21,816; yacc: 17,169; php: 11,522; xml: 7,388; javascript: 7,076; makefile: 2,194; lex: 1,075; awk: 670; asm: 520; objc: 183; ruby: 97; lisp: 86
file content (124 lines) | stat: -rw-r--r-- 4,635 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
/* Copyright (c) 2017, 2025, Oracle and/or its affiliates.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License, version 2.0,
   as published by the Free Software Foundation.

   This program is designed to work with certain software (including
   but not limited to OpenSSL) that is licensed under separate terms,
   as designated in a particular file or component or in included license
   documentation.  The authors of MySQL hereby grant you an additional
   permission to link the program and your derivative works with the
   separately licensed software that they have either included with
   the program or referenced in the documentation.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License, version 2.0, for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301  USA */

/*
  The benchmarks below measure the character set loader in two scenarios:
  1. Loading a collation. This happens in a query like 'SELECT a FROM tbl
     ORDER BY a COLLATE coll_name', where 'coll_name' is the name of the
     collation used for ordering, such as 'latin1_swedish_ci'.
  2. Loading a character set. In MySQL, when you ask for a 'character set',
     you actually get a collation. For example, when executing 'SELECT _utf16
     0x0100', MySQL uses the pointer to the collation 'utf16_general_ci' to
     handle this character.
*/

#include <gtest/gtest.h>
#include <atomic>
#include <cstddef>
#include <cstdlib>
#include <cstring>
#include <random>
#include <string>
#include <thread>
#include <vector>

#include "m_ctype.h"
#include "my_sys.h"
#include "unittest/gunit/benchmark.h"

namespace collation_loader_unittest {

namespace {

/**
  Looks up a collation by its name.

  @param name collation name, e.g. "latin1_swedish_ci".

  @return whatever my_collation_get_by_name() returns for this name; the
          callers in this file expect a non-null pointer for known names.
*/
CHARSET_INFO *lookup_collation(const char *name) {
  // NOTE(review): the loader is handed over without explicit initialization;
  // presumably the callee sets it up - confirm.
  MY_CHARSET_LOADER charset_loader;
  CHARSET_INFO *const collation =
      my_collation_get_by_name(&charset_loader, name, MYF(0));
  return collation;
}

/**
  Looks up a character set by its name.

  @param name character set name, e.g. "latin1".
  @param flag forwarded unchanged to my_charset_get_by_name(); the callers in
              this file pass MY_CS_PRIMARY or MY_CS_BINSORT.

  @return whatever my_charset_get_by_name() returns for this name and flag;
          the callers in this file expect a non-null pointer.
*/
CHARSET_INFO *lookup_charset(const char *name, int flag) {
  // NOTE(review): the loader is handed over without explicit initialization;
  // presumably the callee sets it up - confirm.
  MY_CHARSET_LOADER charset_loader;
  CHARSET_INFO *const charset =
      my_charset_get_by_name(&charset_loader, name, flag, MYF(0));
  return charset;
}

}  // namespace

static void BM_LookupAllCollations(size_t num_iterations) {
  StopBenchmarkTiming();

  // Look up one collation to initialize the all_charsets array.
  lookup_collation("latin1_swedish_ci");
  size_t num_charsets = array_elements(all_charsets);

  StartBenchmarkTiming();
  for (size_t i = 0; i < num_iterations; i++) {
    const CHARSET_INFO *cs = all_charsets[i % num_charsets];
    if (cs) {
      EXPECT_NE(lookup_collation(cs->m_coll_name), nullptr);
    }
  }
}
BENCHMARK(BM_LookupAllCollations)

/**
  Character set names looked up by BM_LookupAllCharsets.

  The list is only ever read, so it is declared const to rule out accidental
  modification after initialization.
*/
static const std::vector<std::string> charsets = {
    "armscii8", "ascii",   "big5",   "binary",  "cp1250",  "cp1251",
    "cp1256",   "cp1257",  "cp850",  "cp852",   "cp866",   "cp932",
    "dec8",     "eucjpms", "euckr",  "gb18030", "gb2312",  "gbk",
    "geostd8",  "greek",   "hebrew", "hp8",     "keybcs2", "koi8r",
    "koi8u",    "latin1",  "latin2", "latin5",  "latin7",  "macce",
    "macroman", "sjis",    "swe7",   "tis620",  "ucs2",    "ujis",
    "utf16",    "utf16le", "utf32",  "utf8",    "utf8mb4",
};

static void BM_LookupAllCharsets(size_t num_iterations) {
  StopBenchmarkTiming();

  // Look up one collation to initialize the all_charsets array.
  lookup_collation("latin1_swedish_ci");

  StartBenchmarkTiming();
  for (size_t i = 0; i < num_iterations; i++) {
    const std::string &charset = charsets[i % charsets.size()];
    EXPECT_NE(lookup_charset(charset.c_str(), MY_CS_PRIMARY), nullptr);
    EXPECT_NE(lookup_charset(charset.c_str(), MY_CS_BINSORT), nullptr);
  }
}
BENCHMARK(BM_LookupAllCharsets)

/**
  Worker body of the RandomCollation test: generates 100000 random collation
  names and expects get_collation_number() to return 0 for each of them.

  Every name consists of 1 to 64 lowercase ASCII letters. The function is run
  by several threads at the same time, so it draws from its own local
  pseudo-random engine instead of rand(), which is not required to be
  thread-safe. Each invocation takes a distinct seed from an atomic counter:
  concurrent workers therefore try different names, while the set of seeds
  used stays the same from run to run.
*/
void TestRandomCollation() {
  constexpr size_t kMaxNameLength = 64;
  constexpr int kNumLookups = 100000;

  static std::atomic<unsigned> next_seed{0};
  std::mt19937 engine(next_seed.fetch_add(1));
  std::uniform_int_distribution<size_t> length_dist(1, kMaxNameLength);
  std::uniform_int_distribution<int> letter_dist(0, 25);

  for (int ix = 0; ix < kNumLookups; ix++) {
    // Zero-filled on every iteration, so the name is always NUL-terminated
    // regardless of the length chosen below.
    char coll_name[kMaxNameLength + 1] = {};
    // Generate a random collation name whose length is in range [1, 64].
    const size_t name_len = length_dist(engine);
    for (size_t i = 0; i < name_len; i++) {
      // Use ASCII latin letters to generate the name.
      coll_name[i] = static_cast<char>('a' + letter_dist(engine));
    }
    const int rc = get_collation_number(coll_name);
    // Random collation that doesn't exist should return 0.
    EXPECT_EQ(0, rc);
  }
}

// Runs TestRandomCollation concurrently on four threads and waits for all of
// them to finish.
TEST(CollationLoaderTest, RandomCollation) {
  // Look up one collation first so that the all_charsets array is
  // initialized before the worker threads start.
  lookup_collation("latin1_swedish_ci");

  constexpr int kNumThreads = 4;
  std::thread workers[kNumThreads];
  for (std::thread &worker : workers) {
    worker = std::thread(TestRandomCollation);
  }
  for (std::thread &worker : workers) {
    worker.join();
  }
}
}  // namespace collation_loader_unittest