1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 
528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714
|
/* Copyright (c) 2006, 2025, Oracle and/or its affiliates.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is designed to work with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have either included with
the program or referenced in the documentation.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
#ifndef RPL_UTILITY_H
#define RPL_UTILITY_H
#ifndef __cplusplus
#error "Don't include this C++ header file from a non-C++ file!"
#endif
#include <sys/types.h>
#include <algorithm>
#include <string>
#include <unordered_map>
#include "field_types.h" // enum_field_types
#include "my_dbug.h"
#include "my_inttypes.h"
#include "my_macros.h"
#include "sql/psi_memory_key.h"
struct MY_BITMAP;
#ifdef MYSQL_SERVER
#include <memory>
#include "map_helpers.h"
#include "prealloced_array.h" // Prealloced_array
#include "sql/table.h" // Table_ref
class Log_event;
class Relay_log_info;
class THD;
/**
Position record kept in the hash table that is used when applying row
events on the slave and there is no index on the slave's table.
Both members point into the event buffer (ie, the area in memory that
holds the rows before unpacking takes place).
*/
struct HASH_ROW_POS {
/**
Points at the position where the before image of the row starts in the
event buffer (ie, area in memory before unpacking takes
place).
*/
const uchar *bi_start;
/**
Points at the position where the before image of the row ends in the
event buffer.
*/
const uchar *bi_ends;
};
struct HASH_ROW_ENTRY;
/**
Deleter type plugged into the std::unique_ptr that holds each
HASH_ROW_ENTRY stored in the hash table. Only the call operator is
declared here; it is not defined in this header.
*/
struct hash_slave_rows_free_entry {
/** Called by std::unique_ptr to dispose of the entry it owns. */
void operator()(HASH_ROW_ENTRY *entry) const;
};
/**
Internal structure that acts as a preamble for HASH_ROW_POS
in the in-memory structure.
Allocation is done in Hash_slave_rows::make_entry as part of
the entry allocation.
*/
struct HASH_ROW_PREAMBLE {
/*
Defaulted constructor. No member below has a default initializer, so
hash_value and is_search_state_inited are only well defined after
value-initialization or explicit assignment.
NOTE(review): confirm that make_entry sets them before use.
*/
HASH_ROW_PREAMBLE() = default;
/*
The actual key.
*/
uint hash_value;
/**
The search state used to iterate over multiple entries for a
given key. Its type is the const_iterator of the multimap that
Hash_slave_rows uses as the hash table.
*/
malloc_unordered_multimap<
uint, std::unique_ptr<HASH_ROW_ENTRY, hash_slave_rows_free_entry>>::
const_iterator search_state;
/**
Whether search_state is usable or not.
*/
bool is_search_state_inited;
};
/**
One entry of the hash table: a pointer to the bookkeeping preamble plus a
pointer to the row positions. Entries are obtained through
Hash_slave_rows::make_entry and released through Hash_slave_rows::del.
*/
struct HASH_ROW_ENTRY {
/** Key and search-state bookkeeping for this entry. */
HASH_ROW_PREAMBLE *preamble;
/** Start and end of the row's before image in the event buffer. */
HASH_ROW_POS *positions;
};
/**
Hash table of row positions, used when applying row events on the slave
and there is no index on the slave's table.
The key of an entry is computed from the data in table->record[0] for the
columns flagged in a bitmap. Several entries may share the same key, which
is why get() is complemented by next().
*/
class Hash_slave_rows {
public:
/**
Allocates an empty entry to be added to the hash table.
It should be called before calling member function @c put.
@returns NULL if a problem occurred, a valid pointer otherwise.
*/
HASH_ROW_ENTRY *make_entry();
/**
Allocates an entry to be added to the hash table. It should be
called before calling member function @c put.
@param bi_start the position in the rows buffer where the
before image begins.
@param bi_ends the position in the rows buffer where the
before image ends.
@returns NULL if a problem occurred, a valid pointer otherwise.
*/
HASH_ROW_ENTRY *make_entry(const uchar *bi_start, const uchar *bi_ends);
/**
Puts data into the hash table. It calculates the key taking
the data on @c TABLE::record as the input for hash computation.
@param table The table holding the buffer used to calculate the
key, ie, table->record[0].
@param cols The read_set bitmap signaling which columns are used.
@param entry The entry with the values to store.
@returns true if something went wrong, false otherwise.
*/
bool put(TABLE *table, MY_BITMAP *cols, HASH_ROW_ENTRY *entry);
/**
Gets the entry, from the hash table, that matches the data in
table->record[0] and signaled using cols.
@param table The table holding the buffer containing data used to
make the entry lookup.
@param cols Bitmap signaling which columns, from
table->record[0], should be used.
@returns a pointer to the entry found. If the entry is not found
then NULL shall be returned.
*/
HASH_ROW_ENTRY *get(TABLE *table, MY_BITMAP *cols);
/**
Gets the entry that stands next to the one pointed to by
*entry. Before calling this member function, the entry that one
uses as parameter must: 1. have been obtained through get() or
next() invocations; and 2. not have been used before in a
next() operation.
@param[in,out] entry contains a pointer to an entry that we can
use to search for another adjacent entry
(ie, that shares the same key).
@returns true if something went wrong, false otherwise. In the
case that this entry was already used in a next()
operation this member function returns true and does not
update the pointer.
*/
bool next(HASH_ROW_ENTRY **entry);
/**
Deletes the entry pointed to by entry. It also frees the memory used
for holding the entry contents. This is the way to release memory
used for an entry; freeing it explicitly with my_free will cause
undefined behavior.
@param entry Pointer to the entry to be deleted.
@returns true if something went wrong, false otherwise.
*/
bool del(HASH_ROW_ENTRY *entry);
/**
Initializes the hash table.
@returns true if something went wrong, false otherwise.
*/
bool init(void);
/**
De-initializes the hash table.
@returns true if something went wrong, false otherwise.
*/
bool deinit(void);
/**
Checks if the hash table is empty or not.
@returns true if the hash table has zero entries, false otherwise.
*/
bool is_empty(void);
/**
Returns the number of entries in the hash table.
@returns the number of entries in the hash table.
*/
int size();
private:
/**
The hashtable itself: a multimap from the hash key to an owning
pointer to the entry. The unique_ptr uses hash_slave_rows_free_entry
as its deleter, and the container is constructed with
key_memory_HASH_ROW_ENTRY.
*/
malloc_unordered_multimap<
uint, std::unique_ptr<HASH_ROW_ENTRY, hash_slave_rows_free_entry>>
m_hash{key_memory_HASH_ROW_ENTRY};
/**
Auxiliary and internal method used to create a hash key, based on
the data in table->record[0] buffer and signaled as used in cols.
@param table The table that is being scanned
@param cols The read_set bitmap signaling which columns are used.
@returns the hash key created.
*/
uint make_hash_key(TABLE *table, MY_BITMAP *cols);
};
#endif
/**
A table definition from the master.
The responsibilities of this class are:
- Extract and decode table definition data from the table map event
- Check if table definition in table map is compatible with table
definition on slave
- expose the type information so that it can be used when encoding
or decoding row event data.
*/
class table_def {
public:
/**
No-op constructor. Instances of RPL_Table_ref are created by first
allocating memory, then placement-new-ing an RPL_Table_ref object
containing an uninitialized table_def object which is only conditionally
initialized. See Table_map_log_event::do_apply_event().
*/
table_def() = default;
/**
Constructor.
@param types Array of types, each stored as a byte
@param size Number of elements in array 'types'
@param field_metadata Array of extra information about fields
@param metadata_size Size of the field_metadata array
@param null_bitmap The bitmap of fields that can be null
@param flags Table flags
*/
table_def(unsigned char *types, ulong size, uchar *field_metadata,
int metadata_size, uchar *null_bitmap, uint16 flags);
~table_def();
/**
Return the number of fields there is type data for.
@return The number of fields that there is type data for.
*/
ulong size() const { return m_size; }
/**
Return the number of fields there is type data for minus
the GIPK field if this field does not exist in the replica.
@return The number of fields there is a type minus the GIPK
*/
ulong filtered_size(bool replica_has_gipk) const {
if (m_is_gipk_on_table && !replica_has_gipk) return m_size - 1;
return m_size;
}
/*
Returns internal binlog type code for one field,
without translation to real types.
*/
enum_field_types binlog_type(ulong index) const {
return static_cast<enum_field_types>(m_type[index]);
}
/// Return the number of JSON columns in this table.
int json_column_count() const {
// Cache in member field to make successive calls faster.
if (m_json_column_count == -1) {
int c = 0;
for (uint i = 0; i < size(); i++)
if (type(i) == MYSQL_TYPE_JSON) c++;
m_json_column_count = c;
}
return m_json_column_count;
}
/*
Return a representation of the type data for one field.
@param index Field index to return data for
@return Will return a representation of the type data for field
<code>index</code>. Currently, only the type identifier is
returned.
*/
enum_field_types type(ulong index) const {
assert(index < m_size);
/*
If the source type is MYSQL_TYPE_STRING, it can in reality be
either MYSQL_TYPE_STRING, MYSQL_TYPE_ENUM, or MYSQL_TYPE_SET, so
we might need to modify the type to get the real type.
*/
enum_field_types source_type = binlog_type(index);
uint source_metadata = m_field_metadata[index];
switch (source_type) {
case MYSQL_TYPE_STRING: {
int real_type = source_metadata >> 8;
if (real_type == MYSQL_TYPE_ENUM || real_type == MYSQL_TYPE_SET)
source_type = static_cast<enum_field_types>(real_type);
break;
}
/*
This type has not been used since before row-based replication,
so we can safely assume that it really is MYSQL_TYPE_NEWDATE.
*/
case MYSQL_TYPE_DATE:
source_type = MYSQL_TYPE_NEWDATE;
break;
default:
/* Do nothing */
break;
}
return source_type;
}
/*
This function allows callers to get the extra field data from the
table map for a given field. If there is no metadata for that field
or there is no extra metadata at all, the function returns 0.
The function returns the value for the field metadata for column at
position indicated by index. As mentioned, if the field was a type
that stores field metadata, that value is returned else zero (0) is
returned. This method is used in the unpack() methods of the
corresponding fields to properly extract the data from the binary log
in the event that the master's field is smaller than the slave.
*/
uint field_metadata(uint index) const {
assert(index < m_size);
if (m_field_metadata_size)
return m_field_metadata[index];
else
return 0;
}
/**
Returns whether or not the field at `index` is a typed array.
*/
bool is_array(uint index) const {
assert(index < m_size);
if (m_field_metadata_size)
return m_is_array[index];
else
return false;
}
/*
This function returns whether the field on the master can be null.
This value is derived from field->maybe_null().
*/
bool maybe_null(uint index) const {
assert(index < m_size);
return ((m_null_bits[(index / 8)] & (1 << (index % 8))) ==
(1 << (index % 8)));
}
/*
This function returns the field size in raw bytes based on the type
and the encoded field data from the master's raw data. This method can
be used for situations where the slave needs to skip a column (e.g.,
WL#3915) or needs to advance the pointer for the fields in the raw
data from the master to a specific column.
*/
uint32 calc_field_size(uint col, const uchar *master_data) const;
#ifdef MYSQL_SERVER
/**
Decide if the table definition is compatible with a table.
Compare the definition with a table to see if it is compatible
with it.
A table definition is compatible with a table if:
- The columns types of the table definition is a (not
necessarily proper) prefix of the column type of the table.
- The other way around.
- Each column on the master that also exists on the slave can be
converted according to the current settings of @c
REPLICA_TYPE_CONVERSIONS.
@param thd Current thread
@param rli Pointer to relay log info
@param table Pointer to table to compare with.
@param[out] conv_table_var Pointer to temporary table for holding
conversion table.
@retval 1 if the table definition is not compatible with @c table
@retval 0 if the table definition is compatible with @c table
*/
bool compatible_with(THD *thd, Relay_log_info *rli, TABLE *table,
TABLE **conv_table_var);
/**
Create a virtual in-memory temporary table structure.
The table structure has records and field array so that a row can
be unpacked into the record for further processing.
In the virtual table, each field that requires conversion will
have a non-NULL value, while fields that do not require
conversion will have a NULL value.
Some information that is missing in the events, such as the
character set for string types, are taken from the table that the
field is going to be pushed into, so the target table that the data
eventually need to be pushed into need to be supplied.
@param thd Thread to allocate memory from.
@param rli Relay log info structure, for error reporting.
@param target_table Target table for fields.
@param replica_has_gipk Does the replica table contain a GIPK
@return A pointer to a temporary table with memory allocated in the
thread's memroot, NULL if the table could not be created
*/
TABLE *create_conversion_table(THD *thd, Relay_log_info *rli,
TABLE *target_table,
bool replica_has_gipk) const;
/**
Evaluates if the source table might contain a GIPK
@note for servers of older versions that do not fully support GIPK, this
sets the info that is a guess based on available information replication
has.
In the case when the replica has a GIPK, the source is from an old
version that does not indicate if it has a GIPK or not, and the source
either has extra columns, or the replica has two more more extra columns
true is returned.
This function does not report an error.
@param thd The thread object associated to the application
@param table The table in the replica.
@return true if this table definition is found to be incompatible with the
table, false otherwise.
*/
bool compute_source_table_gipk_info(THD &thd, TABLE *table);
/**
Checks if the table contains a GIPK
@note for servers of older versions that do not fully support GIPK, this
method returns a guess based on available information replication has.
@return true if we believe the table to contain a GIPK, false otherwise
*/
bool is_gipk_present_on_source_table() const;
#endif
private:
ulong m_size; // Number of elements in the types array
unsigned char *m_type; // Array of type descriptors
uint m_field_metadata_size;
uint *m_field_metadata;
uchar *m_null_bits;
uint16 m_flags; // Table flags
uchar *m_memory;
mutable int m_json_column_count; // Number of JSON columns
bool *m_is_array;
bool m_is_gipk_set;
bool m_is_gipk_on_table;
};
#ifdef MYSQL_SERVER
/**
Extend the normal Table_ref with a few new fields needed by the
slave thread, but nowhere else.
*/
struct RPL_Table_ref : public Table_ref {
  /**
    Forwards every argument unchanged to the Table_ref constructor.

    The replication-specific members below get their values from default
    member initializers, so a freshly constructed object never exposes an
    indeterminate flag or pointer.
  */
  RPL_Table_ref(const char *db_name_arg, size_t db_length_arg,
                const char *table_name_arg, size_t table_name_length_arg,
                const char *alias_arg, enum thr_lock_type lock_type_arg)
      : Table_ref(db_name_arg, db_length_arg, table_name_arg,
                  table_name_length_arg, alias_arg, lock_type_arg) {}

  /**
    Presumably tells whether m_tabledef has been initialized; starts out
    false because table_def's default constructor is a no-op.
    NOTE(review): confirm against the code that sets and clears it.
  */
  bool m_tabledef_valid{false};

  /** Table definition received from the source; see table_def. */
  table_def m_tabledef;

  /**
    Presumably the conversion table produced by
    table_def::compatible_with; null until one is assigned.
    NOTE(review): confirm against the caller.
  */
  TABLE *m_conv_table{nullptr};
};
/**
Container of Log_event pointers whose execution is deferred. The member
functions are only declared here; they are not defined in this header.
*/
class Deferred_log_events {
private:
/* The deferred events, stored as pointers in a Prealloced_array. */
Prealloced_array<Log_event *, 32> m_array;
public:
Deferred_log_events();
~Deferred_log_events();
/* queue for execution at Query-log-event time prior to the Query */
int add(Log_event *ev);
/* NOTE(review): presumably true when no event is queued - confirm. */
bool is_empty();
/*
NOTE(review): presumably runs the queued events in the context of rli;
the meaning of the returned bool is not visible here - confirm.
*/
bool execute(Relay_log_info *rli);
/* NOTE(review): presumably discards the queued events - confirm. */
void rewind();
};
#endif
/**
Decode field metadata from a char buffer (serialized form) into an int
(packed form).
@note On little-endian platforms (e.g. Intel) this function effectively
inverts the order of bytes compared to what Field::save_field_metadata()
writes. E.g. for MYSQL_TYPE_NEWDECIMAL save_field_metadata writes precision
into the first byte and decimals into the second, while this function puts
precision into the second byte and decimals into the first. This layout
is expected by replication code that reads metadata in the uint form.
Due to this design feature show_sql_type() can't correctly print the
immediate output of save_field_metadata(); this function has to be used
as a translator.
@param buffer Field metadata, in the character stream form produced by
save_field_metadata.
@param binlog_type The type of the field, in the form returned by
Field::binlog_type and stored in Table_map_log_event.
@return a pair where:
- the first component is the length of the metadata within 'buffer',
i.e., how much the buffer pointer should move forward in order to skip it.
- the second component is a pair containing:
- the metadata, encoded as a 'uint', in the form required by e.g.
show_sql_type.
- a bool indicating whether the field is an array (true) or a scalar (false)
*/
std::pair<my_off_t, std::pair<uint, bool>> read_field_metadata(
const uchar *buffer, enum_field_types binlog_type);
// Debug helper that renders a bitmap as a string of '0'/'1' characters and
// hands it to DBUG_PRINT.
//   N   - first argument given to DBUG_PRINT.
//   FRM - format given to DBUG_PRINT; the bit string is its only argument.
//   BS  - pointer to the bitmap; it must expose n_bits and be accepted by
//         bitmap_is_set.
// NB. number of printed bit values is limited to sizeof(buf) - 1, ie, 255;
// bits beyond that limit are left out of the output.
// The expansion declares the locals `buf` and `i` inside its own do/while
// scope, so arguments that refer to names spelled `buf` or `i` would be
// shadowed.
#define DBUG_PRINT_BITSET(N, FRM, BS) \
do { \
char buf[256]; \
uint i; \
for (i = 0; i < std::min(uint{sizeof(buf) - 1}, (BS)->n_bits); i++) \
buf[i] = bitmap_is_set((BS), i) ? '1' : '0'; \
buf[i] = '\0'; \
DBUG_PRINT((N), ((FRM), buf)); \
} while (0)
#ifdef MYSQL_SERVER
/**
Sentry class for managing the need to create and dispose of a local `THD`
instance.
If the `THD` object pointer passed to the constructor is `nullptr`, a
new instance will be initialized within the constructor and disposed of in the
destructor.
If the `THD` object pointer passed to the constructor is not `nullptr`,
the reference is kept and nothing is disposed of in the destructor.
A conversion operator to `THD*` is also provided, to ease code replacement.
Usage example:
THD_instance_guard thd{current_thd != nullptr ? current_thd :
this->info_thd};
Acl_cache_lock_guard guard{thd, Acl_cache_lock_mode::READ_MODE};
if (guard.lock())
...
*/
class THD_instance_guard {
public:
/**
If the given `THD` object pointer is `nullptr`, a new instance will be
initialized within the constructor and disposed of in the destructor.
If the given `THD` object pointer is not `nullptr`, the reference is kept
and nothing is disposed of in the destructor.
The constructor is not `explicit`, so a `THD *` converts implicitly to a
guard.
@param thd `THD` object reference that determines if an existing instance
is used or a new instance of `THD` must be created.
*/
THD_instance_guard(THD *thd);
/**
If a new instance of `THD` was created in the constructor, it will be
disposed of here.
*/
virtual ~THD_instance_guard();
/**
Returns the active `THD` object pointer.
@return a not-nullptr `THD` object pointer.
*/
operator THD *();
private:
/** The active `THD` object pointer. */
THD *m_target{nullptr};
/**
Tells whether or not the active `THD` object was created in this object's
constructor.
*/
bool m_is_locally_initialized{false};
};
#endif // MYSQL_SERVER
/**
Replaces every occurrence of the string `find` by the string `replace`, within
the string `from` and returns the resulting string.
The original string `from` remains untouched; all three arguments are taken
by value.
@param from the string to search within.
@param find the string to search for.
@param replace the string that is substituted for every occurrence of `find`.
@return a new string, holding the result of the search and replace operation.
*/
std::string replace_all_in_str(std::string from, std::string find,
std::string replace);
#ifdef MYSQL_SERVER
/**
Evaluates whether the command being executed goes against any of the
restrictions of the server variable session.require_row_format.
@param thd The thread associated with the command
@return true if it violates any restrictions,
false otherwise
*/
bool is_require_row_format_violation(const THD *thd);
/**
Blindly replaces some deprecated terms used in the field names with more
recent ones. This function must be removed once the related syntax
(SHOW SLAVE STATUS and friends) is removed.
@param thd the thread context.
@param field_list the list of fields that will have their names checked
and altered if needed. It is passed by non-const reference.
*/
void rename_fields_use_old_replica_source_terms(
THD *thd, mem_root_deque<Item *> &field_list);
/**
Checks whether the immediate_server_version supports GIPKs or not.
@param thd The THD context used to check the version
@return true if the source server supports GIPK, false otherwise
*/
bool is_immediate_server_gipk_ready(THD &thd);
/**
Returns whether the replicated table contains a GIPK or not.
@note for servers of older versions that do not fully support GIPK, this
function returns a guess based on the information available to replication.
@param rli The relay log object associated with the channel
@param table The table to check for the GIPK
@return true if we believe the table has a GIPK, false otherwise.
*/
bool does_source_table_contain_gipk(Relay_log_info const *rli, TABLE *table);
/**
@brief Returns a string representation for a given version
@param version a version represented using an integer
@return a string for the given version or "unknown"
if version is undefined or unknown.
*/
std::string decimal_numeric_version_to_string(uint32 version);
#endif // MYSQL_SERVER
#endif /* RPL_UTILITY_H */
|