-
Notifications
You must be signed in to change notification settings - Fork 4k
/
Copy pathtable_cache.h
686 lines (550 loc) · 21.5 KB
/
table_cache.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
/* Copyright (c) 2012, 2024, Oracle and/or its affiliates.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is designed to work with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have either included with
the program or referenced in the documentation.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
#ifndef TABLE_CACHE_INCLUDED
#define TABLE_CACHE_INCLUDED
#include <assert.h>
#include <stddef.h>
#include <sys/types.h>
#include <atomic>
#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include "lex_string.h"
#include "my_base.h"
#include "my_psi_config.h"
#include "mysql/components/services/bits/mysql_mutex_bits.h"
#include "mysql/components/services/bits/psi_mutex_bits.h"
#include "mysql/psi/mysql_mutex.h"
#include "sql/aggregated_stats.h"
#include "sql/handler.h"
#include "sql/sql_base.h"
#include "sql/sql_class.h"
#include "sql/sql_plist.h"
#include "sql/system_variables.h"
#include "sql/table.h"
#include "sql/table_trigger_dispatcher.h"
/* Forward declaration; the full class is defined later in this header. */
class Table_cache_element;
/*
Table cache sizing variables, defined outside this header.
In this header table_cache_size_per_instance and
table_cache_triggers_per_instance are used as the per-instance limits in
Table_cache::free_unused_tables_if_necessary(), and table_cache_instances
is the number of Table_cache instances actually in use.
*/
extern ulong table_cache_size_per_instance, table_cache_instances,
table_cache_triggers, table_cache_triggers_per_instance;
/*
Sharded statistics, defined outside this header. Used here to count
table cache overflows when unused TABLE objects are evicted.
*/
extern struct aggregated_stats global_aggregated_stats;
/**
Cache for open TABLE objects.
The idea behind this cache is that most statements don't need to
go to a central table definition cache to get a TABLE object and
therefore don't need to lock LOCK_open mutex.
Instead they only need to go to one Table_cache instance (the
specific instance is determined by thread id) and only lock the
mutex protecting this cache.
DDL statements that need to remove all TABLE objects from all caches
need to lock mutexes for all Table_cache instances, but they are rare.
This significantly increases scalability in some scenarios.
*/
class Table_cache {
private:
/**
The table cache lock protects the following data:
1) m_unused_tables list.
2) m_cache hash.
3) used_tables, free_tables_slim and free_tables_full_triggers lists in
Table_cache_element objects in this cache.
4) m_table_count - total number of TABLE objects in this cache.
5) the element in TABLE_SHARE::cache_element[] array that corresponds
to this cache,
6) in_use member in TABLE object.
7) Also ownership of mutexes for all caches is required to update
the refresh_version and table_def_shutdown_in_progress variables
and TABLE_SHARE::version member.
The intention is that any query that finds a cached table object in
its designated table cache should only need to lock this mutex
instance and there should be no need to lock LOCK_open. LOCK_open is
still required however to create and release TABLE objects. However
most usage of the MySQL Server should be able to set the cache size
big enough so that the majority of the queries only need to lock this
mutex instance and not LOCK_open.
*/
mysql_mutex_t m_lock;
/**
The hash of Table_cache_element objects, each table/table share that
has any TABLE object in the Table_cache has a Table_cache_element from
which the list of free TABLE objects in this table cache AND the list
of used TABLE objects in this table cache is stored.
We use Table_cache_element::share::table_cache_key as key for this hash.
The hash owns its elements: erasing an entry destroys the
Table_cache_element.
*/
std::unordered_map<std::string, std::unique_ptr<Table_cache_element>> m_cache;
/**
List that contains all TABLE instances for tables in this particular
table cache that are not in use by any thread. Recently used TABLE
instances are appended to the end of the list. Thus the beginning of
the list contains the instances which have been least recently used.
The list is circular and linked through TABLE::next / TABLE::prev;
this pointer refers to its head and is nullptr when the list is empty.
*/
TABLE *m_unused_tables;
/**
Total number of TABLE instances for tables in this particular table
cache (both in use by threads and not in use).
This value summed over all table caches is accessible to users as
Open_tables status variable.
*/
uint m_table_count;
/**
LRU-organized list containing all TABLE instances with fully-loaded
triggers in this table cache which are not in use by any thread.
The head (front) is the least recently used TABLE: instances are
appended at the tail when they become unused, and eviction takes
the front element.
*/
I_P_List<TABLE,
I_P_List_adapter<TABLE, &TABLE::triggers_lru_next,
&TABLE::triggers_lru_prev>,
I_P_List_null_counter, I_P_List_fast_push_back<TABLE>>
m_unused_triggers_lru;
/**
Total number of TABLE instances in this table cache with fully-loaded
triggers (both in use and unused).
@sa notify_triggers_load() for rationale behind use of atomic here.
*/
std::atomic<uint> m_table_triggers_count;
#ifdef HAVE_PSI_INTERFACE
/*
Instrumentation data, present only when HAVE_PSI_INTERFACE is defined.
NOTE(review): presumably the key and registration info for m_lock, set up
by init_psi_keys() - confirm in the implementation file.
*/
static PSI_mutex_key m_lock_key;
static PSI_mutex_info m_mutex_keys[];
#endif
private:
/*
Hook called by link_unused_table() and unlink_unused_table() after they
modify the m_unused_tables list. It has an out-of-line implementation
only in EXTRA_DEBUG builds; otherwise it is an empty inline function.
*/
#ifdef EXTRA_DEBUG
void check_unused();
#else
void check_unused() {}
#endif
/* Helpers defined inline later in this header. */
inline void link_unused_table(TABLE *table);
inline void unlink_unused_table(TABLE *table);
inline void free_unused_tables_if_necessary(THD *thd);
public:
/*
Not defined in this header.
NOTE(review): presumably set up / tear down m_lock and the cache
containers - confirm in the implementation file.
*/
bool init();
void destroy();
static void init_psi_keys();
/** Acquire lock on table cache instance. */
void lock() { mysql_mutex_lock(&m_lock); }
/** Release lock on table cache instance. */
void unlock() { mysql_mutex_unlock(&m_lock); }
/** Assert that caller owns lock on the table cache. */
void assert_owner() { mysql_mutex_assert_owner(&m_lock); }
/* The four methods below are defined inline later in this header. */
inline TABLE *get_table(THD *thd, const char *key, size_t key_length,
bool is_update, TABLE_SHARE **share);
inline void release_table(THD *thd, TABLE *table);
inline bool add_used_table(THD *thd, TABLE *table);
inline void remove_table(TABLE *table);
/** Get number of TABLE instances in the cache. */
uint cached_tables() const { return m_table_count; }
/* Not defined in this header. */
void free_all_unused_tables();
/**
Notify the table cache that we have finalized loading and parsing
triggers for one of its TABLE objects.
@note We use atomic to make it MT-safe without introducing overhead
from lock()/unlock() pair.
*/
void notify_triggers_load() { m_table_triggers_count++; }
/**
Get number of TABLE instances with fully-loaded triggers in the cache
(the current value of m_table_triggers_count).
*/
uint loaded_triggers_tables() const { return m_table_triggers_count; }
#ifndef NDEBUG
/* Debug-only helper (compiled out when NDEBUG is defined). */
void print_tables();
#endif
};
/**
Container class for all table cache instances in the system.
*/
class Table_cache_manager {
public:
/** Maximum supported number of table cache instances. */
static const int MAX_TABLE_CACHES = 64;
/** Default number of table cache instances */
static const int DEFAULT_MAX_TABLE_CACHES = 16;
/*
Not defined in this header.
NOTE(review): presumably initialize / destroy the Table_cache instances
held in m_table_cache - confirm in the implementation file.
*/
bool init();
void destroy();
/**
Get instance of table cache to be used by particular connection.
The instance is chosen as the connection's thread id modulo
table_cache_instances, so a given thread id always maps to the same
instance while table_cache_instances stays unchanged.
*/
Table_cache *get_cache(THD *thd) {
return &m_table_cache[thd->thread_id() % table_cache_instances];
}
/**
Get index for the table cache in container.
@param cache Pointer to an element of m_table_cache. The result is the
pointer distance from the first element, so it is only
meaningful for pointers into that array.
*/
uint cache_index(Table_cache *cache) const {
return static_cast<uint>(cache - &m_table_cache[0]);
}
/*
The methods below are not defined in this header.
NOTE(review): judging by their names they operate on all cache instances
at once (and, for the *_tdc variants, also on the table definition cache
lock) - confirm against the implementation file.
*/
uint cached_tables();
void lock_all_and_tdc();
void unlock_all_and_tdc();
void assert_owner(THD *thd);
void assert_owner_all();
void assert_owner_all_and_tdc();
void free_table(THD *thd, enum_tdc_remove_table_type remove_type,
TABLE_SHARE *share);
void free_all_unused_tables();
#ifndef NDEBUG
/* Debug-only helper (compiled out when NDEBUG is defined). */
void print_tables();
#endif
friend class Table_cache_iterator;
private:
/**
An array of Table_cache instances.
Only the first table_cache_instances elements in it are used.
*/
Table_cache m_table_cache[MAX_TABLE_CACHES];
};
/*
The global container of table cache instances; defined outside this header.
The inline methods below use it to map a Table_cache to its index.
*/
extern Table_cache_manager table_cache_manager;
/**
  Element that represents the table in the specific table cache.

  For a table cache instance it plays a role similar to the one that
  TABLE_SHARE plays for the table definition cache.

  It is an implementation detail of Table_cache and is present
  in the header file only to allow inlining of some methods.
*/
class Table_cache_element {
 private:
  /*
    Doubly-linked (back-linked) lists of used and unused TABLE objects
    for this table in this table cache (one such list per table cache).
    The lists are linked through TABLE::cache_next / TABLE::cache_prev.
  */
  using TABLE_list = I_P_List<
      TABLE, I_P_List_adapter<TABLE, &TABLE::cache_next, &TABLE::cache_prev>>;

  /** List of TABLE objects for this table which are in use by some thread. */
  TABLE_list used_tables;

  /**
    List of unused TABLE objects that do not have fully-loaded triggers;
    either because there were no triggers, or because the triggers were
    not previously loaded as they were not needed for read-only statements.
    (This distinction is why our nomenclature is not just full <-> lazy.)
  */
  TABLE_list free_tables_slim;

  /** List of unused TABLE objects with fully-loaded triggers. */
  TABLE_list free_tables_full_triggers;

  /** Table share this element describes; not owned by the element. */
  TABLE_SHARE *share;

 public:
  /**
    Create an element with empty TABLE lists for the given table share.

    The constructor is explicit so that a TABLE_SHARE pointer is never
    silently converted into a cache element.

    @param share_arg  Table share represented by this element.
  */
  explicit Table_cache_element(TABLE_SHARE *share_arg) : share(share_arg) {}

  /** Get the table share represented by this element. */
  TABLE_SHARE *get_share() const { return share; }

  friend class Table_cache;
  friend class Table_cache_manager;
  friend class Table_cache_iterator;
};
/**
Iterator which allows to go through all used TABLE instances
for the table in all table caches.
*/
class Table_cache_iterator {
/** Table share whose used TABLE instances are enumerated. */
const TABLE_SHARE *share;
/** Index of the table cache instance the iterator is positioned in. */
uint current_cache_index;
/**
TABLE that the next operator++ call will return; nullptr when there are
no more used TABLE instances.
*/
TABLE *current_table;
/**
Starting from current_cache_index, position the iterator on the first
used TABLE of the first cache that has one for this share.
*/
inline void move_to_next_table();
public:
/**
Construct iterator over all used TABLE objects for the table share.
@note Assumes that caller owns locks on all table caches.
*/
inline Table_cache_iterator(const TABLE_SHARE *share_arg);
/**
Return the TABLE the iterator is positioned on (nullptr at the end)
and advance to the next used TABLE.
*/
inline TABLE *operator++(int);
/** Restart the iteration from the first table cache instance. */
inline void rewind();
};
/**
  Append a TABLE to the tail of this cache's list of unused tables, making
  it the most recently used entry of that list.

  A TABLE whose triggers are fully loaded is additionally appended to the
  LRU list of unused tables with fully-loaded triggers.

  @param table  TABLE instance that has just become unused.
*/
void Table_cache::link_unused_table(TABLE *table) {
  if (!m_unused_tables) {
    /* Empty list: the table forms a one-element ring and becomes the head. */
    table->prev = table;
    table->next = table;
    m_unused_tables = table;
  } else {
    /* The list is circular, so "just before the head" is the tail. */
    TABLE *const head = m_unused_tables;
    TABLE *const old_tail = head->prev;
    table->next = head;
    table->prev = old_tail;
    head->prev = table;
    old_tail->next = table;
  }

  check_unused();

  if (table->triggers && table->triggers->has_load_been_finalized()) {
    m_unused_triggers_lru.push_back(table);
  }
}
/**
  Take a TABLE out of this cache's list of unused tables.

  A TABLE whose triggers are fully loaded is also taken out of the LRU list
  of unused tables with fully-loaded triggers.

  @param table  TABLE instance currently linked into the unused list.
*/
void Table_cache::unlink_unused_table(TABLE *table) {
  TABLE *const successor = table->next;
  TABLE *const predecessor = table->prev;

  /* Close the ring around the removed entry. */
  successor->prev = predecessor;
  predecessor->next = successor;

  if (m_unused_tables == table) {
    /*
      The head is going away. If the table was its own successor it was
      the only entry, so the list becomes empty.
    */
    m_unused_tables = (successor == table) ? nullptr : successor;
  }

  check_unused();

  if (table->triggers && table->triggers->has_load_been_finalized()) {
    m_unused_triggers_lru.remove(table);
  }
}
/**
  Evict unused TABLE instances while this cache is over one of its limits.

  Two limits are enforced: the total number of TABLE objects
  (table_cache_size_per_instance) and the number of TABLE objects with
  fully-loaded triggers (table_cache_triggers_per_instance).

  @note More than one instance may have to be freed in a single call if
        a limit was lowered dynamically at server run time.
  @note There is no good way to "unload" triggers, so when the trigger
        limit is exceeded the whole TABLE object is freed.

  @param thd  Thread context; its status counters record the overflows.
*/
void Table_cache::free_unused_tables_if_necessary(THD *thd) {
  /* Over the TABLE limit and there is something unused to evict. */
  const auto tables_over_limit = [this] {
    return m_table_count > table_cache_size_per_instance && m_unused_tables;
  };
  /* Over the trigger limit and there is an unused TABLE with triggers. */
  const auto triggers_over_limit = [this] {
    return m_table_triggers_count > table_cache_triggers_per_instance &&
           !m_unused_triggers_lru.is_empty();
  };

  /* Common case: nothing to evict, so LOCK_open is never taken. */
  if (!tables_over_limit() && !triggers_over_limit()) return;

  mysql_mutex_lock(&LOCK_open);

  /* Evict from the head of the unused list, i.e. least recently used. */
  while (tables_over_limit()) {
    TABLE *victim = m_unused_tables;
    remove_table(victim);
    intern_close_table(victim);
    thd->status_var.table_open_cache_overflows++;
    global_aggregated_stats.get_shard(thd->thread_id())
        .table_open_cache_overflows++;
  }

  /* Same for unused TABLE instances with fully-loaded triggers. */
  while (triggers_over_limit()) {
    TABLE *victim = m_unused_triggers_lru.front();
    remove_table(victim);
    intern_close_table(victim);
    thd->status_var.table_open_cache_triggers_overflows++;
    DBUG_PRINT("info", ("table_open_cache_triggers_overflows: %llu",
                        thd->status_var.table_open_cache_triggers_overflows));
  }

  mysql_mutex_unlock(&LOCK_open);
}
/**
  Add newly created TABLE object which is going to be used right away
  to the table cache.

  @param thd    Thread context; must already be set as table->in_use.
  @param table  TABLE object to add to the list of used tables.

  @note Caller should own lock on the table cache.
  @note Expects TABLE::in_use to be already set to thd (asserted).
  @note May free unused TABLE objects if the cache is over its limits.

  @retval false - success.
  @retval true  - failure (never returned by the current implementation).
*/
bool Table_cache::add_used_table(THD *thd, TABLE *table) {
  assert_owner();
  assert(table->in_use == thd);

  /* Slot in TABLE_SHARE::cache_element[] that corresponds to this cache. */
  const uint cache_idx = table_cache_manager.cache_index(this);

  /*
    Try to get Table_cache_element representing this table in the cache
    from array in the TABLE_SHARE.
  */
  Table_cache_element *el = table->s->cache_element[cache_idx];

  if (!el) {
    /*
      If TABLE_SHARE doesn't have pointer to the element representing table
      in this cache, the element for the table must be absent from the table
      cache.

      Allocate new Table_cache_element object and add it to the cache
      and array in TABLE_SHARE.
    */
    std::string key(table->s->table_cache_key.str,
                    table->s->table_cache_key.length);
    assert(m_cache.count(key) == 0);

    /*
      Keep the raw pointer before ownership is handed over to m_cache;
      the key is no longer needed afterwards, so it is moved, not copied.
    */
    auto new_element = std::make_unique<Table_cache_element>(table->s);
    el = new_element.get();
    m_cache.emplace(std::move(key), std::move(new_element));
    table->s->cache_element[cache_idx] = el;
  }

  /* Add table to the used tables list */
  el->used_tables.push_front(table);

  m_table_count++;

  free_unused_tables_if_necessary(thd);

  return false;
}
/**
  Detach a used or unused TABLE instance from the table cache so that it
  can be destroyed.

  When the removed instance was the last one for its table in this cache,
  the Table_cache_element is dropped as well and the matching slot in
  TABLE_SHARE::cache_element[] is reset.

  @param table  TABLE instance to remove.

  @note Caller should own lock on the table cache.
*/
void Table_cache::remove_table(TABLE *table) {
  const uint cache_idx = table_cache_manager.cache_index(this);
  Table_cache_element *el = table->s->cache_element[cache_idx];
  const auto has_full_triggers = [table] {
    return table->triggers && table->triggers->has_load_been_finalized();
  };

  assert_owner();

  if (table->in_use) {
    /* In use: only the per-table list of used TABLE objects knows it. */
    el->used_tables.remove(table);
  } else {
    /* Unused: drop it from the per-table free list it belongs to ... */
    auto &free_list = has_full_triggers() ? el->free_tables_full_triggers
                                          : el->free_tables_slim;
    free_list.remove(table);
    /* ... and from the per-cache unused list. */
    unlink_unused_table(table);
  }

  --m_table_count;
  if (has_full_triggers()) --m_table_triggers_count;

  const bool element_is_empty = el->used_tables.is_empty() &&
                                el->free_tables_full_triggers.is_empty() &&
                                el->free_tables_slim.is_empty();
  if (!element_is_empty) return;

  /* No TABLE left for this share: erasing the entry destroys the element. */
  const std::string key(table->s->table_cache_key.str,
                        table->s->table_cache_key.length);
  m_cache.erase(key);

  /* The TABLE_SHARE must not keep a pointer to the destroyed element. */
  table->s->cache_element[cache_idx] = nullptr;
}
/**
  Look up the table in this cache and, if possible, hand out one of its
  unused TABLE instances.

  @param      thd         Thread context.
  @param      key         Key identifying table.
  @param      key_length  Length of key for the table.
  @param      is_update   True if the statement is going to use the TABLE
                          object for updating the table; a TABLE instance
                          with fully-loaded triggers is then preferred.
  @param[out] share       NULL if the cache has no information about the
                          table (neither used nor unused TABLE objects),
                          pointer to its TABLE_SHARE otherwise.

  @note Caller should own lock on the table cache.
  @note Sets TABLE::in_use member as side effect.

  @retval non-NULL - pointer to a previously unused TABLE object; "share"
                     points to the TABLE_SHARE for this table.
  @retval NULL     - no unused TABLE object was found; "share" points to
                     the TABLE_SHARE if the cache has used TABLE objects
                     for the table and is NULL otherwise.
*/
TABLE *Table_cache::get_table(THD *thd, const char *key, size_t key_length,
                              bool is_update, TABLE_SHARE **share) {
  assert_owner();

  *share = nullptr;

  const auto found = m_cache.find(std::string(key, key_length));
  if (found == m_cache.end()) return nullptr;

  Table_cache_element *const el = found->second.get();
  *share = el->share;

  /*
    Read-only statements prefer TABLE objects without fully-loaded triggers,
    which leaves the fully-loaded ones for read-write statements. Read-write
    statements prefer the fully-loaded ones. Either kind falls back to the
    other list, since that still beats constructing a TABLE from scratch
    (for read-write statements trigger loading is finalized later if
    necessary).
  */
  auto &preferred =
      is_update ? el->free_tables_full_triggers : el->free_tables_slim;
  auto &fallback =
      is_update ? el->free_tables_slim : el->free_tables_full_triggers;

  /* pop_front() both fetches the first entry and unlinks it from the list. */
  TABLE *table = preferred.pop_front();
  if (!table) table = fallback.pop_front();
  if (!table) return nullptr;

  assert(!table->in_use);

  /* The table is no longer unused as far as this cache is concerned. */
  unlink_unused_table(table);

  /* Move it to the per-table list of used TABLE objects. */
  el->used_tables.push_front(table);
  table->in_use = thd;

  /* The ex-unused table must be fully functional. */
  assert(table->db_stat && table->file);
  /* The children must be detached from the table. */
  assert(!table->file->ha_extra(HA_EXTRA_IS_ATTACHED_CHILDREN));

  return table;
}
/**
  Return a used TABLE instance to the table cache and mark it as unused.

  @param thd    Thread context, passed on to the eviction logic.
  @param table  TABLE instance which is no longer needed by its user.

  @note Caller should own lock on the table cache.
  @note Sets TABLE::in_use member as side effect.
*/
void Table_cache::release_table(THD *thd, TABLE *table) {
  const uint cache_idx = table_cache_manager.cache_index(this);
  Table_cache_element *el = table->s->cache_element[cache_idx];

  assert_owner();
  assert(table->in_use);
  assert(table->file);
  /* A TABLE of an old share must never end up in the 'unused' list. */
  assert(!table->s->has_old_version());

  table->in_use = nullptr;

  /* Move the TABLE from the per-table used list ... */
  el->used_tables.remove(table);

  /* ... to the per-table free list that matches its trigger state. */
  auto &free_list =
      (table->triggers && table->triggers->has_load_been_finalized())
          ? el->free_tables_full_triggers
          : el->free_tables_slim;
  free_list.push_front(table);

  /* It also becomes the most recently used entry of the per-cache list. */
  link_unused_table(table);

  /*
    Eviction takes the least recently used tables rather than the one just
    released, which keeps the LRU order. In the most common case the call
    below frees nothing.
  */
  free_unused_tables_if_necessary(thd);
}
/**
Construct iterator over all used TABLE objects for the table share.
@note Assumes that caller owns locks on all table caches.
*/
Table_cache_iterator::Table_cache_iterator(const TABLE_SHARE *share_arg)
: share(share_arg), current_cache_index(0), current_table(nullptr) {
table_cache_manager.assert_owner_all();
move_to_next_table();
}
/** Helper that moves iterator to the next used TABLE for the table share. */
void Table_cache_iterator::move_to_next_table() {
for (; current_cache_index < table_cache_instances; ++current_cache_index) {
Table_cache_element *el;
if ((el = share->cache_element[current_cache_index])) {
if ((current_table = el->used_tables.front())) break;
}
}
}
/**
  Return the used TABLE instance the iterator is positioned on and advance
  the iterator to the next one.

  @note Assumes that caller owns locks on all table caches.

  @return The current TABLE, or nullptr once all used TABLE instances for
          the share have been returned.
*/
TABLE *Table_cache_iterator::operator++(int) {
  table_cache_manager.assert_owner_all();

  TABLE *const returned = current_table;
  if (!returned) return returned;

  /* Step within the used list of the cache we are currently positioned in. */
  Table_cache_element::TABLE_list::Iterator it(
      share->cache_element[current_cache_index]->used_tables, current_table);
  current_table = ++it;

  if (!current_table) {
    /* This cache is exhausted; continue with the following caches. */
    ++current_cache_index;
    move_to_next_table();
  }

  return returned;
}
/**
  Restart the iteration: position the iterator again on the first used
  TABLE for the table share, searching from the first table cache.
*/
void Table_cache_iterator::rewind() {
  current_table = nullptr;
  current_cache_index = 0;
  move_to_next_table();
}
#endif /* TABLE_CACHE_INCLUDED */