MySQL 8.4.5
Source Code Documentation
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages Concepts
buf0buf.h
Go to the documentation of this file.
1/*****************************************************************************
2
3Copyright (c) 1995, 2025, Oracle and/or its affiliates.
4
5This program is free software; you can redistribute it and/or modify it under
6the terms of the GNU General Public License, version 2.0, as published by the
7Free Software Foundation.
8
9This program is designed to work with certain software (including
10but not limited to OpenSSL) that is licensed under separate terms,
11as designated in a particular file or component or in included license
12documentation. The authors of MySQL hereby grant you an additional
13permission to link the program and your derivative works with the
14separately licensed software that they have either included with
15the program or referenced in the documentation.
16
17This program is distributed in the hope that it will be useful, but WITHOUT
18ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
19FOR A PARTICULAR PURPOSE. See the GNU General Public License, version 2.0,
20for more details.
21
22You should have received a copy of the GNU General Public License along with
23this program; if not, write to the Free Software Foundation, Inc.,
2451 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
25
26*****************************************************************************/
27
28/** @file include/buf0buf.h
29 The database buffer pool high-level routines
30
31 Created 11/5/1995 Heikki Tuuri
32 *******************************************************/
33
34#ifndef buf0buf_h
35#define buf0buf_h
36
37#include "buf0types.h"
38#include "fil0fil.h"
39#include "hash0hash.h"
40#include "mtr0types.h"
41#include "os0proc.h"
42#include "page0types.h"
43#include "srv0shutdown.h"
44#include "srv0srv.h"
45#include "univ.i"
46#include "ut0byte.h"
47#include "ut0rbt.h"
48
49#include "buf/buf.h"
50
51#include <ostream>
52
53// Forward declaration
54struct fil_addr_t;
55
56/** @name Modes for buf_page_get_gen */
57/** @{ */
58enum class Page_fetch {
59 /** Get always */
60 NORMAL,
61
62 /** Same as NORMAL, but hint that the fetch is part of a large scan.
63 Try not to flood the buffer pool with pages that may not be accessed again
64 any time soon. */
65 SCAN,
66
67 /** get if in pool */
69
70 /** get if in pool, do not make the block young in the LRU list */
72
73 /** get and bufferfix, but set no latch; we have separated this case, because
74 it is error-prone programming not to set a latch, and it should be used with
75 care */
77
78 /** Get the page only if it's in the buffer pool, if not then set a watch on
79 the page. */
81
82 /** Like Page_fetch::NORMAL, but do not mind if the file page has been
83 freed. */
85
86 /** Like Page_fetch::POSSIBLY_FREED, but do not initiate read ahead. */
88};
89/** @} */
90
91/** @name Modes for buf_page_get_known_nowait */
92
93/** @{ */
94enum class Cache_hint {
95 /** Move the block to the start of the LRU list if there is a danger that the
96 block would drift out of the buffer pool*/
97 MAKE_YOUNG = 51,
98
99 /** Preserve the current LRU position of the block. */
100 KEEP_OLD = 52
101};
102
103/** @} */
104
105/** Number of bits to representing a buffer pool ID */
107
108/** The maximum number of buffer pools that can be defined */
110
111/** Maximum number of concurrent buffer pool watches */
112#define BUF_POOL_WATCH_SIZE (srv_n_purge_threads + 1)
113
114/** The maximum number of page_hash locks */
115constexpr ulint MAX_PAGE_HASH_LOCKS = 1024;
116
117/** The buffer pools of the database */
119
120#ifdef UNIV_HOTBACKUP
121/** first block, for --apply-log */
122extern buf_block_t *back_block1;
123/** second block, for page reorganize */
124extern buf_block_t *back_block2;
125#endif /* UNIV_HOTBACKUP */
126
127/** @brief States of a control block
128@see buf_page_t
129
130The enumeration values must be 0..7. */
131enum buf_page_state : uint8_t {
132 /** A sentinel for the buffer pool watch, element of buf_pool->watch[] */
134 /** Contains a clean compressed page */
136 /** Contains a compressed page that is in the buf_pool->flush_list */
138
139 /** Is in the free list; must be after the BUF_BLOCK_ZIP_ constants for
140 compressed-only pages @see buf_block_state_valid() */
142
143 /** When buf_LRU_get_free_block returns a block, it is in this state */
145
146 /** Contains a buffered file page */
148
149 /** Contains some main memory object */
151
152 /** Hash index should be removed before putting to the free list */
155
156const std::unordered_map<buf_page_state, std::string_view> buf_page_state_str{
157 /* First three states are for compression pages and are not states we would
158 get as we scan pages through buffer blocks */
160 {BUF_BLOCK_ZIP_PAGE, ""},
162 {BUF_BLOCK_NOT_USED, "NOT_USED"},
163 {BUF_BLOCK_READY_FOR_USE, "READY_FOR_USE"},
164 {BUF_BLOCK_FILE_PAGE, "FILE_PAGE"},
165 {BUF_BLOCK_MEMORY, "MEMORY"},
166 {BUF_BLOCK_REMOVE_HASH, "REMOVE_HASH"}};
167
168/** This structure defines information we will fetch from each buffer pool. It
169will be used to print table IO stats */
171 /* General buffer pool info */
172
173 /** Buffer Pool ID */
175 /** Buffer Pool size in pages */
177 /** Length of buf_pool->LRU */
179 /** buf_pool->LRU_old_len */
181 /** Length of buf_pool->free list */
183 /** Length of buf_pool->flush_list */
185 /** buf_pool->n_pend_unzip, pages pending decompress */
187 /** buf_pool->n_pend_reads, pages pending read */
189 /** Number of pages pending flush of given type */
190 std::array<size_t, BUF_FLUSH_N_TYPES> n_pending_flush;
191 /** number of pages made young */
193 /** number of pages not made young */
195 /** buf_pool->n_pages_read */
197 /** buf_pool->n_pages_created */
199 /** buf_pool->n_pages_written */
201 /** buf_pool->n_page_gets */
203 /** buf_pool->n_ra_pages_read_rnd, number of pages readahead */
205 /** buf_pool->n_ra_pages_read, number of pages readahead */
207 /** buf_pool->n_ra_pages_evicted, number of readahead pages evicted without
208 access */
210 /** num of buffer pool page gets since last printout */
212
213 /* Buffer pool access stats */
214 double page_made_young_rate; /*!< page made young rate in pages
215 per second */
216 double page_not_made_young_rate; /*!< page not made young rate
217 in pages per second */
218 double pages_read_rate; /*!< num of pages read per second */
219 double pages_created_rate; /*!< num of pages create per second */
220 double pages_written_rate; /*!< num of pages written per second */
221 ulint page_read_delta; /*!< num of pages read since last
222 printout */
223 ulint young_making_delta; /*!< num of pages made young since
224 last printout */
225 ulint not_young_making_delta; /*!< num of pages not make young since
226 last printout */
227
228 /* Statistics about read ahead algorithm. */
229 double pages_readahead_rnd_rate; /*!< random readahead rate in pages per
230 second */
231 double pages_readahead_rate; /*!< readahead rate in pages per
232 second */
233 double pages_evicted_rate; /*!< rate of readahead page evicted
234 without access, in pages per second */
235
236 /* Stats about LRU eviction */
237 ulint unzip_lru_len; /*!< length of buf_pool->unzip_LRU
238 list */
239 /* Counters for LRU policy */
240 ulint io_sum; /*!< buf_LRU_stat_sum.io */
241 ulint io_cur; /*!< buf_LRU_stat_cur.io, num of IO
242 for current interval */
243 ulint unzip_sum; /*!< buf_LRU_stat_sum.unzip */
244 ulint unzip_cur; /*!< buf_LRU_stat_cur.unzip, num
245 pages decompressed in current
246 interval */
247};
248
249/** The occupied bytes of lists in all buffer pools */
251 ulint LRU_bytes; /*!< LRU size in bytes */
252 ulint unzip_LRU_bytes; /*!< unzip_LRU size in bytes */
253 ulint flush_list_bytes; /*!< flush_list size in bytes */
254};
255
256#ifndef UNIV_HOTBACKUP
257/** Creates the buffer pool.
258@param[in] total_size Size of the total pool in bytes.
259@param[in] n_instances Number of buffer pool instances to create.
260@return DB_SUCCESS if success, DB_ERROR if not enough memory or error */
261dberr_t buf_pool_init(ulint total_size, ulint n_instances);
262
263/** Frees the buffer pool at shutdown. This must not be invoked before
264 freeing all mutexes. */
265void buf_pool_free_all();
266
267/** Determines if a block is intended to be withdrawn. The caller must ensure
268that there was a sufficient memory barrier to read curr_size and old_size.
269@param[in] buf_pool buffer pool instance
270@param[in] block pointer to control block
271@retval true if will be withdrawn */
272bool buf_block_will_withdrawn(buf_pool_t *buf_pool, const buf_block_t *block);
273
274/** Determines if a frame is intended to be withdrawn. The caller must ensure
275that there was a sufficient memory barrier to read curr_size and old_size.
276@param[in] buf_pool buffer pool instance
277@param[in] ptr pointer to a frame
278@retval true if will be withdrawn */
279bool buf_frame_will_withdrawn(buf_pool_t *buf_pool, const byte *ptr);
280
281/** This is the thread for resizing buffer pool. It waits for an event and
282when waked up either performs a resizing and sleeps again. */
283void buf_resize_thread();
284
285/** Checks if innobase_should_madvise_buf_pool() value has changed since we've
286last check and if so, then updates buf_pool_should_madvise and calls madvise
287for all chunks in all srv_buf_pool_instances.
288@see buf_pool_should_madvise comment for a longer explanation. */
290
291/** Clears the adaptive hash index on all pages in the buffer pool. */
293
294/** Gets the current size of buffer buf_pool in bytes.
295 @return size in bytes */
296static inline ulint buf_pool_get_curr_size(void);
297/** Gets the current size of buffer buf_pool in frames.
298 @return size in pages */
299static inline ulint buf_pool_get_n_pages(void);
300
301/** @return true if buffer pool resize is in progress. */
303
304#endif /* !UNIV_HOTBACKUP */
305
306/** Gets the smallest oldest_modification lsn among all of the earliest
307added pages in flush lists. In other words - takes the last dirty page
308from each flush list, and calculates minimum oldest_modification among
309all of them. Does not acquire global lock for the whole process, so the
310result might come from inconsistent view on flush lists.
311
312@note Note that because of the relaxed order in each flush list, this
313functions no longer returns the smallest oldest_modification among all
314of the dirty pages. If you wanted to have a safe lsn, which is smaller
315than every oldest_modification, you would need to use another function:
316 buf_pool_get_oldest_modification_lwm().
317
318Returns zero if there were no dirty pages (flush lists were empty).
319
320@return minimum oldest_modification of last pages from flush lists,
321 zero if flush lists were empty */
323
324/** Gets a safe low watermark for oldest_modification. It's guaranteed
325that there were no dirty pages with smaller oldest_modification in the
326whole flush lists.
327
328Returns zero if flush lists were empty, be careful in such case, because
329taking the newest lsn is probably not a good idea. If you wanted to rely
330on some lsn in such case, you would need to follow pattern:
331
332 dpa_lsn = log_buffer_dirty_pages_added_up_to_lsn(*log_sys);
333
334 lwm_lsn = buf_pool_get_oldest_modification_lwm();
335
336 if (lwm_lsn == 0) lwm_lsn = dpa_lsn;
337
338The order is important to avoid race conditions.
339
340@remarks
341It's guaranteed that the returned value will not be smaller than the
342last checkpoint lsn. It's not guaranteed that the returned value is
343the maximum possible. It's just the best effort for the low cost.
344It basically takes result of buf_pool_get_oldest_modification_approx()
345and subtracts maximum possible lag introduced by relaxed order in
346flush lists (srv_log_recent_closed_size).
347
348@return safe low watermark for oldest_modification of dirty pages,
349 or zero if flush lists were empty; if non-zero, it is then
350 guaranteed not to be at block boundary (and it points to lsn
351 inside data fragment of block) */
353
354#ifndef UNIV_HOTBACKUP
355
356/** Allocates a buf_page_t descriptor. This function must succeed. In case
357 of failure we assert in this function. */
359 MY_ATTRIBUTE((malloc));
360
361/** Free a buf_page_t descriptor.
362@param[in] bpage bpage descriptor to free */
364
365/** Allocates a buffer block.
366 @return own: the allocated block, in state BUF_BLOCK_MEMORY */
368 buf_pool_t *buf_pool); /*!< in: buffer pool instance,
369 or NULL for round-robin selection
370 of the buffer pool */
371/** Frees a buffer block which does not contain a file page. */
372static inline void buf_block_free(
373 buf_block_t *block); /*!< in, own: block to be freed */
374#endif /* !UNIV_HOTBACKUP */
375
376/** Copies contents of a buffer frame to a given buffer.
377@param[in] buf buffer to copy to
378@param[in] frame buffer frame
379@return buf */
380static inline byte *buf_frame_copy(byte *buf, const buf_frame_t *frame);
381
382#ifndef UNIV_HOTBACKUP
383/** This is the general function used to get optimistic access to a database
384page.
385@param[in] rw_latch RW_S_LATCH, RW_X_LATCH
386@param[in,out] block Guessed block
387@param[in] modify_clock Modify clock value
388@param[in] fetch_mode Fetch mode
389@param[in] file File name
390@param[in] line Line where called
391@param[in,out] mtr Mini-transaction
392@return true if success */
393bool buf_page_optimistic_get(ulint rw_latch, buf_block_t *block,
394 uint64_t modify_clock, Page_fetch fetch_mode,
395 const char *file, ulint line, mtr_t *mtr);
396
397/** This is used to get access to a known database page, when no waiting can be
398done.
399@param[in] rw_latch RW_S_LATCH or RW_X_LATCH.
400@param[in] block The known page.
401@param[in] hint Cache_hint::MAKE_YOUNG or Cache_hint::KEEP_OLD
402@param[in] file File name from where it was called.
403@param[in] line Line from where it was called.
404@param[in,out] mtr Mini-transaction covering the fetch
405@return true if success */
406bool buf_page_get_known_nowait(ulint rw_latch, buf_block_t *block,
407 Cache_hint hint, const char *file, ulint line,
408 mtr_t *mtr);
409
410/** Given a tablespace id and page number tries to get that page. If the
411page is not in the buffer pool it is not loaded and NULL is returned.
412Suitable for using when holding the lock_sys latches (as it avoids deadlock).
413@param[in] page_id page Id
414@param[in] location Location where called
415@param[in] mtr Mini-transaction
416@return pointer to a page or NULL */
417const buf_block_t *buf_page_try_get(const page_id_t &page_id,
418 ut::Location location, mtr_t *mtr);
419
420/** Get read access to a compressed page (usually of type
421FIL_PAGE_TYPE_ZBLOB or FIL_PAGE_TYPE_ZBLOB2).
422The page must be released with buf_page_release_zip().
423NOTE: the page is not protected by any latch. Mutual exclusion has to
424be implemented at a higher level. In other words, all possible
425accesses to a given page through this function must be protected by
426the same set of mutexes or latches.
427@param[in] page_id page id
428@param[in] page_size page size
429@return pointer to the block */
431 const page_size_t &page_size);
432
433/** This is the general function used to get access to a database page.
434@param[in] page_id Page id
435@param[in] page_size Page size
436@param[in] rw_latch RW_S_LATCH, RW_X_LATCH, RW_NO_LATCH
437@param[in] guess Guessed block or NULL
438@param[in] mode Fetch mode.
439@param[in] location Location from where this method was called.
440@param[in] mtr Mini-transaction
441@param[in] dirty_with_no_latch Mark page as dirty even if page is being
442 pinned without any latch
443@return pointer to the block or NULL */
445 const page_size_t &page_size, ulint rw_latch,
447 ut::Location location, mtr_t *mtr,
448 bool dirty_with_no_latch = false);
449
450/** NOTE! The following macros should be used instead of buf_page_get_gen,
451 to improve debugging. Only values RW_S_LATCH and RW_X_LATCH are allowed
452 in LA! */
454 ulint latch, ut::Location location,
455 mtr_t *mtr) {
456 return buf_page_get_gen(id, size, latch, nullptr, Page_fetch::NORMAL,
457 location, mtr);
458}
459/** Use these macros to bufferfix a page with no latching. Remember not to
460 read the contents of the page unless you know it is safe. Do not modify
461 the contents of the page! We have separated this case, because it is
462 error-prone programming not to set a latch, and it should be used
463 with care. */
465 const page_size_t &size,
466 ut::Location location,
467 mtr_t *mtr) {
469 location, mtr);
470}
471
472/** Initializes a page to the buffer buf_pool. The page is usually not read
473from a file even if it cannot be found in the buffer buf_pool. This is one
474of the functions which perform to a block a state transition NOT_USED =>
475FILE_PAGE (the other is buf_page_get_gen). The page is latched by passed mtr.
476@param[in] page_id Page id
477@param[in] page_size Page size
478@param[in] rw_latch RW_SX_LATCH, RW_X_LATCH
479@param[in] mtr Mini-transaction
480@return pointer to the block, page bufferfixed */
482 const page_size_t &page_size,
483 rw_lock_type_t rw_latch, mtr_t *mtr);
484
485#else /* !UNIV_HOTBACKUP */
486
487/** Inits a page to the buffer buf_pool, for use in mysqlbackup --restore.
488@param[in] page_id page id
489@param[in] page_size page size
490@param[in,out] block block to init */
491void meb_page_init(const page_id_t &page_id, const page_size_t &page_size,
492 buf_block_t *block);
493#endif /* !UNIV_HOTBACKUP */
494
495#ifndef UNIV_HOTBACKUP
496/** Releases a compressed-only page acquired with buf_page_get_zip(). */
497static inline void buf_page_release_zip(
498 buf_page_t *bpage); /*!< in: buffer block */
499
500/** Releases a latch, if specified.
501@param[in] block buffer block
502@param[in] rw_latch RW_S_LATCH, RW_X_LATCH, RW_NO_LATCH */
503static inline void buf_page_release_latch(buf_block_t *block, ulint rw_latch);
504
505/** Moves a page to the start of the buffer pool LRU list. This high-level
506function can be used to prevent an important page from slipping out of
507the buffer pool.
508@param[in,out] bpage buffer block of a file page */
510
511/** Moved a page to the end of the buffer pool LRU list so that it can be
512flushed out at the earliest.
513@param[in] bpage buffer block of a file page */
514void buf_page_make_old(buf_page_t *bpage);
515
516/** Returns true if the page can be found in the buffer pool hash table.
517NOTE that it is possible that the page is not yet read from disk,
518though.
519@param[in] page_id page id
520@return true if found in the page hash table */
521static inline bool buf_page_peek(const page_id_t &page_id);
522
523#ifdef UNIV_DEBUG
524
525/** Sets file_page_was_freed true if the page is found in the buffer pool.
526This function should be called when we free a file page and want the
527debug version to check that it is not accessed any more unless
528reallocated.
529@param[in] page_id page id
530@return control block if found in page hash table, otherwise NULL */
532
533/** Sets file_page_was_freed false if the page is found in the buffer pool.
534This function should be called when we free a file page and want the
535debug version to check that it is not accessed any more unless
536reallocated.
537@param[in] page_id page id
538@return control block if found in page hash table, otherwise NULL */
540
541#endif /* UNIV_DEBUG */
542/** Reads the freed_page_clock of a buffer block.
543 @return freed_page_clock */
544[[nodiscard]] static inline ulint buf_page_get_freed_page_clock(
545 const buf_page_t *bpage); /*!< in: block */
546/** Reads the freed_page_clock of a buffer block.
547 @return freed_page_clock */
548[[nodiscard]] static inline ulint buf_block_get_freed_page_clock(
549 const buf_block_t *block); /*!< in: block */
550
551/** Tells, for heuristics, if a block is still close enough to the MRU end of
552the LRU list meaning that it is not in danger of getting evicted and also
553implying that it has been accessed recently.
554The page must be either buffer-fixed, either its page hash must be locked.
555@param[in] bpage block
556@return true if block is close to MRU end of LRU */
557static inline bool buf_page_peek_if_young(const buf_page_t *bpage);
558
559/** Recommends a move of a block to the start of the LRU list if there is
560danger of dropping from the buffer pool.
561NOTE: does not reserve the LRU list mutex.
562@param[in] bpage block to make younger
563@return true if should be made younger */
564static inline bool buf_page_peek_if_too_old(const buf_page_t *bpage);
565
566/** Gets the youngest modification log sequence number for a frame.
567 Returns zero if not file page or no modification occurred yet.
568 @return newest modification to page */
570 const buf_page_t *bpage); /*!< in: block containing the
571 page frame */
572
573/** Increment the modify clock.
574The caller must
575(1) own the buf_pool->mutex and block bufferfix count has to be zero,
576(2) own X or SX latch on the block->lock, or
577(3) operate on a thread-private temporary table
578@param[in,out] block buffer block */
579static inline void buf_block_modify_clock_inc(buf_block_t *block);
580
581/** Increments the bufferfix count.
582@param[in] location location
583@param[in,out] block block to bufferfix */
585 buf_block_t *block);
586
587/** Increments the bufferfix count.
588@param[in,out] bpage block to bufferfix
589@return the count */
590static inline ulint buf_block_fix(buf_page_t *bpage);
591
592/** Increments the bufferfix count.
593@param[in,out] block block to bufferfix
594@return the count */
595static inline ulint buf_block_fix(buf_block_t *block);
596
597/** Decrements the bufferfix count.
598@param[in,out] bpage block to bufferunfix
599@return the remaining buffer-fix count */
600static inline ulint buf_block_unfix(buf_page_t *bpage);
601
602/** Decrements the bufferfix count.
603@param[in,out] block block to bufferunfix
604@return the remaining buffer-fix count */
605static inline ulint buf_block_unfix(buf_block_t *block);
606
607/** Unfixes the page, unlatches the page,
608removes it from page_hash and removes it from LRU.
609@param[in,out] bpage pointer to the block */
611
612/** Increments the bufferfix count.
613@param[in,out] b block to bufferfix
614@param[in] l location where requested */
616 ut::Location l [[maybe_unused]]) {
618}
619#else /* !UNIV_HOTBACKUP */
620static inline void buf_block_modify_clock_inc(buf_block_t *block) {}
621#endif /* !UNIV_HOTBACKUP */
622
623#ifndef UNIV_HOTBACKUP
624
625/** Gets the space id, page offset, and byte offset within page of a pointer
626pointing to a buffer frame containing a file page.
627@param[in] ptr pointer to a buffer frame
628@param[out] space space id
629@param[out] addr page offset and byte offset */
630static inline void buf_ptr_get_fsp_addr(const void *ptr, space_id_t *space,
631 fil_addr_t *addr);
632
633#ifdef UNIV_DEBUG
634/** Finds a block in the buffer pool that points to a
635given compressed page. Used only to confirm that buffer pool does not contain a
636given pointer, thus protected by zip_free_mutex.
637@param[in] buf_pool buffer pool instance
638@param[in] data pointer to compressed page
639@return buffer block pointing to the compressed page, or NULL */
640buf_block_t *buf_pool_contains_zip(buf_pool_t *buf_pool, const void *data);
641#endif /* UNIV_DEBUG */
642
643/***********************************************************************
644FIXME_FTS: Gets the frame the pointer is pointing to. */
646 /* out: pointer to frame */
647 byte *ptr); /* in: pointer to a frame */
648
649#if defined UNIV_DEBUG || defined UNIV_BUF_DEBUG
650/** Validates the buffer pool data structure.
651 @return true */
652bool buf_validate(void);
653#endif /* UNIV_DEBUG || UNIV_BUF_DEBUG */
654#if defined UNIV_DEBUG_PRINT || defined UNIV_DEBUG || defined UNIV_BUF_DEBUG
655/** Prints info of the buffer pool data structure. */
656void buf_print(void);
657#endif /* UNIV_DEBUG_PRINT || UNIV_DEBUG || UNIV_BUF_DEBUG */
658#endif /* !UNIV_HOTBACKUP */
660 /** Do not crash at the end of buf_page_print(). */
662 /** Do not print the full page dump. */
665
666/** Prints a page to stderr.
667@param[in] read_buf a database page
668@param[in] page_size page size
669@param[in] flags 0 or BUF_PAGE_PRINT_NO_CRASH or
670BUF_PAGE_PRINT_NO_FULL */
671void buf_page_print(const byte *read_buf, const page_size_t &page_size,
672 ulint flags);
673
674/** Decompress a block.
675 @return true if successful */
676bool buf_zip_decompress(buf_block_t *block, /*!< in/out: block */
677 bool check); /*!< in: true=verify the page checksum */
678#ifndef UNIV_HOTBACKUP
679#ifdef UNIV_DEBUG
680/** Returns the number of latched pages in the buffer pool.
681 @return number of latched pages */
683#endif /* UNIV_DEBUG */
684/** Returns the number of pending buf pool read ios.
685 @return number of pending read I/O operations */
687/** Prints info of the buffer i/o. */
688void buf_print_io(FILE *file); /*!< in: file where to print */
689/** Collect buffer pool stats information for a buffer pool. Also
690 record aggregated stats if there are more than one buffer pool
691 in the server */
693 buf_pool_t *buf_pool, /*!< in: buffer pool */
694 ulint pool_id, /*!< in: buffer pool ID */
695 buf_pool_info_t *all_pool_info); /*!< in/out: buffer pool info
696 to fill */
697/** Return the ratio in percents of modified pages in the buffer pool /
698database pages in the buffer pool.
699@return modified page percentage ratio */
700double buf_get_modified_ratio_pct(void);
701/** Refresh the statistics used to print per-second averages. */
703
704/** Assert that all file pages in the buffer are in a replaceable state. */
706
707/** Computes number of pending I/O read operations for the buffer pool.
708@return number of pending i/o reads */
710
711/** Computes number of pending I/O write operations for the buffer pool.
712@return number of pending i/o writes */
714
715/** Waits until there are no pending I/O operations for the buffer pool.
716Keep waiting in loop with sleeps, emitting information every minute.
717This is used to avoid risk of some pending async IO (e.g. enqueued by
718the linear read-ahead), which would involve ibuf merge and create new
719redo records. */
721
722/** Invalidates the file pages in the buffer pool when an archive recovery is
723 completed. All the file pages buffered must be in a replaceable state when
724 this function is called: not latched and not modified. */
725void buf_pool_invalidate(void);
726
727/*========================================================================
728--------------------------- LOWER LEVEL ROUTINES -------------------------
729=========================================================================*/
730
731#ifdef UNIV_DEBUG
732/** Adds latch level info for the rw-lock protecting the buffer frame. This
733should be called in the debug version after a successful latching of a page if
734we know the latching order level of the acquired latch.
735@param[in] block buffer page where we have acquired latch
736@param[in] level latching order level */
737static inline void buf_block_dbg_add_level(buf_block_t *block,
738 latch_level_t level);
739#else /* UNIV_DEBUG */
740#define buf_block_dbg_add_level(block, level) /* nothing */
741#endif /* UNIV_DEBUG */
742
743#endif /* !UNIV_HOTBACKUP */
744
745/** Gets the state of a block.
746 @return state */
748 const buf_page_t *bpage); /*!< in: pointer to the control block */
749/** Gets the state of a block.
750 @return state */
751[[nodiscard]] static inline enum buf_page_state buf_block_get_state(
752 const buf_block_t *block); /*!< in: pointer to the control block */
753
754/** Sets the state of a block.
755@param[in,out] bpage pointer to control block
756@param[in] state state */
757static inline void buf_page_set_state(buf_page_t *bpage,
758 enum buf_page_state state);
759
760/** Sets the state of a block.
761@param[in,out] block pointer to control block
762@param[in] state state */
763static inline void buf_block_set_state(buf_block_t *block,
764 enum buf_page_state state);
765
766/** Determines if a block is mapped to a tablespace.
767 @return true if mapped */
768[[nodiscard]] static inline bool buf_page_in_file(
769 const buf_page_t *bpage); /*!< in: pointer to control block */
770#ifndef UNIV_HOTBACKUP
771/** Determines if a block should be on unzip_LRU list.
772 @return true if block belongs to unzip_LRU */
773[[nodiscard]] static inline bool buf_page_belongs_to_unzip_LRU(
774 const buf_page_t *bpage); /*!< in: pointer to control block */
775
776/** Gets the mutex of a block.
777 @return pointer to mutex protecting bpage */
778[[nodiscard]] static inline BPageMutex *buf_page_get_mutex(
779 const buf_page_t *bpage); /*!< in: pointer to control block */
780
781/** Get the flush type of a page.
782 @return flush type */
783[[nodiscard]] static inline buf_flush_t buf_page_get_flush_type(
784 const buf_page_t *bpage); /*!< in: buffer page */
785
786/** Set the flush type of a page.
787@param[in] bpage buffer page
788@param[in] flush_type flush type */
789static inline void buf_page_set_flush_type(buf_page_t *bpage,
791
792/** Map a block to a file page.
793@param[in,out] block pointer to control block
794@param[in] page_id page id */
795static inline void buf_block_set_file_page(buf_block_t *block,
796 const page_id_t &page_id);
797
798/** Gets the io_fix state of a block.
799 @return io_fix state */
800[[nodiscard]] static inline enum buf_io_fix buf_page_get_io_fix(
801 const buf_page_t *bpage); /*!< in: pointer to the control block */
802/** Gets the io_fix state of a block.
803 @return io_fix state */
804[[nodiscard]] static inline enum buf_io_fix buf_block_get_io_fix(
805 const buf_block_t *block); /*!< in: pointer to the control block */
806
807/** Sets the io_fix state of a block.
808@param[in,out] bpage control block
809@param[in] io_fix io_fix state */
810static inline void buf_page_set_io_fix(buf_page_t *bpage,
811 enum buf_io_fix io_fix);
812
813/** Sets the io_fix state of a block.
814@param[in,out] block control block
815@param[in] io_fix io_fix state */
816static inline void buf_block_set_io_fix(buf_block_t *block,
817 enum buf_io_fix io_fix);
818
819/** Makes a block sticky. A sticky block implies that even after we release
820the buf_pool->LRU_list_mutex and the block->mutex:
821* it cannot be removed from the flush_list
822* the block descriptor cannot be relocated
823* it cannot be removed from the LRU list
824Note that:
825* the block can still change its position in the LRU list
826* the next and previous pointers can change.
827@param[in,out] bpage control block */
828static inline void buf_page_set_sticky(buf_page_t *bpage);
829
830/** Removes stickiness of a block. */
831static inline void buf_page_unset_sticky(
832 buf_page_t *bpage); /*!< in/out: control block */
833/** Determine if a buffer block can be relocated in memory. The block
834 can be dirty, but it must not be I/O-fixed or bufferfixed. */
835[[nodiscard]] static inline bool buf_page_can_relocate(
836 const buf_page_t *bpage); /*!< control block being relocated */
837
838/** Determine if a block has been flagged old.
839@param[in] bpage control block
840@return true if old */
841[[nodiscard]] static inline bool buf_page_is_old(const buf_page_t *bpage);
842
843/** Flag a block old.
844@param[in,out] bpage control block
845@param[in] old old */
846static inline void buf_page_set_old(buf_page_t *bpage, bool old);
847
848/** Determine the time of first access of a block in the buffer pool.
849 @return Time of first access, zero if not accessed
850 */
851[[nodiscard]] static inline std::chrono::steady_clock::time_point
852buf_page_is_accessed(const buf_page_t *bpage); /*!< in: control block */
853/** Flag a block accessed. */
854static inline void buf_page_set_accessed(
855 buf_page_t *bpage); /*!< in/out: control block */
856
857/** Gets the buf_block_t handle of a buffered file block if an uncompressed
858page frame exists, or NULL. page frame exists, or NULL. The caller must hold
859either the appropriate hash lock in any mode, either the LRU list mutex. Note:
860even though bpage is not declared a const we don't update its value. It is safe
861to make this pure.
862@param[in] bpage control block, or NULL
863@return control block, or NULL */
864[[nodiscard]] static inline buf_block_t *buf_page_get_block(buf_page_t *bpage);
865#ifdef UNIV_DEBUG
866/** Gets a pointer to the memory frame of a block.
867 @return pointer to the frame */
868[[nodiscard]] static inline buf_frame_t *buf_block_get_frame(
869 const buf_block_t *block); /*!< in: pointer to the control block */
870#else /* UNIV_DEBUG */
871#define buf_block_get_frame(block) (block)->frame
872#endif /* UNIV_DEBUG */
873#else /* !UNIV_HOTBACKUP */
874#define buf_block_get_frame(block) (block)->frame
875#endif /* !UNIV_HOTBACKUP */
876
877/** Get a buffer block from an adaptive hash index pointer.
878This function does not return if the block is not identified.
879@param[in] ptr pointer to within a page frame
880@return pointer to block, never NULL */
881buf_block_t *buf_block_from_ahi(const byte *ptr);
882
883/** Find out if a block pointer points into one of currently used chunks of
884the buffer pool. This is useful if you stored the pointer some time ago, and
885want to dereference it now, and are afraid that buffer pool resize could free
886the memory pointed by it. Thus calling this function requires holding at least
887one of the latches which prevent freeing memory from buffer pool for the
888duration of the call and until you pin the block in some other way, as otherwise
889the result of this function might be obsolete by the time you dereference the
890block (an s-latch on buf_page_hash_lock_get for any hash cell is enough).
891@param buf_pool The buffer pool instance to search in.
892@param ptr A pointer which you want to check. This function will not
893 dereference it.
894@return true iff `block` points inside one of the chunks of the `buf_pool`
895*/
896bool buf_is_block_in_instance(const buf_pool_t *buf_pool,
897 const buf_block_t *ptr);
898
899#ifndef UNIV_HOTBACKUP
900
901/** Inits a page for read to the buffer buf_pool. If the page is
902(1) already in buf_pool, or
903(2) if we specify to read only ibuf pages and the page is not an ibuf page, or
904(3) if the space is deleted or being deleted,
905then this function does nothing.
906Sets the io_fix flag to BUF_IO_READ and sets a non-recursive exclusive lock
907on the buffer frame. The io-handler must take care that the flag is cleared
908and the lock released later.
909@param[in] mode BUF_READ_IBUF_PAGES_ONLY, ...
910@param[in] page_id page id
911@param[in] page_size page size
912@param[in] unzip true=request uncompressed page
913@return pointer to the block or NULL */
915 const page_size_t &page_size, bool unzip);
916
917/** Completes an asynchronous read or write request of a file page to or from
918the buffer pool.
919@param[in] bpage pointer to the block in question
920@param[in] evict whether or not to evict the page from LRU list
921@param[in] type i/o request type for which this completion routine is
922 called.
923@param[in] node file node in which the disk copy of the page exists.
924@return true if successful */
925bool buf_page_io_complete(buf_page_t *bpage, bool evict,
926 IORequest *type = nullptr,
927 fil_node_t *node = nullptr);
928
929/** Free a stale page. Caller must hold the LRU mutex. Upon successful page
930free the LRU mutex will be released.
931@param[in,out] buf_pool Buffer pool the page belongs to.
932@param[in,out] bpage Page to free.
933@return true if page was freed. */
934bool buf_page_free_stale(buf_pool_t *buf_pool, buf_page_t *bpage) noexcept;
935
936/** Evict a page from the buffer pool.
937@param[in] page_id page to be evicted.
938@param[in] page_size page size of the tablespace.
939@param[in] dirty_is_ok if true, it is OK for the page to be dirty. */
940void buf_page_force_evict(const page_id_t &page_id,
941 const page_size_t &page_size,
942 const bool dirty_is_ok = true) noexcept;
943
944/** Free a stale page. Caller must be holding the hash_lock in S mode if
945hash_lock parameter is not nullptr. The hash lock will be released upon return
946always. Caller must hold the LRU mutex if and only if the hash_lock parameter
947is nullptr. Upon unsuccessful page free the LRU mutex will not be released if
948hash_lock is nullptr.
949@param[in,out] buf_pool Buffer pool the page belongs to.
950@param[in,out] bpage Page to free.
951@param[in,out] hash_lock Hash lock covering the fetch from the hash table if
952latched in S mode. nullptr otherwise.
953@return true if page was freed. */
954bool buf_page_free_stale(buf_pool_t *buf_pool, buf_page_t *bpage,
955 rw_lock_t *hash_lock) noexcept;
956
957/** Free a stale page that is being written. The caller must be within the
958page's write code path.
959@param[in,out] bpage Page to free.
960@param[in] owns_sx_lock SX lock on block->lock is set. */
962 bool owns_sx_lock = false) noexcept;
963
964/** Calculates the index of a buffer pool to the buf_pool[] array.
965 @return the position of the buffer pool in buf_pool[] */
966[[nodiscard]] static inline ulint buf_pool_index(
967 const buf_pool_t *buf_pool); /*!< in: buffer pool */
968/** Returns the buffer pool instance given a page instance
969 @return buf_pool */
971 const buf_page_t *bpage); /*!< in: buffer pool page */
972/** Returns the buffer pool instance given a block instance
973 @return buf_pool */
975 const buf_block_t *block); /*!< in: block */
976
977/** Returns the buffer pool instance given a page id.
978@param[in] page_id page id
979@return buffer pool */
980static inline buf_pool_t *buf_pool_get(const page_id_t &page_id);
981
982/** Returns the buffer pool instance given its array index
983 @return buffer pool */
985 ulint index); /*!< in: array index to get
986 buffer pool instance from */
987
988/** Returns the control block of a file page, NULL if not found.
989@param[in] buf_pool buffer pool instance
990@param[in] page_id page id
991@return block, NULL if not found */
993 const page_id_t &page_id);
994
995/** Returns the control block of a file page, NULL if not found.
996If the block is found and lock is not NULL then the appropriate
997page_hash lock is acquired in the specified lock mode. Otherwise,
998mode value is ignored. It is up to the caller to release the
999lock. If the block is found and the lock is NULL then the page_hash
1000lock is released by this function.
1001@param[in] buf_pool buffer pool instance
1002@param[in] page_id page id
1003@param[in,out] lock lock of the page hash acquired if bpage is
1004found, NULL otherwise. If NULL is passed then the hash_lock is released by
1005this function.
1006@param[in] lock_mode RW_LOCK_X or RW_LOCK_S. Ignored if
1007lock == NULL
1008@param[in] watch if true, return watch sentinel also.
1009@return pointer to the bpage or NULL; if NULL, lock is also NULL or
1010a watch sentinel. */
1012 const page_id_t &page_id,
1013 rw_lock_t **lock,
1015 bool watch = false);
1016
1017/** Returns the control block of a file page, NULL if not found.
1018If the block is found and lock is not NULL then the appropriate
1019page_hash lock is acquired in the specified lock mode. Otherwise,
1020mode value is ignored. It is up to the caller to release the
1021lock. If the block is found and the lock is NULL then the page_hash
1022lock is released by this function.
1023@param[in] buf_pool buffer pool instance
1024@param[in] page_id page id
1025@param[in,out] lock lock of the page hash acquired if bpage is
1026found, NULL otherwise. If NULL is passed then the hash_lock is released by
1027this function.
1028@param[in] lock_mode RW_LOCK_X or RW_LOCK_S. Ignored if
1029lock == NULL
1030@return pointer to the block or NULL; if NULL, lock is also NULL. */
1032 const page_id_t &page_id,
1033 rw_lock_t **lock,
1035
1036/* There are four different ways we can try to get a bpage or block
1037from the page hash:
10381) Caller already holds the appropriate page hash lock: in the case call
1039buf_page_hash_get_low() function.
10402) Caller wants to hold page hash lock in x-mode
10413) Caller wants to hold page hash lock in s-mode
10424) Caller doesn't want to hold page hash lock */
1044 const page_id_t &page_id,
1045 rw_lock_t **l) {
1046 return buf_page_hash_get_locked(b, page_id, l, RW_LOCK_S);
1047}
1049 const page_id_t &page_id,
1050 rw_lock_t **l) {
1051 return buf_page_hash_get_locked(b, page_id, l, RW_LOCK_X);
1052}
1054 return buf_page_hash_get_locked(b, page_id, nullptr, 0);
1055}
1057 const page_id_t &page_id) {
1058 return buf_page_hash_get_locked(b, page_id, nullptr, 0, true);
1059}
1060
1062 const page_id_t &page_id,
1063 rw_lock_t **l) {
1064 return buf_block_hash_get_locked(b, page_id, l, RW_LOCK_S);
1065}
1067 const page_id_t &page_id,
1068 rw_lock_t **l) {
1069 return buf_block_hash_get_locked(b, page_id, l, RW_LOCK_X);
1070}
1072 const page_id_t &page_id) {
1073 return buf_block_hash_get_locked(b, page_id, nullptr, 0);
1074}
1075
1076/** Gets the current length of the free list of buffer blocks.
1077 @return length of the free list */
1079
1080/** Determine if a block is a sentinel for a buffer pool watch.
1081@param[in] buf_pool buffer pool instance
1082@param[in] bpage block
1083@return true if a sentinel for a buffer pool watch, false if not */
1084[[nodiscard]] bool buf_pool_watch_is_sentinel(const buf_pool_t *buf_pool,
1085 const buf_page_t *bpage);
1086
1087/** Stop watching if the page has been read in.
1088buf_pool_watch_set(same_page_id) must have returned NULL before.
1089@param[in] page_id page id */
1090void buf_pool_watch_unset(const page_id_t &page_id);
1091
1092/** Check if the page has been read in.
1093This may only be called after buf_pool_watch_set(same_page_id)
1094has returned NULL and before invoking buf_pool_watch_unset(same_page_id).
1095@param[in] page_id page id
1096@return false if the given page was not read in, true if it was */
1097[[nodiscard]] bool buf_pool_watch_occurred(const page_id_t &page_id);
1098
1099/** Get total buffer pool statistics.
1100@param[out] LRU_len Length of all lru lists
1101@param[out] free_len Length of all free lists
1102@param[out] flush_list_len Length of all flush lists */
1103void buf_get_total_list_len(ulint *LRU_len, ulint *free_len,
1104 ulint *flush_list_len);
1105
1106/** Get total list size in bytes from all buffer pools. */
1108 buf_pools_list_size_t *buf_pools_list_size); /*!< out: list sizes
1109 in all buffer pools */
1110/** Get total buffer pool statistics. */
1112 buf_pool_stat_t *tot_stat); /*!< out: buffer pool stats */
1113
1114/** Get the nth chunk's buffer block in the specified buffer pool.
1115@param[in] buf_pool buffer pool instance
1116@param[in] n nth chunk in the buffer pool
1117@param[in] chunk_size chunk_size
1118@return the nth chunk's buffer block. */
1119static inline buf_block_t *buf_get_nth_chunk_block(const buf_pool_t *buf_pool,
1120 ulint n, ulint *chunk_size);
1121
1122/** Calculate aligned buffer pool size based on srv_buf_pool_chunk_unit,
1123if needed.
1124@param[in] size size in bytes
1125@return aligned size */
1127
1128/** Adjust the proposed chunk unit size so that it satisfies all invariants
1129@param[in] size proposed size of buffer pool chunk unit in bytes
1130@return adjusted size which meets invariants */
1132
1133/** Calculate the checksum of a page from compressed table and update the
1134page.
1135@param[in,out] page page to update
1136@param[in] size compressed page size
1137@param[in] lsn LSN to stamp on the page
1138@param[in] skip_lsn_check true to skip check for lsn (in DEBUG) */
1140 bool skip_lsn_check);
1141
1142/** Return how many more pages must be added to the withdraw list to reach the
1143withdraw target of the currently ongoing buffer pool resize.
1144@param[in] buf_pool buffer pool instance
1145@return page count to be withdrawn or zero if the target is already achieved or
1146if the buffer pool is not currently being resized. */
1147static inline ulint buf_get_withdraw_depth(buf_pool_t *buf_pool);
1148
1149#endif /* !UNIV_HOTBACKUP */
1150
1151/** The common buffer control block structure
1152for compressed and uncompressed frames */
1153
1154/** Number of bits used for buffer page states. */
1155constexpr uint32_t BUF_PAGE_STATE_BITS = 3;
1156
1157template <typename T>
1158class copyable_atomic_t : public std::atomic<T> {
1159 public:
1161 : std::atomic<T>(other.load(std::memory_order_relaxed)) {}
1162};
1163
1166 public:
1167 /** Copy constructor.
1168 @param[in] other Instance to copy from. */
1170 : id(other.id),
1171 size(other.size),
1173 io_fix(other.io_fix),
1174 state(other.state),
1175 flush_type(other.flush_type),
1177#ifndef UNIV_HOTBACKUP
1178 hash(other.hash),
1179#endif /* !UNIV_HOTBACKUP */
1180 list(other.list),
1183 LRU(other.LRU),
1184 zip(other.zip)
1185#ifndef UNIV_HOTBACKUP
1186 ,
1188 m_space(other.m_space),
1190 m_version(other.m_version),
1191 access_time(other.access_time),
1192 m_dblwr_id(other.m_dblwr_id),
1193 old(other.old)
1194#ifdef UNIV_DEBUG
1195 ,
1199 in_LRU_list(other.in_LRU_list),
1202#endif /* UNIV_DEBUG */
1203#endif /* !UNIV_HOTBACKUP */
1204 {
1205#ifndef UNIV_HOTBACKUP
1206 m_space->inc_ref();
1207#endif /* !UNIV_HOTBACKUP */
1208 }
1209
1210 public:
1211 /** Check if the given ptr lies in a memory block of type BUF_BLOCK_MEMORY.
1212 This is checked by looking at the FIL_PAGE_LSN. If the FIL_PAGE_LSN is zero,
1213 then the block state is assumed to be BUF_BLOCK_MEMORY.
1214 @return true if the FIL_PAGE_LSN is zero, false otherwise. */
1215 [[nodiscard]] static bool is_memory(const page_t *const ptr) noexcept;
1216
1217 /** Check if the state of this page is BUF_BLOCK_MEMORY.
1218 @return true if the state is BUF_BLOCK_MEMORY, or false. */
1219 [[nodiscard]] bool is_memory() const noexcept {
1220 return state == BUF_BLOCK_MEMORY;
1221 }
1222
1223#ifndef UNIV_HOTBACKUP
1224 /** Set the doublewrite buffer ID.
1225 @param[in] batch_id Double write batch ID that flushed the page. */
1226 void set_dblwr_batch_id(uint16_t batch_id) { m_dblwr_id = batch_id; }
1227
1228 /** @return the double write batch id, or uint16_t max if undefined. */
1229 [[nodiscard]] uint16_t get_dblwr_batch_id() const { return (m_dblwr_id); }
1230
1231 /** Retrieve the tablespace id.
1232 @return tablespace id */
1233 [[nodiscard]] space_id_t space() const noexcept { return id.space(); }
1234
1235 /** Retrieve the page number.
1236 @return page number */
1237 [[nodiscard]] page_no_t page_no() const noexcept { return id.page_no(); }
1238
1239 /** Checks if this space reference saved during last page ID initialization
1240 was deleted or truncated since.
1241 @return true when space reference stored leads was deleted or truncated and
1242 this page should be discarded. Result is up to date until the fil_shard mutex
1243 is released. */
1244 inline bool is_stale() const {
1245 ut_a(m_space != nullptr);
1246 ut_a(id.space() == m_space->id);
1247 ut_a(m_version <= m_space->get_current_version());
1249 ut_a(!m_space->is_deleted());
1250 return false;
1251 } else {
1252 return true;
1253 }
1254 }
1255
1256 /** Checks if this space reference saved during last page ID initialization
1257 was deleted or truncated since.
1258 @return true when space reference stored leads was deleted or truncated and
1259 this page should be discarded. When false is returned, the status of stale is
1260 checked to be guaranteed. */
1261 inline bool was_stale() const {
1262 ut_a(m_space != nullptr);
1263 ut_a(id.space() == m_space->id);
1264 /* If the the version is OK, then the space must not be deleted.
1265 However, version is modified before the deletion flag is set, so reading
1266 these values need to be executed in reversed order. The atomic reads
1267 cannot be relaxed for it to work. */
1268 bool was_not_deleted = m_space->was_not_deleted();
1270 ut_a(was_not_deleted);
1271 return false;
1272 } else {
1273 return true;
1274 }
1275 }
1276
1277 /** Retrieve the tablespace object if one was available during page ID
1278 initialization. The returned object is safe to use as long as this buf_page_t
1279 object is not changed. Caller should have a IO fix, buffer fix, mutex or any
1280 other mean to assure the page will not be freed. After that is released the
1281 space object may be freed.
1282 @return tablespace object */
1283 inline fil_space_t *get_space() const { return m_space; }
1284
1285 /** Set the stored page id to a new value. This is used only on a buffer
1286 block with BUF_BLOCK_MEMORY state.
1287 @param[in] page_id the new value of the page id. */
1288 void set_page_id(const page_id_t page_id) {
1290 id = page_id;
1291 }
1292
1293 /** Set the page size to a new value. This can be used during initialization
1294 of a newly allocated buffer page.
1295 @param[in] page_size the new value of the page size. */
1296 void set_page_size(const page_size_t &page_size) {
1298 size = page_size;
1299 }
1300
1301 /** Sets stored page ID to the new value. Handles space object reference
1302 count.
1303 @param[in] new_page_id new page ID to be set. */
1304 inline void reset_page_id(page_id_t new_page_id) {
1305 if (m_space != nullptr) {
1306 /* If we reach this line through a call chain:
1307 srv_shutdown -> buf_pool_free_all -> buf_pool_free_instance ->
1308 buf_page_free_descriptor, then we are already past the fil system
1309 shutdown, and all fil_space_t objects were already freed. */
1311 m_space->dec_ref();
1312 }
1313 }
1314 id = new_page_id;
1316 }
1317
1318 /** Sets stored value to invalid/empty value. Handles space object reference
1319 count. */
1320 inline void reset_page_id() {
1322 }
1323
1324 private:
1325 /** Updates new space reference and acquires "reference count latch" and the
1326 current version of the space object. */
1327 inline void space_id_changed() {
1328 m_space = nullptr;
1329 m_version = 0;
1330 if (id.space() != UINT32_UNDEFINED) {
1331 m_space = fil_space_get(id.space());
1332 /* There could be non-existent tablespace while importing it */
1333 if (m_space) {
1334 m_space->inc_ref();
1335 /* We don't have a way to check the MDL locks, which are guarding the
1336 version number, so we don't use get_current_version(). */
1338 }
1339 }
1340 }
1341
1342 public:
1343 /** @return the flush observer instance. */
1345
1346 /** Set the flush observer for the page.
1347 @param[in] flush_observer The flush observer to set. */
1348 void set_flush_observer(Flush_observer *flush_observer) noexcept {
1349 /* Don't allow to set flush observer from non-null to null, or from one
1350 observer to another. */
1351 ut_a(m_flush_observer == nullptr || m_flush_observer == flush_observer);
1352 m_flush_observer = flush_observer;
1353 }
1354
1355 /** Remove the flush observer. */
1356 void reset_flush_observer() noexcept { m_flush_observer = nullptr; }
1357#endif /* !UNIV_HOTBACKUP */
1358
1359 /** @return the LSN of the latest modification. */
1360 lsn_t get_newest_lsn() const noexcept { return newest_modification; }
1361
1362 /** @return the LSN of the first modification since the last time
1363 it was clean. */
1364 lsn_t get_oldest_lsn() const noexcept { return oldest_modification; }
1365
1366 /** @return true if the page is dirty. */
1367 bool is_dirty() const noexcept { return get_oldest_lsn() > 0; }
1368
1369 /** Set the latest modification LSN.
1370 @param[in] lsn Latest modification lSN. */
1372
1373 /** Set the LSN when the page is modified for the first time.
1374 @param[in] lsn First modification LSN. */
1375 void set_oldest_lsn(lsn_t lsn) noexcept;
1376
1377 /** Set page to clean state. */
1378 void set_clean() noexcept { set_oldest_lsn(0); }
1379
1380 /** @name General fields
1381 None of these bit-fields must be modified without holding
1382 buf_page_get_mutex() [buf_block_t::mutex or
1383 buf_pool->zip_mutex], since they can be stored in the same
1384 machine word. */
1385 /** @{ */
1386
1387 /** Page id. */
1389
1390 /** Page size. */
1392
1393 /** Count of how many fold this block is currently bufferfixed. */
1395
1396 private:
1397 /** Type of pending I/O operation.
1398 Modified under protection of buf_page_get_mutex(this).
1399 Read under protection of rules described in @see Buf_io_fix_latching_rules */
1401
1402 public:
1403 /** Checks if io_fix has any of the known enum values.
1404 @param[in] io_fix the value to test
1405 @return true iff io_fix has any of the known enum values
1406 */
1408 switch (io_fix) {
1409 case BUF_IO_NONE:
1410 case BUF_IO_READ:
1411 case BUF_IO_WRITE:
1412 case BUF_IO_PIN:
1413 return true;
1414 }
1415 return false;
1416 }
1417
1418#ifdef UNIV_DEBUG
1419 private:
1420 /** Checks if io_fix has any of the known enum values.
1421 @return true iff io_fix has any of the known enum values
1422 */
1425 }
1426 /* Helper debug-only functions related latching rules are moved to a separate
1427 class so that this header doesn't have to pull in Stateful_latching_rules.*/
1430
1431 /* Helper debug-only class used to track which thread is currently responsible
1432 for performing I/O operation on this page. There's at most one such thread and
1433 the responsibility might be passed from one to another during async I/O. This
1434 is used to prove correctness of io_fix state transitions and checking it
1435 without a latch in the io_completion threads. */
1437 /** The thread responsible for I/O on this page, or an impossible value if
1438 no thread is currently responsible for I/O*/
1439 std::thread::id responsible_thread{std::thread().get_id()};
1440
1441 public:
1442 /** Checks if there is any thread responsible for I/O on this page now.
1443 @return true iff there is a thread responsible for I/O on this page.*/
1445 return responsible_thread != std::thread().get_id();
1446 }
1447
1448 /** Checks if the current thread is responsible for I/O on this page now.
1449 @return true iff the current thread is responsible for I/O on this page.*/
1452 }
1453
1454 /** Called by the thread responsible for I/O on this page to release its
1455 responsibility. */
1456 void release() {
1458 responsible_thread = std::thread().get_id();
1459 }
1460
1461 /** Called by the thread which becomes responsible for I/O on this page to
1462 indicate that it takes the responsibility. */
1463 void take() {
1466 }
1467 };
1468 /** Tracks which thread is responsible for I/O on this page. */
1470
1471 public:
1472 /** Checks if there is any thread responsible for I/O on this page now.
1473 @return true iff there is a thread responsible for I/O on this page.*/
1476 }
1477
1478 /** Checks if the current thread is responsible for I/O on this page now.
1479 @return true iff the current thread is responsible for I/O on this page.*/
1482 }
1483
1484 /** Called by the thread responsible for I/O on this page to release its
1485 responsibility. */
1487
1488 /** Called by the thread which becomes responsible for I/O on this page to
1489 indicate that it takes the responsibility. */
1492 io_fix.load(std::memory_order_relaxed) == BUF_IO_WRITE ||
1493 io_fix.load(std::memory_order_relaxed) == BUF_IO_READ);
1495 }
1496#endif /* UNIV_DEBUG */
1497 private:
1498 /** Retrieves a value of io_fix without requiring or acquiring any latches.
1499 Note that this implies that the value might be stale unless caller establishes
1500 happens-before relation in some other way.
1501 This is a low-level function which shouldn't be used directly, but
1502 rather via wrapper methods which check if proper latches are taken or via one
1503 of the many `was_io_fix_something()` methods with name explicitly warning the
1504 developer about the uncertainty involved.
1505 @return the value of io_fix at some moment "during" the call */
1508 return io_fix.load(std::memory_order_relaxed);
1509 }
1510
1511 public:
1512 /** This is called only when having full ownership of the page object and no
1513 other thread can reach it. This currently happens during buf_pool_create(),
1514 buf_pool_resize() (which latch quite a lot) or from fil_tablespace_iterate()
1515 which creates a fake, private block which is not really a part of the buffer
1516 pool.
1517 Therefore we allow this function to set io_fix without checking for any
1518 latches.
1519 Please use set_io_fix(BUF_IO_NONE) to change state in a regular situation. */
1521 io_fix.store(BUF_IO_NONE, std::memory_order_relaxed);
1522 /* This is only needed because places which call init_io_fix() do not call
1523 buf_page_t's constructor */
1525 }
1526
1527 /** This is called only when having full ownership of the page object and no
1528 other thread can reach it. This currently happens during buf_page_init_low()
1529 under buf_page_get_mutex(this), on a previously initialized page for reuse,
1530 yet should be treated as initialization of the field, not a state transition.
1531 Please use set_io_fix(BUF_IO_NONE) to change state in a regular situation. */
1533 ut_ad(io_fix.load(std::memory_order_relaxed) == BUF_IO_NONE);
1535 io_fix.store(BUF_IO_NONE, std::memory_order_relaxed);
1536 }
1537
1538 /** Sets io_fix to specified value.
1539 Assumes the caller holds buf_page_get_mutex(this).
1540 Might require additional latches depending on particular state transition.
1541 Calls take_io_responsibility() or release_io_responsibility() as needed.
1542 @see Buf_io_fix_latching_rules for specific rules. */
1544
1545 /** Retrieves the current value of io_fix.
1546 Assumes the caller holds buf_page_get_mutex(this).
1547 @return the current value of io_fix */
1550 return get_io_fix_snapshot();
1551 }
1552
1553 /** Checks if the current value of io_fix is BUF_IO_WRITE.
1554 Assumes the caller holds buf_page_get_mutex(this) or some other latches which
1555 prevent state transition from/to BUF_IO_WRITE.
1556 @see Buf_io_fix_latching_rules for specific rules.
1557 @return true iff the current value of io_fix == BUF_IO_WRITE */
1558 bool is_io_fix_write() const;
1559
1560 /** Checks if the current value of io_fix is BUF_IO_READ.
1561 Assumes the caller holds buf_page_get_mutex(this) or some other latches which
1562 prevent state transition from/to BUF_IO_READ.
1563 @see Buf_io_fix_latching_rules for specific rules.
1564 @return true iff the current value of io_fix == BUF_IO_READ */
1565 bool is_io_fix_read() const;
1566
1567 /** Assuming that io_fix is either BUF_IO_READ or BUF_IO_WRITE determines
1568 which of the two it is. Additionally it assumes the caller holds
1569 buf_page_get_mutex(this) or some other latches which prevent state transition
1570 from BUF_IO_READ or from BUF_IO_WRITE to another state.
1571 @see Buf_io_fix_latching_rules for specific rules.
1572 @return true iff the current value of io_fix == BUF_IO_READ */
1574
1575 /** Checks if io_fix is BUF_IO_READ without requiring or acquiring any
1576 latches.
1577 Note that this implies calling this function twice in a row could produce
1578 different results.
1579 @return true iff io_fix equal to BUF_IO_READ was noticed*/
1581
1582 /** Checks if io_fix is BUF_IO_FIX or BUF_IO_READ or BUF_IO_WRITE without
1583 requiring or acquiring any latches.
1584 Note that this implies calling this function twice in a row could produce
1585 different results.
1586 @return true iff io_fix not equal to BUF_IO_NONE was noticed */
1587 bool was_io_fixed() const { return get_io_fix_snapshot() != BUF_IO_NONE; }
1588
1589 /** Checks if io_fix is BUF_IO_NONE without requiring or acquiring any
1590 latches.
1591 Note that this implies calling this function twice in a row could produce
1592 different results.
1593 Please, prefer this function over !was_io_fixed() to avoid the misleading
1594 interpretation as "not(Exists time such that io_fix(time))", while in fact we
1595 want and get "Exists time such that !io_fix(time)".
1596 @return true iff io_fix equal to BUF_IO_NONE was noticed */
1598
1599 /** Block state. @see buf_page_in_file */
1601
1602 /** If this block is currently being flushed to disk, this tells
1603 the flush_type. @see buf_flush_t */
1605
1606 /** Index number of the buffer pool that this block belongs to */
1608
1609 static_assert(MAX_BUFFER_POOLS <= 64,
1610 "MAX_BUFFER_POOLS > 64; redefine buf_pool_index");
1611
1612 /** @} */
1613#ifndef UNIV_HOTBACKUP
1614 /** Node used in chaining to buf_pool->page_hash or buf_pool->zip_hash */
1616#endif /* !UNIV_HOTBACKUP */
1617
1618 /** @name Page flushing fields
1619 All these are protected by buf_pool->mutex. */
1620 /** @{ */
1621
1622 /** Based on state, this is a list node, protected by the corresponding list
1623 mutex, in one of the following lists in buf_pool:
1624
1625 - BUF_BLOCK_NOT_USED: free, withdraw
1626 - BUF_BLOCK_FILE_PAGE: flush_list
1627 - BUF_BLOCK_ZIP_DIRTY: flush_list
1628 - BUF_BLOCK_ZIP_PAGE: zip_clean
1629
1630 The node pointers are protected by the corresponding list mutex.
1631
1632 The contents of the list node is undefined if !in_flush_list &&
1633 state == BUF_BLOCK_FILE_PAGE, or if state is one of
1634 BUF_BLOCK_MEMORY,
1635 BUF_BLOCK_REMOVE_HASH or
1636 BUF_BLOCK_READY_IN_USE. */
1637
1639
1640 private:
1641 /** The flush LSN, LSN when this page was written to the redo log. For
1642 non redo logged pages this is set using: buf_flush_borrow_lsn() */
1644
1645 /** log sequence number of the youngest modification to this block, zero
1646 if not modified. Protected by block mutex */
1648
1649 public:
1650 /** log sequence number of the START of the log entry written of the oldest
1651 modification to this block which has not yet been flushed on disk; zero if
1652 all modifications are on disk. Writes to this field must be covered by both
1653 block->mutex and buf_pool->flush_list_mutex. Hence reads can happen while
1654 holding any one of the two mutexes */
1655 /** @} */
1656
1657 /** @name LRU replacement algorithm fields
1658 These fields are protected by both buf_pool->LRU_list_mutex and the
1659 block mutex. */
1660 /** @{ */
1661
1662 /** node of the LRU list */
1664
1665 /** compressed page; zip.data (but not the data it points to) is
1666 protected by buf_pool->zip_mutex; state == BUF_BLOCK_ZIP_PAGE and
1667 zip.data == NULL means an active buf_pool->watch */
1669
1670#ifndef UNIV_HOTBACKUP
1671 /** Flush observer instance. */
1673
1674 /** Tablespace instance that this page belongs to. */
1676
1677 /** The value of buf_pool->freed_page_clock when this block was the last
1678 time put to the head of the LRU list; a thread is allowed to read this
1679 for heuristic purposes without holding any mutex or latch */
1681
1682 /** @} */
1683 /** Version of fil_space_t when the page was updated. It can also be viewed as
1684 the truncation number. */
1685 uint32_t m_version{};
1686
1687 /** Time of first access, or 0 if the block was never accessed in the
1688 buffer pool. Protected by block mutex */
1689 std::chrono::steady_clock::time_point access_time;
1690
1691 private:
1692 /** Double write instance ordinal value during writes. This is used
1693 by IO completion (writes) to select the double write instance.*/
1694 uint16_t m_dblwr_id{};
1695
1696 public:
1697 /** true if the block is in the old blocks in buf_pool->LRU_old */
1698 bool old;
1699
1700#ifdef UNIV_DEBUG
1701 /** This is set to true when fsp frees a page in buffer pool;
1702 protected by buf_pool->zip_mutex or buf_block_t::mutex. */
1704
1705 /** true if in buf_pool->flush_list; when buf_pool->flush_list_mutex
1706 is free, the following should hold:
1707 in_flush_list == (state == BUF_BLOCK_FILE_PAGE ||
1708 state == BUF_BLOCK_ZIP_DIRTY)
1709 Writes to this field must be covered by both buf_pool->flush_list_mutex
1710 and block->mutex. Hence reads can happen while holding any one of the
1711 two mutexes */
1713
1714 /** true if in buf_pool->free; when buf_pool->free_list_mutex is free, the
1715 following should hold: in_free_list == (state == BUF_BLOCK_NOT_USED) */
1717
1718 /** true if the page is in the LRU list; used in debugging */
1720
1721 /** true if in buf_pool->page_hash */
1723
1724 /** true if in buf_pool->zip_hash */
1726#endif /* UNIV_DEBUG */
1727
1728 /** Print page metadata in JSON format {"key":"value"}. Asserts that caller
1729 holds page mutex and page if file page
1730 @param[in,out] outs the output stream
1731 @param[in] page the page whose metadata needs to be printed
1732 @return same output stream */
1733 friend std::ostream &operator<<(std::ostream &outs, const buf_page_t &page);
1734#endif /* !UNIV_HOTBACKUP */
1735};
1736
1737/** Structure used by AHI to contain information on record prefixes to be
1738considered in hash index subsystem. It is meant for using as a single 64bit
1739atomic value, thus it needs to be aligned properly. */
1740struct alignas(alignof(uint64_t)) btr_search_prefix_info_t {
1741 /** recommended prefix: number of bytes in an incomplete field
1742 @see BTR_PAGE_MAX_REC_SIZE */
1743 uint32_t n_bytes;
1744 /** recommended prefix length for hash search: number of full fields */
1745 uint16_t n_fields;
1746 /** true or false, depending on whether the leftmost record of several records
1747 with the same prefix should be indexed in the hash index */
1749
1751 return n_bytes == other.n_bytes && n_fields == other.n_fields;
1752 }
1753
1754 bool operator==(const btr_search_prefix_info_t &other) const {
1755 return n_bytes == other.n_bytes && n_fields == other.n_fields &&
1756 left_side == other.left_side;
1757 }
1758
1759 bool operator!=(const btr_search_prefix_info_t &other) const {
1760 return !(*this == other);
1761 }
1762};
1763
1764/** The buffer control block structure */
1766 /** @name General fields */
1767 /** @{ */
1768
1769 /** page information; this must be the first field, so
1770 that buf_pool->page_hash can point to buf_page_t or buf_block_t */
1772
1773#ifndef UNIV_HOTBACKUP
1774 /** read-write lock of the buffer frame */
1776
1777#ifdef UNIV_DEBUG
1778 /** Check if the buffer block was freed.
1779 @return true if the block was freed, false otherwise. */
1780 bool was_freed() const { return page.file_page_was_freed; }
1781#endif /* UNIV_DEBUG */
1782
1783#endif /* UNIV_HOTBACKUP */
1784
1785 /** pointer to buffer frame which is of size UNIV_PAGE_SIZE, and aligned
1786 to an address divisible by UNIV_PAGE_SIZE */
1787 byte *frame;
1788
1789 /** node of the decompressed LRU list; a block is in the unzip_LRU list if
1790 page.state == BUF_BLOCK_FILE_PAGE and page.zip.data != NULL. Protected by
1791 both LRU_list_mutex and the block mutex. */
1793#ifdef UNIV_DEBUG
1794 /** true if the page is in the decompressed LRU list; used in debugging */
1796
1798#endif /* UNIV_DEBUG */
1799
1800 /** @} */
1801
1802 /** Structure that holds most AHI-related fields. */
1803 struct ahi_t {
1804 public:
1805 /** Recommended prefix info for hash search. It is atomically copied
1806 from the index's current recommendation for the prefix info and should
1807 eventually get to the block's actual prefix info used. It is used to decide
1808 when the n_hash_helps should be reset. It is modified only while having S-
1809 or X- latch on block's lock. */
1810 std::atomic<btr_search_prefix_info_t> recommended_prefix_info;
1811 /** Prefix info that was used for building hash index. It cannot be modified
1812 while there are any record entries added in the AHI. It's invariant that all
1813 records added to AHI from this block were folded using this prefix info. It
1814 may only be modified when we are holding the appropriate X-latch in
1815 btr_search_sys->parts[]->latch. Also, it happens that it is modified
1816 to not-empty value only when the block is held in private or the block's
1817 lock is S- or X-latched. This implies that the field's non-empty value may
1818 be read and use reliably when the appropriate
1819 btr_search_sys->parts[]->latch S-latch or X-latch is being held, or
1820 the block's lock is X-latched. */
1821 std::atomic<btr_search_prefix_info_t> prefix_info;
1822 static_assert(decltype(prefix_info)::is_always_lock_free);
1823
1824 /** Index for which the adaptive hash index has been created, or nullptr if
1825 the page does not exist in the index. Note that it does not guarantee that
1826 the AHI index is complete, though: there may have been hash collisions etc.
1827 It may be modified:
1828 - to nullptr if btr_search_enabled is false and block's mutex is held and
1829 block's state is BUF_BLOCK_FILE_PAGE and btr_search_enabled_mutex is
1830 owned, protecting the btr_search_enabled from being changed,
1831 - to nullptr if btr_search_enabled is false and block is held in private in
1832 BUF_BLOCK_REMOVE_HASH state in buf_LRU_free_page().
1833 - to any value under appropriate X-latch in btr_search_sys->parts[]->latch
1834 if btr_search_enabled is true (and setting btr_search_enabled to false in
1835 turn is protected by having all btr_search_sys->parts[]->latch X-latched).
1836 */
1837 std::atomic<dict_index_t *> index;
1838
1839#if defined UNIV_AHI_DEBUG || defined UNIV_DEBUG
1840 /** Used in debugging. The number of pointers in the adaptive hash index
1841 pointing to this frame; Modified under appropriate X-latch in
1842 btr_search_sys->parts[]->latch. */
1843 std::atomic<uint16_t> n_pointers;
1844
1845 inline void validate() const {
1846 /* These fields are read without holding any AHI latches. Adding or
1847 removing a block from AHI requires having only an appropriate AHI part
1848 X-latched. If we have at least S-latched the correct AHI part (for which
1849 we would need at least S-latch on block for the block's index to not be
1850 changed in meantime) this check is certain. If we don't have necessary AHI
1851 latches, then:
1852 - it can't happen that the check fails while the block is removed from
1853 AHI. Both btr_search_drop_page_hash_index() and
1854 buf_pool_clear_hash_index() will first make the n_pointers be 0 and then
1855 set index to nullptr. As the index is an atomic variable, so if we
1856 synchronize with a reset to nullptr which is sequenced after the reset of
1857 n_pointers, we should see the n_pointers set to 0 here.
1858 - it can happen that the check fails while the block is added to the AHI
1859 right after we read the index is nullptr. In such case, if the n_pointers
1860 is not 0, we double check the index member. It can still be nullptr, if
1861 the block is removed after reading the n_pointers, but that should be near
1862 impossible. */
1863 ut_a(this->index.load() != nullptr || this->n_pointers.load() == 0 ||
1864 this->index.load() != nullptr);
1865 }
1866
1867 inline void assert_empty() const { ut_a(this->n_pointers.load() == 0); }
1868
1869 inline void assert_empty_on_init() const {
1870 UNIV_MEM_VALID(&this->n_pointers, sizeof(this->n_pointers));
1871 assert_empty();
1872 }
1873#else
1874 inline void validate() const {}
1875
1876 inline void assert_empty() const {}
1877
1878 inline void assert_empty_on_init() const {}
1879#endif /* UNIV_AHI_DEBUG || UNIV_DEBUG */
1881
1882 /** Counter which controls how many times the current prefix recommendation
1883 would help in searches. If it is helpful enough, it will be used as the
1884 actual prefix to build hash for this block. It is modified similarly as
1885 recommended_prefix_info, that is only while having S- or X- latch on block's
1886 lock. Because it is modified concurrently, it may not have fully reliable
1887 count, but it is enough for this use case.
1888 Mind the n_hash_helps is AHI-related, and should be in the ahi_t struct above,
1889 but having it outside causes the made_dirty_with_no_latch to occupy the common
1890 8byte aligned 8byte long space, so basically it saves us 8bytes of the object
1891 that is used in high volumes. */
1892 std::atomic<uint32_t> n_hash_helps;
1893 /** true if block has been made dirty without acquiring X/SX latch as the
1894 block belongs to temporary tablespace and block is always accessed by a
1895 single thread. */
1897
1898#ifndef UNIV_HOTBACKUP
1899#ifdef UNIV_DEBUG
1900 /** @name Debug fields */
1901 /** @{ */
1902 /** In the debug version, each thread which bufferfixes the block acquires
1903 an s-latch here; so we can use the debug utilities in sync0rw */
1905 /** @} */
1906#endif /* UNIV_DEBUG */
1907#endif /* !UNIV_HOTBACKUP */
1908
1909 /** @name Optimistic search field */
1910 /** @{ */
1911
1912 /** This clock is incremented every time a pointer to a record on the page
1913 may become obsolete; this is used in the optimistic cursor positioning: if
1914 the modify clock has not changed, we know that the pointer is still valid;
1915 this field may be changed if the thread (1) owns the LRU list mutex and the
1916 page is not bufferfixed, or (2) the thread has an x-latch on the block,
1917 or (3) the block must belong to an intrinsic table */
1919
1920 /** @} */
1921
1922 /** mutex protecting this block: state (also protected by the buffer
1923 pool mutex), io_fix, buf_fix_count, and accessed; we introduce this
1924 new mutex in InnoDB-5.1 to relieve contention on the buffer pool mutex */
1926
1927 /** Get the modified clock (version) value.
1928 @param[in] single_threaded Thread can only be written to or read by a
1929 single thread
1930 @return the modified clock vlue. */
1931 uint64_t get_modify_clock(IF_DEBUG(bool single_threaded)) const noexcept {
1932#if defined(UNIV_DEBUG) && !defined(UNIV_LIBRARY) && !defined(UNIV_HOTBACKUP)
1933 /* No block latch is acquired when blocks access is guaranteed to be
1934 in single threaded mode. */
1936 ut_ad(single_threaded || rw_lock_own_flagged(&lock, mode));
1937#endif /* UNIV_DEBUG && !UNIV_LIBRARY */
1938
1939 return modify_clock;
1940 }
1941
1942 /** Get the page number and space id of the current buffer block.
1943 @return page number of the current buffer block. */
1944 const page_id_t &get_page_id() const { return page.id; }
1945
1946 /** Get the page number of the current buffer block.
1947 @return page number of the current buffer block. */
1948 page_no_t get_page_no() const { return (page.id.page_no()); }
1949
1950 /** Get the next page number of the current buffer block.
1951 @return next page number of the current buffer block. */
1954 }
1955
1956 /** Get the prev page number of the current buffer block.
1957 @return prev page number of the current buffer block. */
1960 }
1961
1962 /** Get the page type of the current buffer block.
1963 @return page type of the current buffer block. */
1966 }
1967
1968#ifndef UNIV_HOTBACKUP
1969 /** Mark the frame with jumbled page_id, while initiating i/o read
1970 (BUF_IO_READ).*/
1972 memset(frame, 0x00, page.size.logical());
1975 }
1976
1977 /** Print control block information in JSON format: {"key":"value"}
1978 @param[in,out] outs the output stream
1979 @param[in] block the control block whose information needs to be printed
1980 @return same output stream */
1981 friend std::ostream &operator<<(std::ostream &outs, const buf_block_t &block);
1982#endif /* UNIV_HOTBACKUP */
1983
1984 uint16_t get_page_level() const;
1985 bool is_leaf() const;
1986 bool is_root() const;
1987 bool is_index_page() const;
1988
1989 /** Check if this index page is empty. An index page is considered empty
1990 if the next record of an infimum record is supremum record. Presence of
1991 del-marked records will make the page non-empty.
1992 @return true if this index page is empty. */
1993 bool is_empty() const;
1994
1995 /** Get the page type of the current buffer block as string.
1996 @return page type of the current buffer block as string. */
1997 [[nodiscard]] const char *get_page_type_str() const noexcept;
1998
1999 /** Gets the compressed page descriptor corresponding to an uncompressed page
2000 if applicable.
2001 @return page descriptor or nullptr. */
2003 return page.zip.data != nullptr ? &page.zip : nullptr;
2004 }
2005
2006 /** Const version.
2007 @return page descriptor or nullptr. */
2008 page_zip_des_t const *get_page_zip() const noexcept {
2009 return page.zip.data != nullptr ? &page.zip : nullptr;
2010 }
2011
2012 [[nodiscard]] bool is_memory() const noexcept { return page.is_memory(); }
2013};
2014
2015inline bool buf_block_t::is_root() const {
2016 return ((get_next_page_no() == FIL_NULL) && (get_prev_page_no() == FIL_NULL));
2017}
2018
2019inline bool buf_block_t::is_leaf() const { return get_page_level() == 0; }
2020
2021inline bool buf_block_t::is_index_page() const {
2022 return get_page_type() == FIL_PAGE_INDEX;
2023}
2024
2025/** Check if a buf_block_t object is in a valid state
2026@param block buffer block
2027@return true if valid */
2029 return buf_block_get_state(block) >= BUF_BLOCK_NOT_USED &&
2031}
2032
2033/** Compute the hash value for blocks in buf_pool->zip_hash. */
2034/** @{ */
2035static inline uint64_t buf_pool_hash_zip_frame(void *ptr) {
2036 return ut::hash_uint64(reinterpret_cast<uintptr_t>(ptr) >>
2038}
2039static inline uint64_t buf_pool_hash_zip(buf_block_t *b) {
2040 return buf_pool_hash_zip_frame(b->frame);
2041}
2042/** @} */
2043
2044/** A "Hazard Pointer" class used to iterate over page lists
2045inside the buffer pool. A hazard pointer is a buf_page_t pointer
2046which we intend to iterate over next and we want it remain valid
2047even after we release the buffer pool mutex. */
2049 public:
2050 /** Constructor
2051 @param buf_pool buffer pool instance
2052 @param mutex mutex that is protecting the hp. */
2053 HazardPointer(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
2054 : m_buf_pool(buf_pool) IF_DEBUG(, m_mutex(mutex)), m_hp() {}
2055
2056 /** Destructor */
2057 virtual ~HazardPointer() = default;
2058
2059 /** Get current value */
2060 buf_page_t *get() const {
2062 return (m_hp);
2063 }
2064
2065 /** Set current value
2066 @param bpage buffer block to be set as hp */
2067 void set(buf_page_t *bpage);
2068
2069 /** Checks if a bpage is the hp
2070 @param bpage buffer block to be compared
2071 @return true if it is hp */
2072 bool is_hp(const buf_page_t *bpage);
2073
2074 /** Adjust the value of hp. This happens when some
2075 other thread working on the same list attempts to
2076 remove the hp from the list. Must be implemented
2077 by the derived classes.
2078 @param bpage buffer block to be compared */
2079 virtual void adjust(const buf_page_t *bpage) = 0;
2080
2081 /** Adjust the value of hp for moving. This happens
2082 when some other thread working on the same list
2083 attempts to relocate the hp of the page.
2084 @param bpage buffer block to be compared
2085 @param dpage buffer block to be moved to */
2086 void move(const buf_page_t *bpage, buf_page_t *dpage);
2087
2088 protected:
2089 /** Disable copying */
2092
2093 /** Buffer pool instance */
2095
2096#ifdef UNIV_DEBUG
2097 /** mutex that protects access to the m_hp. */
2098 const ib_mutex_t *m_mutex;
2099#endif /* UNIV_DEBUG */
2100
2101 /** hazard pointer. */
2103};
2104
2105/** Class implementing buf_pool->flush_list hazard pointer */
2106class FlushHp : public HazardPointer {
2107 public:
2108 /** Constructor
2109 @param buf_pool buffer pool instance
2110 @param mutex mutex that is protecting the hp. */
2111 FlushHp(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
2112 : HazardPointer(buf_pool, mutex) {}
2113
2114 /** Destructor */
2115 ~FlushHp() override = default;
2116
2117 /** Adjust the value of hp. This happens when some
2118 other thread working on the same list attempts to
2119 remove the hp from the list.
2120 @param bpage buffer block to be compared */
2121 void adjust(const buf_page_t *bpage) override;
2122};
2123
2124/** Class implementing buf_pool->LRU hazard pointer */
2125class LRUHp : public HazardPointer {
2126 public:
2127 /** Constructor
2128 @param buf_pool buffer pool instance
2129 @param mutex mutex that is protecting the hp. */
2130 LRUHp(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
2131 : HazardPointer(buf_pool, mutex) {}
2132
2133 /** Destructor */
2134 ~LRUHp() override = default;
2135
2136 /** Adjust the value of hp. This happens when some
2137 other thread working on the same list attempts to
2138 remove the hp from the list.
2139 @param bpage buffer block to be compared */
2140 void adjust(const buf_page_t *bpage) override;
2141};
2142
2143/** Special purpose iterators to be used when scanning the LRU list.
2144The idea is that when one thread finishes the scan it leaves the
2145itr in that position and the other thread can start scan from
2146there */
2147class LRUItr : public LRUHp {
2148 public:
2149 /** Constructor
2150 @param buf_pool buffer pool instance
2151 @param mutex mutex that is protecting the hp. */
2152 LRUItr(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
2153 : LRUHp(buf_pool, mutex) {}
2154
2155 /** Destructor */
2156 ~LRUItr() override = default;
2157
2158 /** Selects from where to start a scan. If we have scanned
2159 too deep into the LRU list it resets the value to the tail
2160 of the LRU list.
2161 @return buf_page_t from where to start scan. */
2162 buf_page_t *start();
2163};
2164
2165/** Struct that is embedded in the free zip blocks */
2167 union {
2168 ulint size; /*!< size of the block */
2170 /*!< stamp[FIL_PAGE_ARCH_LOG_NO_OR_SPACE_ID]
2171 == BUF_BUDDY_FREE_STAMP denotes a free
2172 block. If the space_id field of buddy
2173 block != BUF_BUDDY_FREE_STAMP, the block
2174 is not in any zip_free list. If the
2175 space_id is BUF_BUDDY_FREE_STAMP then
2176 stamp[0] will contain the
2177 buddy block size. */
2179
2180 buf_page_t bpage; /*!< Embedded bpage descriptor */
2182 /*!< Node of zip_free list */
2183};
2184
2185/** @brief The buffer pool statistics structure. */
2188
2189 /** Number of page gets performed; also successful searches through the
2190 adaptive hash index are counted as page gets; this field is NOT protected
2191 by the buffer pool mutex */
2193
2194 /** Number of read operations. */
2195 std::atomic<uint64_t> n_pages_read;
2196
2197 /** Number of write operations. */
2198 std::atomic<uint64_t> n_pages_written;
2199
2200 /** number of pages created in the pool with no read. */
2201 std::atomic<uint64_t> n_pages_created;
2202
2203 /** Number of pages read in as part of random read ahead. */
2204 std::atomic<uint64_t> n_ra_pages_read_rnd;
2205
2206 /** Number of pages read in as part of read ahead. */
2207 std::atomic<uint64_t> n_ra_pages_read;
2208
2209 /** Number of read ahead pages that are evicted without being accessed.
2210 Protected by LRU_list_mutex. */
2212
2213 /** Number of pages made young, in calls to buf_LRU_make_block_young().
2214 Protected by LRU_list_mutex. */
2216
2217 /** Number of pages not made young because the first access was not long
2218 enough ago, in buf_page_peek_if_too_old(). Not protected. */
2220
2221 /** LRU size in bytes. Protected by LRU_list_mutex. */
2222 uint64_t LRU_bytes;
2223
2224 /** Flush_list size in bytes. Protected by flush_list_mutex */
2226
2227 static void copy(buf_pool_stat_t &dst, const buf_pool_stat_t &src) noexcept {
2228 Counter::copy(dst.m_n_page_gets, src.m_n_page_gets);
2229
2230 dst.n_pages_read.store(src.n_pages_read.load());
2231
2232 dst.n_pages_written.store(src.n_pages_written.load());
2233
2234 dst.n_pages_created.store(src.n_pages_created.load());
2235
2236 dst.n_ra_pages_read_rnd.store(src.n_ra_pages_read_rnd.load());
2237
2238 dst.n_ra_pages_read.store(src.n_ra_pages_read.load());
2239
2240 dst.n_ra_pages_evicted = src.n_ra_pages_evicted;
2241
2242 dst.n_pages_made_young = src.n_pages_made_young;
2243
2244 dst.n_pages_not_made_young = src.n_pages_not_made_young;
2245
2246 dst.LRU_bytes = src.LRU_bytes;
2247
2248 dst.flush_list_bytes = src.flush_list_bytes;
2249 }
2250
2251 void reset() {
2253
2254 n_pages_read = 0;
2255 n_pages_written = 0;
2256 n_pages_created = 0;
2258 n_ra_pages_read = 0;
2262 LRU_bytes = 0;
2263 flush_list_bytes = 0;
2264 }
2265};
2266
2267/** Statistics of buddy blocks of a given size. */
2269 /** Number of blocks allocated from the buddy system. */
2270 std::atomic<ulint> used;
2271 /** Number of blocks relocated by the buddy system.
2272 Protected by buf_pool zip_free_mutex. */
2273 uint64_t relocated;
2274 /** Total duration of block relocations.
2275 Protected by buf_pool zip_free_mutex. */
2276 std::chrono::steady_clock::duration relocated_duration;
2277
2278 struct snapshot_t {
2280 uint64_t relocated;
2281 std::chrono::steady_clock::duration relocated_duration;
2282 };
2283
2285 return {used.load(), relocated, relocated_duration};
2286 }
2287};
2288
2289/** @brief The buffer pool structure.
2290
2291NOTE! The definition appears here only for other modules of this
2292directory (buf) to see it. Do not use from outside! */
2293
2295 /** @name General fields */
2296 /** @{ */
2297 /** protects (de)allocation of chunks:
2298 - changes to chunks, n_chunks are performed while holding this latch,
2299 - reading buf_pool_should_madvise requires holding this latch for any
2300 buf_pool_t
2301 - writing to buf_pool_should_madvise requires holding these latches
2302 for all buf_pool_t-s */
2304
2305 /** LRU list mutex */
2307
2308 /** free and withdraw list mutex */
2310
2311 /** buddy allocator mutex */
2313
2314 /** zip_hash mutex */
2316
2317 /** Flush state protection mutex */
2319
2320 /** Zip mutex of this buffer pool instance, protects compressed only pages (of
2321 type buf_page_t, not buf_block_t */
2323
2324 /** Array index of this buffer pool instance */
2326
2327 /** Current pool size in bytes */
2329
2330 /** Reserve this much of the buffer pool for "old" blocks */
2332#ifdef UNIV_DEBUG
2333 /** Number of frames allocated from the buffer pool to the buddy system.
2334 Protected by zip_hash_mutex. */
2336#endif
2337
2338 /** Number of buffer pool chunks */
2339 volatile ulint n_chunks;
2340
2341 /** New number of buffer pool chunks */
2343
2344 /** buffer pool chunks */
2346
2347 /** old buffer pool chunks to be freed after resizing buffer pool */
2349
2350 /** Current pool size in pages */
2352
2353 /** Previous pool size in pages */
2355
2356 /** Size in pages of the area which the read-ahead algorithms read
2357 if invoked */
2359
2360 /** Hash table of buf_page_t or buf_block_t file pages, buf_page_in_file() ==
2361 true, indexed by (space_id, offset). page_hash is protected by an array of
2362 mutexes. */
2364
2365 /** Hash table of buf_block_t blocks whose frames are allocated to the zip
2366 buddy system, indexed by block->frame */
2368
2369 /** Number of pending read operations. Accessed atomically */
2370 std::atomic<ulint> n_pend_reads;
2371
2372 /** number of pending decompressions. Accessed atomically. */
2373 std::atomic<ulint> n_pend_unzip;
2374
2375 /** when buf_print_io was last time called. Accesses not protected. */
2376 std::chrono::steady_clock::time_point last_printout_time;
2377
2378 /** Statistics of buddy system, indexed by block size. Protected by zip_free
2379 mutex, except for the used field, which is also accessed atomically */
2381
2382 /** Current statistics */
2384
2385 /** Old statistics */
2387
2388 /** @} */
2389
2390 /** @name Page flushing algorithm fields */
2391
2392 /** @{ */
2393
2394 /** Mutex protecting the flush list access. This mutex protects flush_list,
2395 flush_rbt and bpage::list pointers when the bpage is on flush_list. It also
2396 protects writes to bpage::oldest_modification and flush_list_hp */
2398
2399 /** "Hazard pointer" used during scan of flush_list while doing flush list
2400 batch. Protected by flush_list_mutex */
2402
2403 /** Entry pointer to scan the oldest page except for system temporary */
2405
2406 /** Base node of the modified block list */
2408
2409 /** This is true when a flush of the given type is being initialized.
2410 Protected by flush_state_mutex. */
2412
2413 /** This is the number of pending writes in the given flush type. Protected
2414 by flush_state_mutex. */
2415 std::array<size_t, BUF_FLUSH_N_TYPES> n_flush;
2416
2417 /** This is in the set state when there is no flush batch of the given type
2418 running. Protected by flush_state_mutex. */
2420
2421 /** A red-black tree is used exclusively during recovery to speed up
2422 insertions in the flush_list. This tree contains blocks in order of
2423 oldest_modification LSN and is kept in sync with the flush_list. Each
2424 member of the tree MUST also be on the flush_list. This tree is relevant
2425 only in recovery and is set to NULL once the recovery is over. Protected
2426 by flush_list_mutex */
2428
2429 /** A sequence number used to count the number of buffer blocks removed from
2430 the end of the LRU list; NOTE that this counter may wrap around at 4
2431 billion! A thread is allowed to read this for heuristic purposes without
2432 holding any mutex or latch. For non-heuristic purposes protected by
2433 LRU_list_mutex */
2435
2436 /** Set to false when an LRU scan for free block fails. This flag is used to
2437 avoid repeated scans of LRU list when we know that there is no free block
2438 available in the scan depth for eviction. Set to true whenever we flush a
2439 batch from the buffer pool. Accessed protected by memory barriers. */
2441
2442 /** Page Tracking start LSN. */
2444
2445 /** Check if the page modifications are tracked.
2446 @return true if page modifications are tracked, false otherwise. */
2447 bool is_tracking() { return track_page_lsn != LSN_MAX; }
2448
2449 /** Maximum LSN for which write io has already started. */
2451
2452 /** @} */
2453
2454 /** @name LRU replacement algorithm fields */
2455 /** @{ */
2456
2457 /** Base node of the free block list */
2459
2460 /** base node of the withdraw block list. It is only used during shrinking
2461 buffer pool size, not to reuse the blocks will be removed. Protected by
2462 free_list_mutex */
2464
2465 /** Target length of withdraw block list, when withdrawing */
2467
2468 /** "hazard pointer" used during scan of LRU while doing
2469 LRU list batch. Protected by buf_pool::LRU_list_mutex */
2471
2472 /** Iterator used to scan the LRU list when searching for
2473 replaceable victim. Protected by buf_pool::LRU_list_mutex. */
2475
2476 /** Iterator used to scan the LRU list when searching for
2477 single page flushing victim. Protected by buf_pool::LRU_list_mutex. */
2479
2480 /** Base node of the LRU list */
2482
2483 /** Pointer to the about LRU_old_ratio/BUF_LRU_OLD_RATIO_DIV oldest blocks in
2484 the LRU list; NULL if LRU length less than BUF_LRU_OLD_MIN_LEN; NOTE: when
2485 LRU_old != NULL, its length should always equal LRU_old_len */
2487
2488 /** Length of the LRU list from the block to which LRU_old points onward,
2489 including that block; see buf0lru.cc for the restrictions on this value; 0
2490 if LRU_old == NULL; NOTE: LRU_old_len must be adjusted whenever LRU_old
2491 shrinks or grows! */
2493
2494 /** Base node of the unzip_LRU list. The list is protected by the
2495 LRU_list_mutex. */
2496 UT_LIST_BASE_NODE_T(buf_block_t, unzip_LRU) unzip_LRU;
2497
2498 /** @} */
2499 /** @name Buddy allocator fields
2500 The buddy allocator is used for allocating compressed page
2501 frames and buf_page_t descriptors of blocks that exist
2502 in the buffer pool only in compressed form. */
2503 /** @{ */
2504#if defined UNIV_DEBUG || defined UNIV_BUF_DEBUG
2505 /** Unmodified compressed pages */
2507#endif /* UNIV_DEBUG || UNIV_BUF_DEBUG */
2508
2509 /** Buddy free lists */
2511
2512 /** Sentinel records for buffer pool watches. Scanning the array is protected
2513 by taking all page_hash latches in X. Updating or reading an individual
2514 watch page is protected by a corresponding individual page_hash latch. */
2516
2517 /** A wrapper for buf_pool_t::allocator.alocate_large which also advices the
2518 OS that this chunk should not be dumped to a core file if that was requested.
2519 Emits a warning to the log and disables @@global.core_file if advising was
2520 requested but could not be performed, but still return true as the allocation
2521 itself succeeded.
2522 @param[in] mem_size number of bytes to allocate
2523 @param[in,out] chunk mem and mem_pfx fields of this chunk will be updated
2524 to contain information about allocated memory region
2525 @return true iff allocated successfully */
2526 bool allocate_chunk(ulonglong mem_size, buf_chunk_t *chunk);
2527
2528 /** A wrapper for buf_pool_t::allocator.deallocate_large which also advices
2529 the OS that this chunk can be dumped to a core file.
2530 Emits a warning to the log and disables @@global.core_file if advising was
2531 requested but could not be performed.
2532 @param[in] chunk mem and mem_pfx fields of this chunk will be used to
2533 locate the memory region to free */
2534 void deallocate_chunk(buf_chunk_t *chunk);
2535
2536 /** Advices the OS that all chunks in this buffer pool instance can be dumped
2537 to a core file.
2538 Emits a warning to the log if could not succeed.
2539 @return true iff succeeded, false if no OS support or failed */
2540 bool madvise_dump();
2541
2542 /** Advices the OS that all chunks in this buffer pool instance should not
2543 be dumped to a core file.
2544 Emits a warning to the log if could not succeed.
2545 @return true iff succeeded, false if no OS support or failed */
2546 bool madvise_dont_dump();
2547
2548 /** Checks if the batch is running, which is basically equivalent to
2549 !os_event_is_set(no_flush[type]) if you hold flush_state_mutex.
2550 It is used as source of truth to know when to set or reset this event.
2551 Caller should hold flush_state_mutex.
2552 @param[in] flush_type The type of the flush we are interested in
2553 @return Should no_flush[type] be in the "unset" state? */
2556 return init_flush[flush_type] || 0 < n_flush[flush_type];
2557 }
2558
2559#ifndef UNIV_HOTBACKUP
2560 /** Executes change() which modifies fields protected by flush_state_mutex.
2561 If it caused a change to is_flushing(flush_type) then it sets or resets the
2562 no_flush[flush_type] to keep it in sync.
2563 @param[in] flush_type The type of the flush this change of state concerns
2564 @param[in] change A callback to execute within flush_state_mutex
2565 */
2566 template <typename F>
2569 const bool was_set = !is_flushing(flush_type);
2571 std::forward<F>(change)();
2572 const bool should_be_set = !is_flushing(flush_type);
2573 if (was_set && !should_be_set) {
2575 } else if (!was_set && should_be_set) {
2577 }
2578 ut_ad(should_be_set == os_event_is_set(no_flush[flush_type]));
2580 }
2581#endif /*! UNIV_HOTBACKUP */
2582
2583 static_assert(BUF_BUDDY_LOW <= UNIV_ZIP_SIZE_MIN,
2584 "BUF_BUDDY_LOW > UNIV_ZIP_SIZE_MIN");
2585 /** @} */
2586};
2587
2588/** Print the given buf_pool_t object.
2589@param[in,out] out the output stream
2590@param[in] buf_pool the buf_pool_t object to be printed
2591@return the output stream */
2592std::ostream &operator<<(std::ostream &out, const buf_pool_t &buf_pool);
2593
2594/** @name Accessors for buffer pool mutexes
2595Use these instead of accessing buffer pool mutexes directly. */
2596/** @{ */
2597
2598#ifndef UNIV_HOTBACKUP
2599/** Test if flush list mutex is owned. */
2600#define buf_flush_list_mutex_own(b) mutex_own(&(b)->flush_list_mutex)
2601
2602/** Acquire the flush list mutex. */
2603#define buf_flush_list_mutex_enter(b) \
2604 do { \
2605 mutex_enter(&(b)->flush_list_mutex); \
2606 } while (0)
2607/** Release the flush list mutex. */
2608#define buf_flush_list_mutex_exit(b) \
2609 do { \
2610 mutex_exit(&(b)->flush_list_mutex); \
2611 } while (0)
2612/** Acquire the block->mutex. */
2613#define buf_page_mutex_enter(b) \
2614 do { \
2615 mutex_enter(&(b)->mutex); \
2616 } while (0)
2617
2618/** Release the block->mutex. */
2619#define buf_page_mutex_exit(b) \
2620 do { \
2621 (b)->mutex.exit(); \
2622 } while (0)
2623
2624/** Get appropriate page_hash_lock. */
2626 const page_id_t page_id) {
2627 return hash_get_lock(buf_pool->page_hash, page_id.hash());
2628}
2629
2630/** If not appropriate page_hash_lock, relock until appropriate. */
2632 const buf_pool_t *buf_pool,
2633 const page_id_t page_id) {
2634 return hash_lock_s_confirm(hash_lock, buf_pool->page_hash, page_id.hash());
2635}
2636
2638 buf_pool_t *buf_pool,
2639 const page_id_t &page_id) {
2640 return hash_lock_x_confirm(hash_lock, buf_pool->page_hash, page_id.hash());
2641}
2642#endif /* !UNIV_HOTBACKUP */
2643
2644#if defined(UNIV_DEBUG) && !defined(UNIV_HOTBACKUP)
2645/** Test if page_hash lock is held in s-mode. */
2647 const buf_page_t *bpage) {
2648 return rw_lock_own(buf_page_hash_lock_get(buf_pool, bpage->id), RW_LOCK_S);
2649}
2650
2651/** Test if page_hash lock is held in x-mode. */
2653 const buf_page_t *bpage) {
2654 return rw_lock_own(buf_page_hash_lock_get((buf_pool), (bpage)->id),
2655 RW_LOCK_X);
2656}
2657
2658/** Test if page_hash lock is held in x or s-mode. */
2659inline bool buf_page_hash_lock_held_s_or_x(const buf_pool_t *buf_pool,
2660 const buf_page_t *bpage) {
2661 return buf_page_hash_lock_held_s(buf_pool, bpage) ||
2662 buf_page_hash_lock_held_x(buf_pool, bpage);
2663}
2664
2665inline bool buf_block_hash_lock_held_s(const buf_pool_t *buf_pool,
2666 const buf_block_t *block) {
2667 return buf_page_hash_lock_held_s(buf_pool, &block->page);
2668}
2669
2670inline bool buf_block_hash_lock_held_x(const buf_pool_t *buf_pool,
2671 const buf_block_t *block) {
2672 return buf_page_hash_lock_held_x(buf_pool, &block->page);
2673}
2674
2676 const buf_block_t *block) {
2677 return buf_page_hash_lock_held_s_or_x(buf_pool, &block->page);
2678}
2679#else /* UNIV_DEBUG && !UNIV_HOTBACKUP */
2680#define buf_page_hash_lock_held_s(b, p) (true)
2681#define buf_page_hash_lock_held_x(b, p) (true)
2682#define buf_page_hash_lock_held_s_or_x(b, p) (true)
2683#define buf_block_hash_lock_held_s(b, p) (true)
2684#define buf_block_hash_lock_held_x(b, p) (true)
2685#define buf_block_hash_lock_held_s_or_x(b, p) (true)
2686#endif /* UNIV_DEBUG && !UNIV_HOTBACKUP */
2687
2688/** @} */
2689
2690/**********************************************************************
2691Let us list the consistency conditions for different control block states.
2692
2693NOT_USED: is in free list, not in LRU list, not in flush list, nor
2694 page hash table
2695READY_FOR_USE: is not in free list, LRU list, or flush list, nor page
2696 hash table
2697MEMORY: is not in free list, LRU list, or flush list, nor page
2698 hash table
2699FILE_PAGE: space and offset are defined, is in page hash table
2700 if io_fix == BUF_IO_WRITE,
2701 pool: no_flush[flush_type] is in reset state,
2702 pool: n_flush[flush_type] > 0
2703
2704 (1) if buf_fix_count == 0, then
2705 is in LRU list, not in free list
2706 is in flush list,
2707 if and only if oldest_modification > 0
2708 is x-locked,
2709 if and only if io_fix == BUF_IO_READ
2710 is s-locked,
2711 if and only if io_fix == BUF_IO_WRITE
2712
2713 (2) if buf_fix_count > 0, then
2714 is not in LRU list, not in free list
2715 is in flush list,
2716 if and only if oldest_modification > 0
2717 if io_fix == BUF_IO_READ,
2718 is x-locked
2719 if io_fix == BUF_IO_WRITE,
2720 is s-locked
2721
2722State transitions:
2723
2724NOT_USED => READY_FOR_USE
2725READY_FOR_USE => MEMORY
2726READY_FOR_USE => FILE_PAGE
2727MEMORY => NOT_USED
2728FILE_PAGE => NOT_USED NOTE: This transition is allowed if and only if
2729 (1) buf_fix_count == 0,
2730 (2) oldest_modification == 0, and
2731 (3) io_fix == 0.
2732*/
2733
2734#if defined UNIV_DEBUG || defined UNIV_BUF_DEBUG
2735#ifndef UNIV_HOTBACKUP
2736/** Functor to validate the LRU list. */
2738 void operator()(const buf_page_t *elem) const { ut_a(elem->in_LRU_list); }
2739
2740 static void validate(const buf_pool_t *buf_pool) {
2741 CheckInLRUList check;
2742 ut_list_validate(buf_pool->LRU, check);
2743 }
2744};
2745
2746/** Functor to validate the LRU list. */
2748 void operator()(const buf_page_t *elem) const { ut_a(elem->in_free_list); }
2749
2750 static void validate(const buf_pool_t *buf_pool) {
2751 CheckInFreeList check;
2752 ut_list_validate(buf_pool->free, check);
2753 }
2754};
2755
2757 void operator()(const buf_block_t *elem) const {
2758 ut_a(elem->page.in_LRU_list);
2759 ut_a(elem->in_unzip_LRU_list);
2760 }
2761
2762 static void validate(const buf_pool_t *buf_pool) {
2764 ut_list_validate(buf_pool->unzip_LRU, check);
2765 }
2766};
2767#endif /* !UNIV_HOTBACKUP */
2768#endif /* UNIV_DEBUG || defined UNIV_BUF_DEBUG */
2769
2770#ifndef UNIV_HOTBACKUP
2771/** Prepare a page before adding to the free list.
2772@param[in,out] bpage Buffer page to prepare for freeing. */
2773inline void buf_page_prepare_for_free(buf_page_t *bpage) noexcept {
2774 bpage->reset_page_id();
2775}
2776#endif /* !UNIV_HOTBACKUP */
2777
2778/** Gets the compressed page descriptor corresponding to an uncompressed
2779page if applicable.
2780@param[in] block Get the zip descriptor for this block. */
2782 return block->get_page_zip();
2783}
2784
2785/** Gets the compressed page descriptor corresponding to an uncompressed
2786page if applicable. Const version.
2787@param[in] block Get the zip descriptor for this block.
2788@return page descriptor or nullptr. */
2790 const buf_block_t *block) noexcept {
2791 return block->get_page_zip();
2792}
2793
2794inline bool buf_page_in_memory(const buf_page_t *bpage) {
2795 switch (buf_page_get_state(bpage)) {
2796 case BUF_BLOCK_MEMORY:
2797 return true;
2798 default:
2799 break;
2800 }
2801 return false;
2802}
2803
2804/** Verify the page contained by the block. If there is page type
2805mismatch then reset it to expected page type. Data files created
2806before MySQL 5.7 GA may contain garbage in the FIL_PAGE_TYPE field.
2807@param[in,out] block block that may possibly have invalid
2808 FIL_PAGE_TYPE
2809@param[in] type Expected page type
2810@param[in,out] mtr Mini-transaction */
2813 mtr_t &mtr) {
2814 byte *page = block.frame;
2815 page_type_t page_type = fil_page_get_type(page);
2816 if (page_type != type) {
2817 const page_id_t &page_id = block.page.id;
2818 fil_page_reset_type(page_id, page, type, &mtr);
2819 }
2820}
2821
2822#include "buf0buf.ic"
2823
2824#endif /* !buf0buf_h */
uint32_t space_id_t
Tablespace identifier.
Definition: api0api.h:48
uint32_t page_no_t
Page number.
Definition: api0api.h:46
Cache_hint
Definition: buf0buf.h:94
@ MAKE_YOUNG
Move the block to the start of the LRU list if there is a danger that the block would drift out of th...
@ KEEP_OLD
Preserve the current LRU position of the block.
static void buf_block_dbg_add_level(buf_block_t *block, latch_level_t level)
Adds latch level info for the rw-lock protecting the buffer frame.
bool buf_block_hash_lock_held_x(const buf_pool_t *buf_pool, const buf_block_t *block)
Definition: buf0buf.h:2670
static buf_block_t * buf_page_get_block(buf_page_t *bpage)
Gets the buf_block_t handle of a buffered file block if an uncompressed page frame exists,...
static bool buf_page_belongs_to_unzip_LRU(const buf_page_t *bpage)
Determines if a block should be on unzip_LRU list.
static bool buf_page_can_relocate(const buf_page_t *bpage)
Determine if a buffer block can be relocated in memory.
buf_page_t * buf_page_get_zip(const page_id_t &page_id, const page_size_t &page_size)
Get read access to a compressed page (usually of type FIL_PAGE_TYPE_ZBLOB or FIL_PAGE_TYPE_ZBLOB2).
Definition: buf0buf.cc:3302
dberr_t buf_pool_init(ulint total_size, ulint n_instances)
Creates the buffer pool.
Definition: buf0buf.cc:1499
void buf_page_print(const byte *read_buf, const page_size_t &page_size, ulint flags)
Prints a page to stderr.
Definition: buf0buf.cc:611
ulint buf_get_n_pending_read_ios(void)
Returns the number of pending buf pool read ios.
Definition: buf0buf.cc:6542
bool buf_page_hash_lock_held_s_or_x(const buf_pool_t *buf_pool, const buf_page_t *bpage)
Test if page_hash lock is held in x or s-mode.
Definition: buf0buf.h:2659
static ulint buf_pool_get_curr_size(void)
Gets the current size of buffer buf_pool in bytes.
ulint buf_page_hash_lock_held_x(const buf_pool_t *buf_pool, const buf_page_t *bpage)
Test if page_hash lock is held in x-mode.
Definition: buf0buf.h:2652
void buf_page_force_evict(const page_id_t &page_id, const page_size_t &page_size, const bool dirty_is_ok=true) noexcept
Evict a page from the buffer pool.
Definition: buf0buf.cc:5419
bool buf_validate(void)
Validates the buffer pool data structure.
Definition: buf0buf.cc:6328
void buf_flush_update_zip_checksum(buf_frame_t *page, ulint size, lsn_t lsn, bool skip_lsn_check)
Calculate the checksum of a page from compressed table and update the page.
Definition: buf0flu.cc:941
static enum buf_page_state buf_block_get_state(const buf_block_t *block)
Gets the state of a block.
static void buf_page_set_state(buf_page_t *bpage, enum buf_page_state state)
Sets the state of a block.
buf_block_t * buf_block_from_ahi(const byte *ptr)
Get a buffer block from an adaptive hash index pointer.
Definition: buf0buf.cc:3512
bool buf_page_io_complete(buf_page_t *bpage, bool evict, IORequest *type=nullptr, fil_node_t *node=nullptr)
Completes an asynchronous read or write request of a file page to or from the buffer pool.
Definition: buf0buf.cc:5780
lsn_t buf_pool_get_oldest_modification_lwm(void)
Gets a safe low watermark for oldest_modification.
Definition: buf0buf.cc:484
bool buf_frame_will_withdrawn(buf_pool_t *buf_pool, const byte *ptr)
Determines if a frame is intended to be withdrawn.
Definition: buf0buf.cc:1875
void buf_pool_update_madvise()
Checks if innobase_should_madvise_buf_pool() value has changed since we've last check and if so,...
Definition: buf0buf.cc:1016
ulonglong buf_pool_adjust_chunk_unit(ulonglong size)
Adjust the proposed chunk unit size so that it satisfies all invariants.
Definition: buf0buf.cc:2144
static buf_page_t * buf_page_hash_get_locked(buf_pool_t *buf_pool, const page_id_t &page_id, rw_lock_t **lock, ulint lock_mode, bool watch=false)
Returns the control block of a file page, NULL if not found.
static enum buf_io_fix buf_page_get_io_fix(const buf_page_t *bpage)
Gets the io_fix state of a block.
static void buf_page_set_io_fix(buf_page_t *bpage, enum buf_io_fix io_fix)
Sets the io_fix state of a block.
buf_page_t * buf_page_set_file_page_was_freed(const page_id_t &page_id)
Sets file_page_was_freed true if the page is found in the buffer pool.
Definition: buf0buf.cc:3215
static void buf_page_set_accessed(buf_page_t *bpage)
Flag a block accessed.
static void buf_block_set_io_fix(buf_block_t *block, enum buf_io_fix io_fix)
Sets the io_fix state of a block.
void buf_page_make_young(buf_page_t *bpage)
Moves a page to the start of the buffer pool LRU list.
Definition: buf0buf.cc:3169
buf_pool_t * buf_pool_ptr
The buffer pools of the database.
Definition: buf0buf.cc:306
void buf_pool_clear_hash_index(void)
Clears the adaptive hash index on all pages in the buffer pool.
Definition: buf0buf.cc:2707
void buf_get_total_stat(buf_pool_stat_t *tot_stat)
Get total buffer pool statistics.
Definition: buf0buf.cc:556
static buf_pool_t * buf_pool_from_bpage(const buf_page_t *bpage)
Returns the buffer pool instance given a page instance.
static buf_flush_t buf_page_get_flush_type(const buf_page_t *bpage)
Get the flush type of a page.
static ulint buf_page_get_freed_page_clock(const buf_page_t *bpage)
Reads the freed_page_clock of a buffer block.
ulint buf_page_hash_lock_held_s(const buf_pool_t *buf_pool, const buf_page_t *bpage)
Test if page_hash lock is held in s-mode.
Definition: buf0buf.h:2646
static std::chrono::steady_clock::time_point buf_page_is_accessed(const buf_page_t *bpage)
Determine the time of first access of a block in the buffer pool.
constexpr ulint MAX_PAGE_HASH_LOCKS
The maximum number of page_hash locks.
Definition: buf0buf.h:115
bool buf_page_optimistic_get(ulint rw_latch, buf_block_t *block, uint64_t modify_clock, Page_fetch fetch_mode, const char *file, ulint line, mtr_t *mtr)
This is the general function used to get optimistic access to a database page.
Definition: buf0buf.cc:4501
void buf_pool_watch_unset(const page_id_t &page_id)
Stop watching if the page has been read in.
Definition: buf0buf.cc:3118
static byte * buf_frame_copy(byte *buf, const buf_frame_t *frame)
Copies contents of a buffer frame to a given buffer.
void buf_assert_all_are_replaceable()
Assert that all file pages in the buffer are in a replaceable state.
Definition: buf0buf.cc:6891
bool buf_pool_watch_occurred(const page_id_t &page_id)
Check if the page has been read in.
Definition: buf0buf.cc:3145
buf_page_t * buf_page_init_for_read(ulint mode, const page_id_t &page_id, const page_size_t &page_size, bool unzip)
Inits a page for read to the buffer buf_pool.
Definition: buf0buf.cc:4865
static bool buf_page_peek_if_young(const buf_page_t *bpage)
Tells, for heuristics, if a block is still close enough to the MRU end of the LRU list meaning that i...
bool buf_page_free_stale(buf_pool_t *buf_pool, buf_page_t *bpage) noexcept
Free a stale page.
Definition: buf0buf.cc:5386
buf_page_t * buf_page_hash_get_x_locked(buf_pool_t *b, const page_id_t &page_id, rw_lock_t **l)
Definition: buf0buf.h:1048
static void buf_page_set_old(buf_page_t *bpage, bool old)
Flag a block old.
size_t buf_pool_pending_io_reads_count()
Computes number of pending I/O read operations for the buffer pool.
Definition: buf0buf.cc:6897
size_t buf_pool_pending_io_writes_count()
Computes number of pending I/O write operations for the buffer pool.
Definition: buf0buf.cc:6905
void buf_read_page_handle_error(buf_page_t *bpage)
Unfixes the page, unlatches the page, removes it from page_hash and removes it from LRU.
Definition: buf0buf.cc:5351
static ulint buf_block_unfix(buf_page_t *bpage)
Decrements the bufferfix count.
static void buf_page_set_flush_type(buf_page_t *bpage, buf_flush_t flush_type)
Set the flush type of a page.
void buf_page_free_stale_during_write(buf_page_t *bpage, bool owns_sx_lock=false) noexcept
Free a stale page that is being written.
Definition: buf0buf.cc:5527
static buf_pool_t * buf_pool_from_block(const buf_block_t *block)
Returns the buffer pool instance given a block instance.
bool buf_is_block_in_instance(const buf_pool_t *buf_pool, const buf_block_t *ptr)
Find out if a block pointer points into one of currently used chunks of the buffer pool.
Definition: buf0buf.cc:3548
rw_lock_t * buf_page_hash_lock_get(const buf_pool_t *buf_pool, const page_id_t page_id)
Get appropriate page_hash_lock.
Definition: buf0buf.h:2625
std::ostream & operator<<(std::ostream &out, const buf_pool_t &buf_pool)
Print the given buf_pool_t object.
Definition: buf0buf.cc:6978
static BPageMutex * buf_page_get_mutex(const buf_page_t *bpage)
Gets the mutex of a block.
static uint64_t buf_pool_hash_zip_frame(void *ptr)
Compute the hash value for blocks in buf_pool->zip_hash.
Definition: buf0buf.h:2035
static buf_frame_t * buf_block_get_frame(const buf_block_t *block)
Gets a pointer to the memory frame of a block.
void buf_block_reset_page_type_on_mismatch(buf_block_t &block, page_type_t type, mtr_t &mtr)
Verify the page contained by the block.
Definition: buf0buf.h:2811
void buf_pool_free_all()
Frees the buffer pool at shutdown.
Definition: buf0buf.cc:7012
static enum buf_page_state buf_page_get_state(const buf_page_t *bpage)
Gets the state of a block.
static ulint buf_pool_index(const buf_pool_t *buf_pool)
Calculates the index of a buffer pool to the buf_pool[] array.
buf_block_t * buf_page_get_gen(const page_id_t &page_id, const page_size_t &page_size, ulint rw_latch, buf_block_t *guess, Page_fetch mode, ut::Location location, mtr_t *mtr, bool dirty_with_no_latch=false)
This is the general function used to get access to a database page.
Definition: buf0buf.cc:4434
ulint buf_get_free_list_len(void)
Gets the current length of the free list of buffer blocks.
rw_lock_t * buf_page_hash_lock_x_confirm(rw_lock_t *hash_lock, buf_pool_t *buf_pool, const page_id_t &page_id)
Definition: buf0buf.h:2637
static lsn_t buf_page_get_newest_modification(const buf_page_t *bpage)
Gets the youngest modification log sequence number for a frame.
ulint buf_get_latched_pages_number(void)
Returns the number of latched pages in the buffer pool.
Definition: buf0buf.cc:6523
static buf_page_t * buf_page_hash_get_low(buf_pool_t *buf_pool, const page_id_t &page_id)
Returns the control block of a file page, NULL if not found.
static ulint buf_block_fix(buf_page_t *bpage)
Increments the bufferfix count.
constexpr ulint MAX_BUFFER_POOLS
The maximum number of buffer pools that can be defined.
Definition: buf0buf.h:109
static buf_block_t * buf_block_hash_get_locked(buf_pool_t *buf_pool, const page_id_t &page_id, rw_lock_t **lock, ulint lock_mode)
Returns the control block of a file page, NULL if not found.
void buf_print_io(FILE *file)
Prints info of the buffer i/o.
Definition: buf0buf.cc:6819
static buf_pool_t * buf_pool_from_array(ulint index)
Returns the buffer pool instance given its array index.
static void buf_page_release_latch(buf_block_t *block, ulint rw_latch)
Releases a latch, if specified.
void buf_stats_get_pool_info(buf_pool_t *buf_pool, ulint pool_id, buf_pool_info_t *all_pool_info)
Collect buffer pool stats information for a buffer pool.
Definition: buf0buf.cc:6626
void buf_resize_thread()
This is the thread for resizing buffer pool.
Definition: buf0buf.cc:2680
void buf_print(void)
Prints info of the buffer pool data structure.
Definition: buf0buf.cc:6429
const buf_block_t * buf_page_try_get(const page_id_t &page_id, ut::Location location, mtr_t *mtr)
Given a tablespace id and page number tries to get that page.
Definition: buf0buf.cc:4694
static ulint buf_block_get_freed_page_clock(const buf_block_t *block)
Reads the freed_page_clock of a buffer block.
static void buf_ptr_get_fsp_addr(const void *ptr, space_id_t *space, fil_addr_t *addr)
Gets the space id, page offset, and byte offset within page of a pointer pointing to a buffer frame c...
static bool buf_page_peek_if_too_old(const buf_page_t *bpage)
Recommends a move of a block to the start of the LRU list if there is danger of dropping from the buf...
bool buf_block_will_withdrawn(buf_pool_t *buf_pool, const buf_block_t *block)
Determines if a block is intended to be withdrawn.
Definition: buf0buf.cc:1854
void buf_page_make_old(buf_page_t *bpage)
Moved a page to the end of the buffer pool LRU list so that it can be flushed out at the earliest.
Definition: buf0buf.cc:3181
lsn_t buf_pool_get_oldest_modification_approx(void)
Gets the smallest oldest_modification lsn among all of the earliest added pages in flush lists.
Definition: buf0buf.cc:431
buf_block_t * buf_block_hash_get_s_locked(buf_pool_t *b, const page_id_t &page_id, rw_lock_t **l)
Definition: buf0buf.h:1061
Page_fetch
Definition: buf0buf.h:58
@ NO_LATCH
get and bufferfix, but set no latch; we have separated this case, because it is error-prone programmi...
@ NORMAL
Get always.
@ IF_IN_POOL
get if in pool
@ POSSIBLY_FREED_NO_READ_AHEAD
Like Page_fetch::POSSIBLY_FREED, but do not initiate read ahead.
@ IF_IN_POOL_OR_WATCH
Get the page only if it's in the buffer pool, if not then set a watch on the page.
@ PEEK_IF_IN_POOL
get if in pool, do not make the block young in the LRU list
@ POSSIBLY_FREED
Like Page_fetch::NORMAL, but do not mind if the file page has been freed.
@ SCAN
Same as NORMAL, but hint that the fetch is part of a large scan.
rw_lock_t * buf_page_hash_lock_s_confirm(rw_lock_t *hash_lock, const buf_pool_t *buf_pool, const page_id_t page_id)
If not appropriate page_hash_lock, relock until appropriate.
Definition: buf0buf.h:2631
static void buf_page_unset_sticky(buf_page_t *bpage)
Removes stickiness of a block.
buf_page_print_flags
Definition: buf0buf.h:659
@ BUF_PAGE_PRINT_NO_FULL
Do not print the full page dump.
Definition: buf0buf.h:663
@ BUF_PAGE_PRINT_NO_CRASH
Do not crash at the end of buf_page_print().
Definition: buf0buf.h:661
buf_page_t * buf_page_get_also_watch(buf_pool_t *b, const page_id_t &page_id)
Definition: buf0buf.h:1056
bool buf_pool_watch_is_sentinel(const buf_pool_t *buf_pool, const buf_page_t *bpage)
Determine if a block is a sentinel for a buffer pool watch.
Definition: buf0buf.cc:2963
buf_block_t * buf_page_get_with_no_latch(const page_id_t &id, const page_size_t &size, ut::Location location, mtr_t *mtr)
Use these macros to bufferfix a page with no latching.
Definition: buf0buf.h:464
constexpr ulint MAX_BUFFER_POOLS_BITS
Number of bits to representing a buffer pool ID.
Definition: buf0buf.h:106
bool buf_block_hash_lock_held_s(const buf_pool_t *buf_pool, const buf_block_t *block)
Definition: buf0buf.h:2665
buf_block_t * buf_block_hash_get(buf_pool_t *b, const page_id_t &page_id)
Definition: buf0buf.h:1071
bool buf_page_in_memory(const buf_page_t *bpage)
Definition: buf0buf.h:2794
bool is_buffer_pool_resize_in_progress()
Definition: buf0buf.cc:7022
static bool buf_page_peek(const page_id_t &page_id)
Returns true if the page can be found in the buffer pool hash table.
bool buf_page_get_known_nowait(ulint rw_latch, buf_block_t *block, Cache_hint hint, const char *file, ulint line, mtr_t *mtr)
This is used to get access to a known database page, when no waiting can be done.
Definition: buf0buf.cc:4601
buf_page_t * buf_page_hash_get_s_locked(buf_pool_t *b, const page_id_t &page_id, rw_lock_t **l)
Definition: buf0buf.h:1043
static void buf_page_release_zip(buf_page_t *bpage)
Releases a compressed-only page acquired with buf_page_get_zip().
static void buf_block_free(buf_block_t *block)
Frees a buffer block which does not contain a file page.
static uint64_t buf_pool_hash_zip(buf_block_t *b)
Definition: buf0buf.h:2039
buf_page_t * buf_page_hash_get(buf_pool_t *b, const page_id_t &page_id)
Definition: buf0buf.h:1053
static void buf_block_set_state(buf_block_t *block, enum buf_page_state state)
Sets the state of a block.
constexpr uint32_t BUF_PAGE_STATE_BITS
The common buffer control block structure for compressed and uncompressed frames.
Definition: buf0buf.h:1155
static void buf_block_buf_fix_inc_func(ut::Location location, buf_block_t *block)
Increments the bufferfix count.
static buf_pool_t * buf_pool_get(const page_id_t &page_id)
Returns the buffer pool instance given a page id.
static ulint buf_get_withdraw_depth(buf_pool_t *buf_pool)
Return how many more pages must be added to the withdraw list to reach the withdraw target of the cur...
buf_page_state
States of a control block.
Definition: buf0buf.h:131
@ BUF_BLOCK_NOT_USED
Is in the free list; must be after the BUF_BLOCK_ZIP_ constants for compressed-only pages.
Definition: buf0buf.h:141
@ BUF_BLOCK_ZIP_PAGE
Contains a clean compressed page.
Definition: buf0buf.h:135
@ BUF_BLOCK_REMOVE_HASH
Hash index should be removed before putting to the free list.
Definition: buf0buf.h:153
@ BUF_BLOCK_MEMORY
Contains some main memory object.
Definition: buf0buf.h:150
@ BUF_BLOCK_ZIP_DIRTY
Contains a compressed page that is in the buf_pool->flush_list.
Definition: buf0buf.h:137
@ BUF_BLOCK_POOL_WATCH
A sentinel for the buffer pool watch, element of buf_pool->watch[].
Definition: buf0buf.h:133
@ BUF_BLOCK_READY_FOR_USE
When buf_LRU_get_free_block returns a block, it is in this state.
Definition: buf0buf.h:144
@ BUF_BLOCK_FILE_PAGE
Contains a buffered file page.
Definition: buf0buf.h:147
void buf_refresh_io_stats_all()
Refresh the statistics used to print per-second averages.
Definition: buf0buf.cc:6881
static ulint buf_pool_get_n_pages(void)
Gets the current size of buffer buf_pool in frames.
buf_block_t * buf_block_alloc(buf_pool_t *buf_pool)
Allocates a buffer block.
Definition: buf0buf.cc:582
static buf_block_t * buf_get_nth_chunk_block(const buf_pool_t *buf_pool, ulint n, ulint *chunk_size)
Get the nth chunk's buffer block in the specified buffer pool.
static ulint buf_pool_size_align(ulint size)
Calculate aligned buffer pool size based on srv_buf_pool_chunk_unit, if needed.
buf_block_t * buf_page_get(const page_id_t &id, const page_size_t &size, ulint latch, ut::Location location, mtr_t *mtr)
NOTE! The following macros should be used instead of buf_page_get_gen, to improve debugging.
Definition: buf0buf.h:453
static void buf_block_modify_clock_inc(buf_block_t *block)
Increment the modify clock.
static bool buf_page_in_file(const buf_page_t *bpage)
Determines if a block is mapped to a tablespace.
page_zip_des_t * buf_block_get_page_zip(buf_block_t *block) noexcept
Gets the compressed page descriptor corresponding to an uncompressed page if applicable.
Definition: buf0buf.h:2781
void buf_pool_invalidate(void)
Invalidates the file pages in the buffer pool when an archive recovery is completed.
Definition: buf0buf.cc:6134
void buf_page_free_descriptor(buf_page_t *bpage)
Free a buf_page_t descriptor.
Definition: buf0buf.cc:1414
buf_block_t * buf_page_create(const page_id_t &page_id, const page_size_t &page_size, rw_lock_type_t rw_latch, mtr_t *mtr)
Initializes a page to the buffer buf_pool.
Definition: buf0buf.cc:5071
double buf_get_modified_ratio_pct(void)
Return the ratio in percents of modified pages in the buffer pool / database pages in the buffer pool...
Definition: buf0buf.cc:6556
static buf_frame_t * buf_frame_align(byte *ptr)
void buf_page_prepare_for_free(buf_page_t *bpage) noexcept
Prepare a page before adding to the free list.
Definition: buf0buf.h:2773
buf_block_t * buf_pool_contains_zip(buf_pool_t *buf_pool, const void *data)
Finds a block in the buffer pool that points to a given compressed page.
Definition: buf0buf.cc:1173
static void buf_block_set_file_page(buf_block_t *block, const page_id_t &page_id)
Map a block to a file page.
void buf_pool_wait_for_no_pending_io()
Waits until there are no pending I/O operations for the buffer pool.
Definition: buf0buf.cc:6917
static buf_page_t * buf_page_alloc_descriptor(void)
Allocates a buf_page_t descriptor.
static enum buf_io_fix buf_block_get_io_fix(const buf_block_t *block)
Gets the io_fix state of a block.
bool buf_block_hash_lock_held_s_or_x(const buf_pool_t *buf_pool, const buf_block_t *block)
Definition: buf0buf.h:2675
bool buf_block_state_valid(buf_block_t *block)
Check if a buf_block_t object is in a valid state.
Definition: buf0buf.h:2028
buf_block_t * buf_block_hash_get_x_locked(buf_pool_t *b, const page_id_t &page_id, rw_lock_t **l)
Definition: buf0buf.h:1066
const std::unordered_map< buf_page_state, std::string_view > buf_page_state_str
Definition: buf0buf.h:156
buf_page_t * buf_page_reset_file_page_was_freed(const page_id_t &page_id)
Sets file_page_was_freed false if the page is found in the buffer pool.
Definition: buf0buf.cc:3241
static bool buf_page_is_old(const buf_page_t *bpage)
Determine if a block has been flagged old.
void buf_block_buf_fix_inc(buf_block_t *b, ut::Location l)
Increments the bufferfix count.
Definition: buf0buf.h:615
static void buf_page_set_sticky(buf_page_t *bpage)
Makes a block sticky.
void buf_get_total_list_size_in_bytes(buf_pools_list_size_t *buf_pools_list_size)
Get total list size in bytes from all buffer pools.
Definition: buf0buf.cc:535
void buf_get_total_list_len(ulint *LRU_len, ulint *free_len, ulint *flush_list_len)
Get total buffer pool statistics.
Definition: buf0buf.cc:515
bool buf_zip_decompress(buf_block_t *block, bool check)
Decompress a block.
Definition: buf0buf.cc:3444
The database buffer buf_pool.
The database buffer pool global types for the directory.
byte buf_frame_t
A buffer frame.
Definition: buf0types.h:62
BPageMutex BufPoolZipMutex
Definition: buf0types.h:201
constexpr uint32_t BUF_BUDDY_LOW
Smallest buddy page size.
Definition: buf0types.h:183
constexpr uint32_t BUF_BUDDY_SIZES_MAX
Maximum number of buddy sizes based on the max page size.
Definition: buf0types.h:189
buf_flush_t
Flags for flush types.
Definition: buf0types.h:68
@ BUF_FLUSH_N_TYPES
Index of last element + 1
Definition: buf0types.h:79
ib_mutex_t BufListMutex
Definition: buf0types.h:199
ib_bpmutex_t BPageMutex
Definition: buf0types.h:198
buf_io_fix
Flags for io_fix types.
Definition: buf0types.h:99
@ BUF_IO_NONE
no pending I/O
Definition: buf0types.h:101
@ BUF_IO_WRITE
write pending
Definition: buf0types.h:107
@ BUF_IO_READ
read pending
Definition: buf0types.h:104
@ BUF_IO_PIN
disallow relocation of block and its removal from the flush_list
Definition: buf0types.h:110
The database buffer pool high-level routines.
Class implementing buf_pool->flush_list hazard pointer.
Definition: buf0buf.h:2106
~FlushHp() override=default
Destructor.
FlushHp(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
Constructor.
Definition: buf0buf.h:2111
void adjust(const buf_page_t *bpage) override
Adjust the value of hp.
Definition: buf0buf.cc:2923
We use Flush_observer to track flushing of non-redo logged pages in bulk create index(btr0load....
Definition: buf0flu.h:270
A "Hazard Pointer" class used to iterate over page lists inside the buffer pool.
Definition: buf0buf.h:2048
bool is_hp(const buf_page_t *bpage)
Checks if a bpage is the hp.
Definition: buf0buf.cc:2898
void set(buf_page_t *bpage)
Set current value.
Definition: buf0buf.cc:2885
virtual void adjust(const buf_page_t *bpage)=0
Adjust the value of hp.
const ib_mutex_t * m_mutex
mutex that protects access to the m_hp.
Definition: buf0buf.h:2098
void move(const buf_page_t *bpage, buf_page_t *dpage)
Adjust the value of hp for moving.
Definition: buf0buf.cc:2910
buf_page_t * m_hp
hazard pointer.
Definition: buf0buf.h:2102
virtual ~HazardPointer()=default
Destructor.
const buf_pool_t * m_buf_pool
Buffer pool instance.
Definition: buf0buf.h:2094
HazardPointer(const HazardPointer &)
Disable copying.
buf_page_t * get() const
Get current value.
Definition: buf0buf.h:2060
HazardPointer(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
Constructor.
Definition: buf0buf.h:2053
HazardPointer & operator=(const HazardPointer &)
The IO Context that is passed down to the low level IO code.
Definition: os0file.h:266
Class implementing buf_pool->LRU hazard pointer.
Definition: buf0buf.h:2125
~LRUHp() override=default
Destructor.
void adjust(const buf_page_t *bpage) override
Adjust the value of hp.
Definition: buf0buf.cc:2938
LRUHp(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
Constructor.
Definition: buf0buf.h:2130
Special purpose iterators to be used when scanning the LRU list.
Definition: buf0buf.h:2147
~LRUItr() override=default
Destructor.
buf_page_t * start()
Selects from where to start a scan.
Definition: buf0buf.cc:2953
LRUItr(const buf_pool_t *buf_pool, const ib_mutex_t *mutex)
Constructor.
Definition: buf0buf.h:2152
The purpose of this class is to hide the knowledge that Buf_io_fix_latching_rules even exists from us...
Definition: buf0buf.cc:5621
Definition: buf0buf.h:1436
bool someone_is_responsible() const
Checks if there is any thread responsible for I/O on this page now.
Definition: buf0buf.h:1444
void release()
Called by the thread responsible for I/O on this page to release its responsibility.
Definition: buf0buf.h:1456
bool current_thread_is_responsible() const
Checks if the current thread is responsible for I/O on this page now.
Definition: buf0buf.h:1450
void take()
Called by the thread which becomes responsible for I/O on this page to indicate that it takes the res...
Definition: buf0buf.h:1463
std::thread::id responsible_thread
The thread responsible for I/O on this page, or an impossible value if no thread is currently respons...
Definition: buf0buf.h:1439
Definition: buf0buf.h:1165
uint32_t freed_page_clock
The value of buf_pool->freed_page_clock when this block was the last time put to the head of the LRU ...
Definition: buf0buf.h:1680
buf_page_t(const buf_page_t &other)
Copy constructor.
Definition: buf0buf.h:1169
void space_id_changed()
Updates new space reference and acquires "reference count latch" and the current version of the space...
Definition: buf0buf.h:1327
void take_io_responsibility()
Called by the thread which becomes responsible for I/O on this page to indicate that it takes the res...
Definition: buf0buf.h:1490
bool is_stale() const
Checks if this space reference saved during last page ID initialization was deleted or truncated sinc...
Definition: buf0buf.h:1244
void init_io_fix()
This is called only when having full ownership of the page object and no other thread can reach it.
Definition: buf0buf.h:1520
void set_io_fix(buf_io_fix io_fix)
Sets io_fix to specified value.
Definition: buf0buf.cc:5695
bool someone_has_io_responsibility() const
Checks if there is any thread responsible for I/O on this page now.
Definition: buf0buf.h:1474
bool has_correct_io_fix_value() const
Checks if io_fix has any of the known enum values.
Definition: buf0buf.h:1423
lsn_t get_newest_lsn() const noexcept
Definition: buf0buf.h:1360
bool current_thread_has_io_responsibility() const
Checks if the current thread is responsible for I/O on this page now.
Definition: buf0buf.h:1480
void set_newest_lsn(lsn_t lsn) noexcept
Set the latest modification LSN.
Definition: buf0buf.h:1371
buf_page_t * hash
Node used in chaining to buf_pool->page_hash or buf_pool->zip_hash.
Definition: buf0buf.h:1610
bool is_io_fix_write() const
Checks if the current value of io_fix is BUF_IO_WRITE.
Definition: buf0buf.cc:5675
Flush_observer * get_flush_observer() noexcept
Definition: buf0buf.h:1344
fil_space_t * get_space() const
Retrieve the tablespace object if one was available during page ID initialization.
Definition: buf0buf.h:1283
bool is_io_fix_read_as_opposed_to_write() const
Assuming that io_fix is either BUF_IO_READ or BUF_IO_WRITE determines which of the two it is.
Definition: buf0buf.cc:5687
space_id_t space() const noexcept
Retrieve the tablespace id.
Definition: buf0buf.h:1233
bool in_zip_hash
true if in buf_pool->zip_hash
Definition: buf0buf.h:1725
bool in_free_list
true if in buf_pool->free; when buf_pool->free_list_mutex is free, the following should hold: in_free...
Definition: buf0buf.h:1716
std::chrono::steady_clock::time_point access_time
Time of first access, or 0 if the block was never accessed in the buffer pool.
Definition: buf0buf.h:1689
Flush_observer * m_flush_observer
Flush observer instance.
Definition: buf0buf.h:1672
buf_fix_count_atomic_t buf_fix_count
Count of how many fold this block is currently bufferfixed.
Definition: buf0buf.h:1394
bool in_flush_list
true if in buf_pool->flush_list; when buf_pool->flush_list_mutex is free, the following should hold: ...
Definition: buf0buf.h:1712
void reset_page_id()
Sets stored value to invalid/empty value.
Definition: buf0buf.h:1320
bool is_dirty() const noexcept
Definition: buf0buf.h:1367
bool old
true if the block is in the old blocks in buf_pool->LRU_old
Definition: buf0buf.h:1698
bool was_io_fix_read() const
Checks if io_fix is BUF_IO_READ without requiring or acquiring any latches.
Definition: buf0buf.h:1580
void reinit_io_fix()
This is called only when having full ownership of the page object and no other thread can reach it.
Definition: buf0buf.h:1532
void reset_page_id(page_id_t new_page_id)
Sets stored page ID to the new value.
Definition: buf0buf.h:1304
void set_oldest_lsn(lsn_t lsn) noexcept
Set the LSN when the page is modified for the first time.
Definition: buf0buf.ic:746
uint16_t get_dblwr_batch_id() const
Definition: buf0buf.h:1229
bool was_stale() const
Checks if this space reference saved during last page ID initialization was deleted or truncated sinc...
Definition: buf0buf.h:1261
void set_page_id(const page_id_t page_id)
Set the stored page id to a new value.
Definition: buf0buf.h:1288
friend std::ostream & operator<<(std::ostream &outs, const buf_page_t &page)
Print page metadata in JSON format {"key":"value"}.
Definition: buf0buf.cc:7063
lsn_t newest_modification
The flush LSN, LSN when this page was written to the redo log.
Definition: buf0buf.h:1643
void release_io_responsibility()
Called by the thread responsible for I/O on this page to release its responsibility.
Definition: buf0buf.h:1486
static bool is_memory(const page_t *const ptr) noexcept
Check if the given ptr lies in a memory block of type BUF_BLOCK_MEMORY.
Definition: buf0buf.cc:7029
lsn_t get_oldest_lsn() const noexcept
Definition: buf0buf.h:1364
lsn_t oldest_modification
log sequence number of the youngest modification to this block, zero if not modified.
Definition: buf0buf.h:1647
page_id_t id
Page id.
Definition: buf0buf.h:1388
copyable_atomic_t< buf_io_fix > io_fix
Type of pending I/O operation.
Definition: buf0buf.h:1400
UT_LIST_NODE_T(buf_page_t) list
Based on state, this is a list node, protected by the corresponding list mutex, in one of the followi...
buf_io_fix get_io_fix_snapshot() const
Retrieves a value of io_fix without requiring or acquiring any latches.
Definition: buf0buf.h:1506
page_size_t size
Page size.
Definition: buf0buf.h:1391
io_responsibility_t io_responsibility
Tracks which thread is responsible for I/O on this page.
Definition: buf0buf.h:1469
uint8_t buf_pool_index
Index number of the buffer pool that this block belongs to.
Definition: buf0buf.h:1607
uint16_t m_dblwr_id
Double write instance ordinal value during writes.
Definition: buf0buf.h:1694
bool was_io_fix_none() const
Checks if io_fix is BUF_IO_NONE without requiring or acquiring any latches.
Definition: buf0buf.h:1597
void set_clean() noexcept
Set page to clean state.
Definition: buf0buf.h:1378
buf_io_fix get_io_fix() const
Retrieves the current value of io_fix.
Definition: buf0buf.h:1548
bool is_io_fix_read() const
Checks if the current value of io_fix is BUF_IO_READ.
Definition: buf0buf.cc:5681
uint32_t m_version
Version of fil_space_t when the page was updated.
Definition: buf0buf.h:1685
bool in_LRU_list
true if the page is in the LRU list; used in debugging
Definition: buf0buf.h:1719
void set_flush_observer(Flush_observer *flush_observer) noexcept
Set the flush observer for the page.
Definition: buf0buf.h:1348
buf_page_state state
Block state.
Definition: buf0buf.h:1600
page_no_t page_no() const noexcept
Retrieve the page number.
Definition: buf0buf.h:1237
fil_space_t * m_space
Tablespace instance that this page belongs to.
Definition: buf0buf.h:1675
bool was_io_fixed() const
Checks if io_fix is BUF_IO_FIX or BUF_IO_READ or BUF_IO_WRITE without requiring or acquiring any latc...
Definition: buf0buf.h:1587
void reset_flush_observer() noexcept
Remove the flush observer.
Definition: buf0buf.h:1356
void set_dblwr_batch_id(uint16_t batch_id)
Set the doublewrite buffer ID.
Definition: buf0buf.h:1226
bool file_page_was_freed
This is set to true when fsp frees a page in buffer pool; protected by buf_pool->zip_mutex or buf_blo...
Definition: buf0buf.h:1703
UT_LIST_NODE_T(buf_page_t) LRU
node of the LRU list
friend class Latching_rules_helpers
Definition: buf0buf.h:1428
bool is_memory() const noexcept
Check if the state of this page is BUF_BLOCK_MEMORY.
Definition: buf0buf.h:1219
buf_flush_t flush_type
If this block is currently being flushed to disk, this tells the flush_type.
Definition: buf0buf.h:1604
void set_page_size(const page_size_t &page_size)
Set the page size to a new value.
Definition: buf0buf.h:1296
bool in_page_hash
true if in buf_pool->page_hash
Definition: buf0buf.h:1722
page_zip_des_t zip
compressed page; zip.data (but not the data it points to) is protected by buf_pool->zip_mutex; state ...
Definition: buf0buf.h:1668
static bool is_correct_io_fix_value(buf_io_fix io_fix)
Checks if io_fix has any of the known enum values.
Definition: buf0buf.h:1407
Definition: buf0buf.h:1158
copyable_atomic_t(const copyable_atomic_t< T > &other)
Definition: buf0buf.h:1160
Definition: hash0hash.h:375
Page identifier.
Definition: buf0types.h:207
uint64_t hash() const
Retrieve the hash value.
Definition: buf0types.h:247
page_no_t page_no() const
Retrieve the page number.
Definition: buf0types.h:243
Page size descriptor.
Definition: page0size.h:50
size_t logical() const
Retrieve the logical page size (in-memory).
Definition: page0size.h:129
int page
Definition: ctype-mb.cc:1234
dberr_t
Definition: db0err.h:39
fil_space_t * fil_space_get(space_id_t space_id)
Look up a tablespace.
Definition: fil0fil.cc:2230
void fil_page_reset_type(const page_id_t &page_id, byte *page, ulint type, mtr_t *mtr)
Reset the page type.
Definition: fil0fil.cc:8237
The low-level file system.
uint16_t page_type_t
Definition: fil0fil.h:1224
constexpr page_type_t FIL_PAGE_INDEX
File page types (values of FIL_PAGE_TYPE)
Definition: fil0fil.h:1228
constexpr page_no_t FIL_NULL
'null' (undefined) page offset in the context of file spaces
Definition: fil0fil.h:1162
page_type_t fil_page_get_type(const byte *page)
Get the file page type.
Definition: fil0fil.h:1341
constexpr uint32_t FIL_PAGE_TYPE
file page type: FIL_PAGE_INDEX,..., 2 bytes.
Definition: fil0types.h:76
constexpr uint32_t FIL_PAGE_OFFSET
page offset inside space
Definition: fil0types.h:46
constexpr uint32_t FIL_PAGE_DATA
start of the data on the page
Definition: fil0types.h:111
constexpr uint32_t FIL_PAGE_SPACE_ID
alias for space id
Definition: fil0types.h:108
constexpr uint32_t FIL_PAGE_NEXT
if there is a 'natural' successor of the page, its offset.
Definition: fil0types.h:61
constexpr uint32_t FIL_PAGE_PREV
if there is a 'natural' predecessor of the page, its offset.
Definition: fil0types.h:51
flush_type
Definition: my_sys.h:298
The simple hash table utility.
static rw_lock_t * hash_lock_s_confirm(rw_lock_t *hash_lock, hash_table_t *table, uint64_t hash_value)
If not appropriate rw_lock for a hash value in a hash table, relock S-lock the another rw_lock until ...
static rw_lock_t * hash_lock_x_confirm(rw_lock_t *hash_lock, hash_table_t *table, uint64_t hash_value)
If not appropriate rw_lock for a hash value in a hash table, relock X-lock the another rw_lock until ...
static rw_lock_t * hash_get_lock(hash_table_t *table, uint64_t hash_value)
Gets the rw_lock for a hash value in a hash table.
static int flags[50]
Definition: hp_test1.cc:40
#define malloc(A)
Definition: lexyy.cc:914
#define free(A)
Definition: lexyy.cc:915
lock_mode
Definition: lock0types.h:54
constexpr lsn_t LSN_MAX
Maximum possible lsn value is slightly higher than the maximum sn value, because lsn sequence enumera...
Definition: log0constants.h:159
uint64_t lsn_t
Type used for all log sequence number storage and arithmetic.
Definition: log0types.h:63
static uint16_t mach_read_from_2(const byte *b)
The following function is used to fetch data from 2 consecutive bytes.
static uint32_t mach_read_from_4(const byte *b)
The following function is used to fetch data from 4 consecutive bytes.
static void mach_write_to_4(byte *b, ulint n)
The following function is used to store data in 4 consecutive bytes.
Mini-transaction buffer global types.
unsigned long long int ulonglong
Definition: my_inttypes.h:56
void copy(Shards< COUNT > &dst, const Shards< COUNT > &src) noexcept
Copy the counters, overwrite destination.
Definition: ut0counter.h:354
void clear(Shards< COUNT > &shards) noexcept
Clear the counter - reset to 0.
Definition: ut0counter.h:344
Definition: buf0block_hint.cc:30
const std::string FILE("FILE")
bool load(THD *, const dd::String_type &fname, dd::String_type *buf)
Read an sdi file from disk and store in a buffer.
Definition: sdi_file.cc:308
Definition: os0file.h:89
Provides atomic access in shared-exclusive modes.
Definition: shared_spin_lock.h:79
size_t size(const char *const c)
Definition: base64.h:46
Definition: gcs_xcom_synode.h:64
mode
Definition: file_handle.h:61
pid_type get_id()
Definition: process.h:48
static uint64_t hash_uint64(uint64_t value)
Hashes a 64-bit integer.
Definition: ut0rnd.h:199
std::list< T, ut::allocator< T > > list
Specialization of list which uses ut_allocator.
Definition: ut0new.h:2879
void os_event_set(os_event_t event)
Sets an event semaphore to the signaled state: lets waiting threads proceed.
Definition: os0event.cc:553
bool os_event_is_set(const os_event_t event)
Check if the event is set.
Definition: os0event.cc:545
int64_t os_event_reset(os_event_t event)
Resets an event semaphore to the non-signaled state.
Definition: os0event.cc:568
The interface to the operating system process control primitives.
Index page routines.
byte page_t
Type of the index page.
Definition: page0types.h:152
required string type
Definition: replication_group_member_actions.proto:34
Shutdowns the Innobase database server.
std::atomic< enum srv_shutdown_t > srv_shutdown_state
At a shutdown this value climbs from SRV_SHUTDOWN_NONE to SRV_SHUTDOWN_EXIT_THREADS.
Definition: srv0start.cc:162
@ SRV_SHUTDOWN_EXIT_THREADS
Exit all threads and free resources.
Definition: srv0shutdown.h:111
The server main program.
Functor to validate the LRU list.
Definition: buf0buf.h:2747
static void validate(const buf_pool_t *buf_pool)
Definition: buf0buf.h:2750
void operator()(const buf_page_t *elem) const
Definition: buf0buf.h:2748
Functor to validate the LRU list.
Definition: buf0buf.h:2737
void operator()(const buf_page_t *elem) const
Definition: buf0buf.h:2738
static void validate(const buf_pool_t *buf_pool)
Definition: buf0buf.h:2740
Definition: buf0buf.h:2756
static void validate(const buf_pool_t *buf_pool)
Definition: buf0buf.h:2762
void operator()(const buf_block_t *elem) const
Definition: buf0buf.h:2757
Structure used by AHI to contain information on record prefixes to be considered in hash index subsys...
Definition: buf0buf.h:1740
bool operator==(const btr_search_prefix_info_t &other) const
Definition: buf0buf.h:1754
bool operator!=(const btr_search_prefix_info_t &other) const
Definition: buf0buf.h:1759
bool equals_without_left_side(const btr_search_prefix_info_t &other) const
Definition: buf0buf.h:1750
uint32_t n_bytes
recommended prefix: number of bytes in an incomplete field
Definition: buf0buf.h:1743
uint16_t n_fields
recommended prefix length for hash search: number of full fields
Definition: buf0buf.h:1745
bool left_side
true or false, depending on whether the leftmost record of several records with the same prefix shoul...
Definition: buf0buf.h:1748
Structure that holds most AHI-related fields.
Definition: buf0buf.h:1803
void assert_empty_on_init() const
Definition: buf0buf.h:1869
std::atomic< dict_index_t * > index
Index for which the adaptive hash index has been created, or nullptr if the page does not exist in th...
Definition: buf0buf.h:1822
void assert_empty() const
Definition: buf0buf.h:1867
void validate() const
Definition: buf0buf.h:1845
std::atomic< btr_search_prefix_info_t > prefix_info
Prefix info that was used for building hash index.
Definition: buf0buf.h:1821
std::atomic< uint16_t > n_pointers
Used in debugging.
Definition: buf0buf.h:1843
std::atomic< btr_search_prefix_info_t > recommended_prefix_info
Recommended prefix info for hash search.
Definition: buf0buf.h:1810
The buffer control block structure.
Definition: buf0buf.h:1765
rw_lock_t debug_latch
In the debug version, each thread which bufferfixes the block acquires an s-latch here; so we can use...
Definition: buf0buf.h:1904
uint64_t modify_clock
This clock is incremented every time a pointer to a record on the page may become obsolete; this is u...
Definition: buf0buf.h:1918
BPageLock lock
read-write lock of the buffer frame
Definition: buf0buf.h:1775
std::atomic< uint32_t > n_hash_helps
Counter which controls how many times the current prefix recommendation would help in searches.
Definition: buf0buf.h:1892
page_type_t get_page_type() const
Get the page type of the current buffer block.
Definition: buf0buf.h:1964
struct buf_block_t::ahi_t ahi
buf_page_t page
page information; this must be the first field, so that buf_pool->page_hash can point to buf_page_t o...
Definition: buf0buf.h:1771
page_no_t get_next_page_no() const
Get the next page number of the current buffer block.
Definition: buf0buf.h:1952
page_zip_des_t const * get_page_zip() const noexcept
Const version.
Definition: buf0buf.h:2008
const char * get_page_type_str() const noexcept
Get the page type of the current buffer block as string.
Definition: buf0buf.cc:7005
bool in_withdraw_list
Definition: buf0buf.h:1797
UT_LIST_NODE_T(buf_block_t) unzip_LRU
node of the decompressed LRU list; a block is in the unzip_LRU list if page.state == BUF_BLOCK_FILE_P...
page_no_t get_prev_page_no() const
Get the prev page number of the current buffer block.
Definition: buf0buf.h:1958
bool is_leaf() const
Definition: buf0buf.h:2019
void mark_for_read_io()
Mark the frame with jumbled page_id, while initiating i/o read (BUF_IO_READ).
Definition: buf0buf.h:1971
uint64_t get_modify_clock(bool single_threaded) const noexcept
Get the modified clock (version) value.
Definition: buf0buf.h:1931
bool in_unzip_LRU_list
true if the page is in the decompressed LRU list; used in debugging
Definition: buf0buf.h:1795
bool is_empty() const
Check if this index page is empty.
Definition: buf0buf.cc:7042
const page_id_t & get_page_id() const
Get the page number and space id of the current buffer block.
Definition: buf0buf.h:1944
BPageMutex mutex
mutex protecting this block: state (also protected by the buffer pool mutex), io_fix,...
Definition: buf0buf.h:1925
byte * frame
pointer to buffer frame which is of size UNIV_PAGE_SIZE, and aligned to an address divisible by UNIV_...
Definition: buf0buf.h:1787
page_no_t get_page_no() const
Get the page number of the current buffer block.
Definition: buf0buf.h:1948
bool is_index_page() const
Definition: buf0buf.h:2021
bool is_root() const
Definition: buf0buf.h:2015
bool was_freed() const
Check if the buffer block was freed.
Definition: buf0buf.h:1780
bool made_dirty_with_no_latch
true if block has been made dirty without acquiring X/SX latch as the block belongs to temporary tabl...
Definition: buf0buf.h:1896
page_zip_des_t * get_page_zip() noexcept
Gets the compressed page descriptor corresponding to an uncompressed page if applicable.
Definition: buf0buf.h:2002
bool is_memory() const noexcept
Definition: buf0buf.h:2012
uint16_t get_page_level() const
Definition: buf0buf.cc:7034
friend std::ostream & operator<<(std::ostream &outs, const buf_block_t &block)
Print control block information in JSON format: {"key":"value"}.
Definition: buf0buf.cc:7097
Struct that is embedded in the free zip blocks.
Definition: buf0buf.h:2166
UT_LIST_NODE_T(buf_buddy_free_t) list
Node of zip_free list.
ulint size
size of the block
Definition: buf0buf.h:2168
byte bytes[FIL_PAGE_DATA]
stamp[FIL_PAGE_ARCH_LOG_NO_OR_SPACE_ID] == BUF_BUDDY_FREE_STAMP denotes a free block.
Definition: buf0buf.h:2169
union buf_buddy_free_t::@196 stamp
buf_page_t bpage
Embedded bpage descriptor.
Definition: buf0buf.h:2180
Definition: buf0buf.h:2278
uint64_t relocated
Definition: buf0buf.h:2280
ulint used
Definition: buf0buf.h:2279
std::chrono::steady_clock::duration relocated_duration
Definition: buf0buf.h:2281
Statistics of buddy blocks of a given size.
Definition: buf0buf.h:2268
uint64_t relocated
Number of blocks relocated by the buddy system.
Definition: buf0buf.h:2273
snapshot_t take_snapshot()
Definition: buf0buf.h:2284
std::atomic< ulint > used
Number of blocks allocated from the buddy system.
Definition: buf0buf.h:2270
std::chrono::steady_clock::duration relocated_duration
Total duration of block relocations.
Definition: buf0buf.h:2276
A chunk of buffers.
Definition: buf0buf.ic:53
This structure defines information we will fetch from each buffer pool.
Definition: buf0buf.h:170
ulint young_making_delta
num of pages made young since last printout
Definition: buf0buf.h:223
std::array< size_t, BUF_FLUSH_N_TYPES > n_pending_flush
Number of pages pending flush of given type.
Definition: buf0buf.h:190
double pages_created_rate
num of pages create per second
Definition: buf0buf.h:219
ulint n_pages_read
buf_pool->n_pages_read
Definition: buf0buf.h:196
ulint pool_unique_id
Buffer Pool ID.
Definition: buf0buf.h:174
ulint n_pend_reads
buf_pool->n_pend_reads, pages pending read
Definition: buf0buf.h:188
ulint n_ra_pages_read_rnd
buf_pool->n_ra_pages_read_rnd, number of pages readahead
Definition: buf0buf.h:204
ulint lru_len
Length of buf_pool->LRU.
Definition: buf0buf.h:178
ulint unzip_cur
buf_LRU_stat_cur.unzip, num pages decompressed in current interval
Definition: buf0buf.h:244
ulint page_read_delta
num of pages read since last printout
Definition: buf0buf.h:221
double pages_written_rate
num of pages written per second
Definition: buf0buf.h:220
double page_made_young_rate
page made young rate in pages per second
Definition: buf0buf.h:214
ulint io_sum
buf_LRU_stat_sum.io
Definition: buf0buf.h:240
ulint io_cur
buf_LRU_stat_cur.io, num of IO for current interval
Definition: buf0buf.h:241
ulint old_lru_len
buf_pool->LRU_old_len
Definition: buf0buf.h:180
double pages_readahead_rnd_rate
random readahead rate in pages per second
Definition: buf0buf.h:229
ulint unzip_sum
buf_LRU_stat_sum.unzip
Definition: buf0buf.h:243
ulint n_pages_made_young
number of pages made young
Definition: buf0buf.h:192
ulint n_ra_pages_read
buf_pool->n_ra_pages_read, number of pages readahead
Definition: buf0buf.h:206
ulint n_pages_not_made_young
number of pages not made young
Definition: buf0buf.h:194
ulint n_ra_pages_evicted
buf_pool->n_ra_pages_evicted, number of readahead pages evicted without access
Definition: buf0buf.h:209
ulint n_pages_created
buf_pool->n_pages_created
Definition: buf0buf.h:198
ulint n_page_get_delta
num of buffer pool page gets since last printout
Definition: buf0buf.h:211
ulint free_list_len
Length of buf_pool->free list.
Definition: buf0buf.h:182
double pages_evicted_rate
rate of readahead page evicted without access, in pages per second
Definition: buf0buf.h:233
ulint not_young_making_delta
num of pages not make young since last printout
Definition: buf0buf.h:225
ulint n_pend_unzip
buf_pool->n_pend_unzip, pages pending decompress
Definition: buf0buf.h:186
double pages_readahead_rate
readahead rate in pages per second
Definition: buf0buf.h:231
ulint unzip_lru_len
length of buf_pool->unzip_LRU list
Definition: buf0buf.h:237
ulint pool_size
Buffer Pool size in pages.
Definition: buf0buf.h:176
ulint flush_list_len
Length of buf_pool->flush_list.
Definition: buf0buf.h:184
double page_not_made_young_rate
page not made young rate in pages per second
Definition: buf0buf.h:216
ulint n_page_gets
buf_pool->n_page_gets
Definition: buf0buf.h:202
double pages_read_rate
num of pages read per second
Definition: buf0buf.h:218
ulint n_pages_written
buf_pool->n_pages_written
Definition: buf0buf.h:200
The buffer pool statistics structure.
Definition: buf0buf.h:2186
uint64_t n_pages_not_made_young
Number of pages not made young because the first access was not long enough ago, in buf_page_peek_if_...
Definition: buf0buf.h:2219
std::atomic< uint64_t > n_pages_read
Number of read operations.
Definition: buf0buf.h:2195
std::atomic< uint64_t > n_pages_created
number of pages created in the pool with no read.
Definition: buf0buf.h:2201
uint64_t n_pages_made_young
Number of pages made young, in calls to buf_LRU_make_block_young().
Definition: buf0buf.h:2215
uint64_t n_ra_pages_evicted
Number of read ahead pages that are evicted without being accessed.
Definition: buf0buf.h:2211
std::atomic< uint64_t > n_ra_pages_read_rnd
Number of pages read in as part of random read ahead.
Definition: buf0buf.h:2204
uint64_t flush_list_bytes
Flush_list size in bytes.
Definition: buf0buf.h:2225
std::atomic< uint64_t > n_ra_pages_read
Number of pages read in as part of read ahead.
Definition: buf0buf.h:2207
Shards m_n_page_gets
Number of page gets performed; also successful searches through the adaptive hash index are counted a...
Definition: buf0buf.h:2192
uint64_t LRU_bytes
LRU size in bytes.
Definition: buf0buf.h:2222
void reset()
Definition: buf0buf.h:2251
static void copy(buf_pool_stat_t &dst, const buf_pool_stat_t &src) noexcept
Definition: buf0buf.h:2227
std::atomic< uint64_t > n_pages_written
Number of write operations.
Definition: buf0buf.h:2198
The buffer pool structure.
Definition: buf0buf.h:2294
UT_LIST_BASE_NODE_T(buf_buddy_free_t, list) zip_free[BUF_BUDDY_SIZES_MAX]
Buddy free lists.
UT_LIST_BASE_NODE_T(buf_page_t, list) free
Base node of the free block list.
buf_chunk_t * chunks_old
old buffer pool chunks to be freed after resizing buffer pool
Definition: buf0buf.h:2348
void change_flush_state(buf_flush_t flush_type, F &&change)
Executes change() which modifies fields protected by flush_state_mutex.
Definition: buf0buf.h:2567
hash_table_t * zip_hash
Hash table of buf_block_t blocks whose frames are allocated to the zip buddy system,...
Definition: buf0buf.h:2367
FlushHp flush_hp
"Hazard pointer" used during scan of flush_list while doing flush list batch.
Definition: buf0buf.h:2401
buf_buddy_stat_t buddy_stat[BUF_BUDDY_SIZES_MAX+1]
Statistics of buddy system, indexed by block size.
Definition: buf0buf.h:2380
LRUItr single_scan_itr
Iterator used to scan the LRU list when searching for single page flushing victim.
Definition: buf0buf.h:2478
buf_pool_stat_t old_stat
Old statistics.
Definition: buf0buf.h:2386
void deallocate_chunk(buf_chunk_t *chunk)
A wrapper for buf_pool_t::allocator.deallocate_large which also advices the OS that this chunk can be...
Definition: buf0buf.cc:979
bool try_LRU_scan
Set to false when an LRU scan for free block fails.
Definition: buf0buf.h:2440
ulint buddy_n_frames
Number of frames allocated from the buffer pool to the buddy system.
Definition: buf0buf.h:2335
std::atomic< ulint > n_pend_reads
Number of pending read operations.
Definition: buf0buf.h:2370
UT_LIST_BASE_NODE_T(buf_page_t, list) zip_clean
Unmodified compressed pages.
UT_LIST_BASE_NODE_T(buf_page_t, list) flush_list
Base node of the modified block list.
LRUHp lru_hp
"hazard pointer" used during scan of LRU while doing LRU list batch.
Definition: buf0buf.h:2470
bool allocate_chunk(ulonglong mem_size, buf_chunk_t *chunk)
A wrapper for buf_pool_t::allocator.alocate_large which also advices the OS that this chunk should no...
Definition: buf0buf.cc:945
bool is_tracking()
Check if the page modifications are tracked.
Definition: buf0buf.h:2447
UT_LIST_BASE_NODE_T(buf_block_t, unzip_LRU) unzip_LRU
Base node of the unzip_LRU list.
std::chrono::steady_clock::time_point last_printout_time
when buf_print_io was last time called.
Definition: buf0buf.h:2376
ulint LRU_old_ratio
Reserve this much of the buffer pool for "old" blocks.
Definition: buf0buf.h:2331
BufListMutex chunks_mutex
protects (de)allocation of chunks:
Definition: buf0buf.h:2303
lsn_t track_page_lsn
Page Tracking start LSN.
Definition: buf0buf.h:2443
BufListMutex zip_free_mutex
buddy allocator mutex
Definition: buf0buf.h:2312
volatile ulint n_chunks
Number of buffer pool chunks.
Definition: buf0buf.h:2339
LRUItr lru_scan_itr
Iterator used to scan the LRU list when searching for replaceable victim.
Definition: buf0buf.h:2474
bool madvise_dump()
Advices the OS that all chunks in this buffer pool instance can be dumped to a core file.
Definition: buf0buf.cc:990
ulint old_size
Previous pool size in pages.
Definition: buf0buf.h:2354
UT_LIST_BASE_NODE_T(buf_page_t, LRU) LRU
Base node of the LRU list.
FlushHp oldest_hp
Entry pointer to scan the oldest page except for system temporary.
Definition: buf0buf.h:2404
buf_page_t * LRU_old
Pointer to the about LRU_old_ratio/BUF_LRU_OLD_RATIO_DIV oldest blocks in the LRU list; NULL if LRU l...
Definition: buf0buf.h:2486
buf_page_t * watch
Sentinel records for buffer pool watches.
Definition: buf0buf.h:2515
BufListMutex flush_list_mutex
Mutex protecting the flush list access.
Definition: buf0buf.h:2397
ib_mutex_t flush_state_mutex
Flush state protection mutex.
Definition: buf0buf.h:2318
ib_rbt_t * flush_rbt
A red-black tree is used exclusively during recovery to speed up insertions in the flush_list.
Definition: buf0buf.h:2427
buf_chunk_t * chunks
buffer pool chunks
Definition: buf0buf.h:2345
BufListMutex LRU_list_mutex
LRU list mutex.
Definition: buf0buf.h:2306
hash_table_t * page_hash
Hash table of buf_page_t or buf_block_t file pages, buf_page_in_file() == true, indexed by (space_id,...
Definition: buf0buf.h:2363
ulint withdraw_target
Target length of withdraw block list, when withdrawing.
Definition: buf0buf.h:2466
os_event_t no_flush[BUF_FLUSH_N_TYPES]
This is in the set state when there is no flush batch of the given type running.
Definition: buf0buf.h:2419
buf_pool_stat_t stat
Current statistics.
Definition: buf0buf.h:2383
page_no_t read_ahead_area
Size in pages of the area which the read-ahead algorithms read if invoked.
Definition: buf0buf.h:2358
ulint curr_pool_size
Current pool size in bytes.
Definition: buf0buf.h:2328
bool init_flush[BUF_FLUSH_N_TYPES]
This is true when a flush of the given type is being initialized.
Definition: buf0buf.h:2411
ulint curr_size
Current pool size in pages.
Definition: buf0buf.h:2351
ulint instance_no
Array index of this buffer pool instance.
Definition: buf0buf.h:2325
ulint LRU_old_len
Length of the LRU list from the block to which LRU_old points onward, including that block; see buf0l...
Definition: buf0buf.h:2492
std::array< size_t, BUF_FLUSH_N_TYPES > n_flush
This is the number of pending writes in the given flush type.
Definition: buf0buf.h:2415
std::atomic< ulint > n_pend_unzip
number of pending decompressions.
Definition: buf0buf.h:2373
UT_LIST_BASE_NODE_T(buf_page_t, list) withdraw
base node of the withdraw block list.
lsn_t max_lsn_io
Maximum LSN for which write io has already started.
Definition: buf0buf.h:2450
ulint freed_page_clock
A sequence number used to count the number of buffer blocks removed from the end of the LRU list; NOT...
Definition: buf0buf.h:2434
BufListMutex free_list_mutex
free and withdraw list mutex
Definition: buf0buf.h:2309
BufPoolZipMutex zip_mutex
Zip mutex of this buffer pool instance, protects compressed only pages (of type buf_page_t,...
Definition: buf0buf.h:2322
bool madvise_dont_dump()
Advices the OS that all chunks in this buffer pool instance should not be dumped to a core file.
Definition: buf0buf.cc:1000
volatile ulint n_chunks_new
New number of buffer pool chunks.
Definition: buf0buf.h:2342
BufListMutex zip_hash_mutex
zip_hash mutex
Definition: buf0buf.h:2315
bool is_flushing(buf_flush_t flush_type) const
Checks if the batch is running, which is basically equivalent to !os_event_is_set(no_flush[type]) if ...
Definition: buf0buf.h:2554
The occupied bytes of lists in all buffer pools.
Definition: buf0buf.h:250
ulint LRU_bytes
LRU size in bytes.
Definition: buf0buf.h:251
ulint unzip_LRU_bytes
unzip_LRU size in bytes
Definition: buf0buf.h:252
ulint flush_list_bytes
flush_list size in bytes
Definition: buf0buf.h:253
File space address.
Definition: fil0fil.h:1179
File node of a tablespace or the log data space.
Definition: fil0fil.h:158
Tablespace or log data space.
Definition: fil0fil.h:241
space_id_t id
Tablespace ID.
Definition: fil0fil.h:337
void dec_ref() noexcept
Decrement the page reference count.
Definition: fil0fil.h:299
uint32_t get_current_version() const
Returns current version of the space object.
Definition: fil0fil.cc:11774
uint32_t get_recent_version() const
Returns current version of the space object.
Definition: fil0fil.cc:11778
bool was_not_deleted() const
Definition: fil0fil.cc:11766
void inc_ref() noexcept
Increment the page reference count.
Definition: fil0fil.h:288
bool is_deleted() const
Definition: fil0fil.cc:11761
Red black tree instance.
Definition: ut0rbt.h:72
Mini-transaction handle and buffer.
Definition: mtr0mtr.h:177
InnoDB condition variable.
Definition: os0event.cc:63
Compressed page descriptor.
Definition: page0types.h:201
page_zip_t * data
Compressed page data.
Definition: page0types.h:203
The structure used in the spin lock implementation of a read-write lock.
Definition: sync0rw.h:363
Definition: ut0core.h:36
bool rw_lock_own(const rw_lock_t *lock, ulint lock_type)
Checks if the thread has locked the rw-lock in the specified mode, with the pass value == 0.
Definition: sync0rw.cc:858
rw_lock_type_t
Definition: sync0rw.h:97
@ RW_NO_LATCH
Definition: sync0rw.h:101
bool rw_lock_own_flagged(const rw_lock_t *lock, rw_lock_flags_t flags)
Checks if the thread has locked the rw-lock in the specified mode, with the pass value == 0.
Definition: sync0rw.cc:898
latch_level_t
Latching order levels.
Definition: sync0types.h:201
@ RW_LOCK_S
Definition: sync0types.h:208
@ RW_LOCK_X
Definition: sync0types.h:209
@ RW_LOCK_FLAG_X
Definition: sync0types.h:1216
@ RW_LOCK_FLAG_SX
Definition: sync0types.h:1217
@ RW_LOCK_FLAG_S
Definition: sync0types.h:1215
Version control for database, common definitions, and include files.
constexpr uint32_t UINT32_UNDEFINED
The 'undefined' value for a 32-bit unsigned integer.
Definition: univ.i:428
#define UNIV_PAGE_SIZE_SHIFT
The 2-logarithm of UNIV_PAGE_SIZE:
Definition: univ.i:291
#define IF_DEBUG(...)
Definition: univ.i:674
unsigned long int ulint
Definition: univ.i:406
#define UNIV_MEM_VALID(addr, size)
Definition: univ.i:591
constexpr uint32_t UNIV_ZIP_SIZE_MIN
Smallest compressed page size.
Definition: univ.i:330
Utilities for byte operations.
#define ut_ad(EXPR)
Debug assertion.
Definition: ut0dbg.h:105
#define ut_d(EXPR)
Debug statement.
Definition: ut0dbg.h:107
#define ut_a(EXPR)
Abort execution if EXPR does not evaluate to nonzero.
Definition: ut0dbg.h:93
void ut_list_validate(const List &list, Functor &functor)
Checks the consistency of a two-way list.
Definition: ut0lst.h:493
#define mutex_own(M)
Checks that the current thread owns the mutex.
Definition: ut0mutex.h:165
#define mutex_exit(M)
Definition: ut0mutex.h:123
#define mutex_enter(M)
Definition: ut0mutex.h:117
Various utilities.
static uint64_t lsn
Definition: xcom_base.cc:446
unsigned long id[MAX_DEAD]
Definition: xcom_base.cc:510
int n
Definition: xcom_base.cc:509