MySQL 8.0.39
Source Code Documentation
|
Standard external sort. More...
#include "sql/filesort.h"
#include <limits.h>
#include <math.h>
#include <stddef.h>
#include <stdio.h>
#include <string.h>
#include <algorithm>
#include <atomic>
#include <memory>
#include <new>
#include <optional>
#include <vector>
#include "add_with_saturate.h"
#include "decimal.h"
#include "field_types.h"
#include "m_ctype.h"
#include "map_helpers.h"
#include "my_basename.h"
#include "my_bitmap.h"
#include "my_byteorder.h"
#include "my_compiler.h"
#include "my_config.h"
#include "my_dbug.h"
#include "my_inttypes.h"
#include "my_loglevel.h"
#include "my_sys.h"
#include "mysql/components/services/log_builtins.h"
#include "mysql/components/services/log_shared.h"
#include "mysql/psi/mysql_file.h"
#include "mysql/service_mysql_alloc.h"
#include "mysql/udf_registration_types.h"
#include "mysql_com.h"
#include "mysqld_error.h"
#include "priority_queue.h"
#include "sql-common/json_dom.h"
#include "sql/auth/sql_security_ctx.h"
#include "sql/bounded_queue.h"
#include "sql/cmp_varlen_keys.h"
#include "sql/debug_sync.h"
#include "sql/derror.h"
#include "sql/error_handler.h"
#include "sql/field.h"
#include "sql/filesort_utils.h"
#include "sql/handler.h"
#include "sql/item.h"
#include "sql/item_subselect.h"
#include "sql/iterators/row_iterator.h"
#include "sql/iterators/sorting_iterator.h"
#include "sql/key_spec.h"
#include "sql/malloc_allocator.h"
#include "sql/merge_many_buff.h"
#include "sql/my_decimal.h"
#include "sql/mysqld.h"
#include "sql/opt_costmodel.h"
#include "sql/opt_trace.h"
#include "sql/opt_trace_context.h"
#include "sql/pfs_batch_mode.h"
#include "sql/psi_memory_key.h"
#include "sql/sort_param.h"
#include "sql/sql_array.h"
#include "sql/sql_base.h"
#include "sql/sql_bitmap.h"
#include "sql/sql_class.h"
#include "sql/sql_const.h"
#include "sql/sql_error.h"
#include "sql/sql_lex.h"
#include "sql/sql_optimizer.h"
#include "sql/sql_sort.h"
#include "sql/system_variables.h"
#include "sql/table.h"
#include "sql/thr_malloc.h"
#include "sql/tztime.h"
#include "sql_string.h"
#include "template_utils.h"
Classes | |
struct | anonymous_namespace{filesort.cc}::Mem_compare_queue_key |
class | Filesort_error_handler |
Error handler for filesort. More... | |
Namespaces | |
namespace | anonymous_namespace{filesort.cc} |
Functions | |
static ha_rows | read_all_rows (THD *thd, Sort_param *param, const Mem_root_array< TABLE * > &tables, table_map tables_to_get_rowid_for, Filesort_info *fs_info, IO_CACHE *chunk_file, IO_CACHE *tempfile, Bounded_queue< uchar *, uchar *, Sort_param, Mem_compare_queue_key > *pq, RowIterator *source_iterator, ha_rows *found_rows, size_t *longest_key, size_t *longest_addons) |
Read all rows, and write them into a temporary file (if we run out of space in the sort buffer). More... | |
static int | write_keys (Sort_param *param, Filesort_info *fs_info, uint count, IO_CACHE *buffer_file, IO_CACHE *tempfile) |
static int | merge_index (THD *thd, Sort_param *param, Sort_buffer sort_buffer, Merge_chunk_array chunk_array, IO_CACHE *tempfile, IO_CACHE *outfile) |
static bool | save_index (Sort_param *param, uint count, Filesort_info *table_sort, Sort_result *sort_result) |
This function is used only if the entire result set fits in memory. More... | |
static bool | check_if_pq_applicable (Opt_trace_context *trace, Sort_param *param, Filesort_info *filesort_info, ha_rows num_rows, ulong memory_available) |
Test whether priority queue is worth using to get top elements of an ordered result set. More... | |
static void | trace_filesort_information (Opt_trace_context *trace, const st_sort_field *sortorder, uint s_length) |
bool | filesort (THD *thd, Filesort *filesort, RowIterator *source_iterator, table_map tables_to_get_rowid_for, ha_rows num_rows_estimate, Filesort_info *fs_info, Sort_result *sort_result, ha_rows *found_rows) |
Sort a table. More... | |
void | filesort_free_buffers (TABLE *table, bool full) |
static void | dbug_print_record (TABLE *table, bool print_rowid) |
static bool | alloc_and_make_sortkey (Sort_param *param, Filesort_info *fs_info, const Mem_root_array< TABLE * > &tables, size_t *key_length, size_t *longest_addons) |
static NO_INLINE uint | make_json_sort_key (Item *item, uchar *to, uchar *null_indicator, size_t length, ulonglong *hash) |
Make a sort key for the JSON value in an Item. More... | |
bool | anonymous_namespace{filesort.cc}::write_uint8_overflows (uint8_t val, uchar *to_end, uchar **to) |
bool | anonymous_namespace{filesort.cc}::clear_overflows (size_t num_bytes, uchar *to_end, uchar **to) |
bool | anonymous_namespace{filesort.cc}::advance_overflows (size_t num_bytes, uchar *to_end, uchar **to) |
size_t | anonymous_namespace{filesort.cc}::make_sortkey_from_item (Item *item, Item_result result_type, std::optional< size_t > dst_length, String *tmp_buffer, uchar *to, uchar *to_end, bool *maybe_null, ulonglong *hash) |
static uint | read_to_buffer (IO_CACHE *fromfile, Merge_chunk *merge_chunk, Sort_param *param) |
Read from a disk file into the merge chunk's buffer. More... | |
static int | copy_bytes (IO_CACHE *to_file, IO_CACHE *from_file, size_t count, my_off_t offset) |
Copy “count” bytes from one file, starting at offset “offset”, to the current write position (usually the end) of the other. More... | |
static int | copy_row (IO_CACHE *to_file, IO_CACHE *from_file, Merge_chunk *merge_chunk, uint offset, uint bytes_to_write) |
Copy a row from “from_file” to “to_file” (this is used during merging). More... | |
static int | merge_buffers (THD *thd, Sort_param *param, IO_CACHE *from_file, IO_CACHE *to_file, Sort_buffer sort_buffer, Merge_chunk *last_chunk, Merge_chunk_array chunk_array, bool include_keys) |
Merge buffers to one buffer. More... | |
uint | sortlength (THD *thd, st_sort_field *sortorder, uint s_length) |
Calculate length of sort key. More... | |
bool | SortWillBeOnRowId (const TABLE *table) |
void | change_double_for_sort (double nr, uchar *to) |
Standard external sort.
We read rows into a buffer until there's no more room. At that point, we use it (using the sorting algorithms from STL), and write it to disk (thus the name “filesort”). When there are no more rows, we merge chunks recursively, seven and seven (although we can go all the way up to 15 in the final pass if it helps us do one pass less).
If all the rows fit in a single chunk, the data never hits disk, but remains in RAM.
|
static |
void change_double_for_sort | ( | double | nr, |
uchar * | to | ||
) |
|
static |
Test whether priority queue is worth using to get top elements of an ordered result set.
If it is, then allocates buffer for required amount of records
trace | Current trace context. |
param | Sort parameters. |
filesort_info | Filesort information. |
num_rows | Estimate of number of rows in source record set. |
memory_available | Memory available for sorting. |
DESCRIPTION Given a query like this: SELECT ... FROM t ORDER BY a1,...,an LIMIT max_rows; This function tests whether a priority queue can be used to keep the result (ie., there is enough memory to store <max_rows> rows).
|
static |
Copy “count” bytes from one file, starting at offset “offset”, to the current write position (usually the end) of the other.
|
static |
Copy a row from “from_file” to “to_file” (this is used during merging).
Most commonly, we'll already have all (or most) of it in memory, as indicated by “merge_chunk”, which must be positioned on the row. But in very tight circumstances (see read_to_buffer(), some of it may still be on disk, and will need to be copied directly from file to file.
|
static |
bool filesort | ( | THD * | thd, |
Filesort * | filesort, | ||
RowIterator * | source_iterator, | ||
table_map | tables_to_get_rowid_for, | ||
ha_rows | num_rows_estimate, | ||
Filesort_info * | fs_info, | ||
Sort_result * | sort_result, | ||
ha_rows * | found_rows | ||
) |
Sort a table.
Creates a set of pointers that can be used to read the rows in sorted order. This should be done with the functions in records.cc.
The result set is stored in fs_info->io_cache or fs_info->sorted_result, or left in the main filesort buffer.
thd | Current thread | |
filesort | How to sort the table | |
source_iterator | Where to read the rows to be sorted from. | |
tables_to_get_rowid_for | Which tables we are responsible for getting row IDs for. Tables in this set that are not also in "tables" are ignored. | |
num_rows_estimate | How many rows source_iterator is expected to produce. Only used for whether we intend to use the priority queue optimization or not; if we estimate fewer rows than we can fit into RAM, we never use the priority queue. | |
fs_info | Owns the buffers for sort_result. | |
sort_result | Where to store the sort result. | |
[out] | found_rows | Store the number of found rows here. This is the number of found rows after applying WHERE condition. |
void filesort_free_buffers | ( | TABLE * | table, |
bool | full | ||
) |
|
static |
Make a sort key for the JSON value in an Item.
This function is called by Sort_param::make_sortkey(). We don't want it to be inlined, since that seemed to have a negative impact on some performance tests.
[in] | item | The item for which to create a sort key. |
[out] | to | Pointer into the buffer to which the sort key should be written. It will point to where the data portion of the key should start. |
[out] | null_indicator | For nullable items, the NULL indicator byte. (Ignored otherwise.) Should be initialized by the caller to a value that indicates not NULL. |
[in] | length | The length of the sort key, not including the NULL indicator byte at the beginning of the sort key for nullable items. |
[in,out] | hash | The hash key of the JSON values in the current row. |
|
static |
Merge buffers to one buffer.
thd | thread context | |
param | Sort parameter | |
from_file | File with source data (Merge_chunks point to this file) | |
to_file | File to write the sorted result data. | |
sort_buffer | Buffer for data to store up to MERGEBUFF2 sort keys. | |
[out] | last_chunk | Store here Merge_chunk describing data written to to_file. |
chunk_array | Array of chunks to merge. | |
include_keys | If true, write both the keys and the addons / row positions. If false, the keys will be skipped (useful only for the output of the final merge, where we don't need to compare rows further). |
|
static |
|
static |
Read all rows, and write them into a temporary file (if we run out of space in the sort buffer).
All produced sequences are guaranteed to be non-empty.
thd | Thread handle | |
param | Sorting parameter | |
tables | List of all tables being sorted. | |
tables_to_get_rowid_for | Which tables we are responsible for getting row IDs for. Tables in this set that are not also in "tables" are ignored. | |
fs_info | Struct containing sort buffer etc. | |
chunk_file | File to write Merge_chunks describing sorted segments in tempfile. | |
tempfile | File to write sorted sequences of sortkeys to. | |
pq | If !NULL, use it for keeping top N elements | |
source_iterator | Where to read the rows to be sorted from. | |
[out] | found_rows | The number of FOUND_ROWS(). For a query with LIMIT, this value will typically be larger than the function return value. |
[out] | longest_key | The largest single key found, in bytes. |
[out] | longest_addons | The longest addon field row (sum of all addon fields for any single given row) found. |
while (get_next_sortkey()) { if (using priority queue) push sort key into queue else { try to put sort key into buffer; if (no free space in sort buffer) { do { allocate new, larger buffer; retry putting sort key into buffer; } until (record fits or no space for new buffer) if (no space for new buffer) { sort record pointers (all buffers); dump sorted sequence to 'tempfile'; dump Merge_chunk describing sequence location into 'chunk_file'; } } if (key was packed) tell sort buffer the actual number of bytes used; } } if (buffer has some elements && dumped at least once) sort-dump-dump as above; else don't sort, leave sort buffer to be sorted by caller.
|
static |
Read from a disk file into the merge chunk's buffer.
We generally read as many complete rows as we can, except when bounded by max_keys() or rowcount(). Incomplete rows will be left in the file.
|
static |
This function is used only if the entire result set fits in memory.
For addon fields, we keep the result in the filesort buffer. This saves us a lot of memcpy calls.
For row references, we copy the final sorted result into a buffer, but we do not copy the actual sort-keys, as they are no longer needed. We could have kept the result in the sort buffere here as well, but the new buffer - containing only row references - is probably a lot smaller.
The result data will be unpacked by SortBufferIterator or SortBufferIndirectIterator
Note that SortBufferIterator does not have access to a Sort_param. It does however have access to a Filesort_info, which knows whether we have variable sized keys or not. TODO: consider templatizing SortBufferIterator on is_varlen or not.
[in] | param | Sort parameters. |
count | Number of records | |
[in,out] | table_sort | Information used by SortBufferIterator / SortBufferIndirectIterator |
[out] | sort_result | Where to store the actual result |
uint sortlength | ( | THD * | thd, |
st_sort_field * | sortorder, | ||
uint | s_length | ||
) |
Calculate length of sort key.
Declared here so we can unit test it.
thd | Thread handler |
sortorder | Order of items to sort |
s_length | Number of items to sort |
bool SortWillBeOnRowId | ( | const TABLE * | table | ) |
|
static |
|
static |
Sort the buffer and write:
param | Sort parameters |
fs_info | Contains the buffer to be sorted and written. |
count | Number of records to write. |
chunk_file | One 'Merge_chunk' struct will be written into this file. The Merge_chunk::{file_pos, count} will indicate where the sorted data was stored. |
tempfile | The sorted sequence will be written into this file. |