mysql-server/latest/sql__sort_8h_source.html

#ifndef SQL_SORT_INCLUDED

#define SQL_SORT_INCLUDED


/* Copyright (c) 2000, 2025, Oracle and/or its affiliates.


   This program is free software; you can redistribute it and/or modify

   it under the terms of the GNU General Public License, version 2.0,

   as published by the Free Software Foundation.


   This program is designed to work with certain software (including

   but not limited to OpenSSL) that is licensed under separate terms,

   as designated in a particular file or component or in included license

   documentation.  The authors of MySQL hereby grant you an additional

   permission to link the program and your derivative works with the

   separately licensed software that they have either included with

   the program or referenced in the documentation.


   This program is distributed in the hope that it will be useful,

   but WITHOUT ANY WARRANTY; without even the implied warranty of

   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

   GNU General Public License, version 2.0, for more details.


   You should have received a copy of the GNU General Public License

   along with this program; if not, write to the Free Software

   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301  USA */


#include <assert.h>

#include "map_helpers.h"

#include "my_base.h"  // ha_rows


#include "my_sys.h"

#include "sql/filesort_utils.h"  // Filesort_buffer

#include "sql/mem_root_array.h"


class Addon_fields;

struct TABLE;


/* Defines used by filesort and uniques */


// Merge tuning constants shared by filesort and Unique. Their exact meaning is
// defined by the code that consumes them, which is not part of this header.
// NOTE(review): presumably MERGEBUFF is the number of chunks merged at a time
// and MERGEBUFF2 the chunk-count threshold that triggers an extra merge pass --
// confirm against the filesort implementation.
constexpr size_t MERGEBUFF = 7;

constexpr size_t MERGEBUFF2 = 15;

// Number of bytes used to store varlen key's length

constexpr size_t VARLEN_PREFIX = 4;


/**

  Descriptor for a merge chunk to be sort-merged.

  A merge chunk is a sequence of pre-sorted records, written to a

  temporary file. A Merge_chunk instance describes where this chunk is stored

  in the file, and where it is located when it is in memory.


  It is kept trivially copyable (only pointer and integer members) because
  we read/write instances from/to files (but note, only m_file_position and
  m_rowcount are actually used in that situation).


  We have accessors (getters/setters) for all struct members.

 */

struct Merge_chunk {

 public:

  my_off_t file_position() const { return m_file_position; }

  void set_file_position(my_off_t val) { m_file_position = val; }

  void advance_file_position(my_off_t val) { m_file_position += val; }


  uchar *buffer_start() { return m_buffer_start; }

  const uchar *buffer_end() const { return m_buffer_end; }

  const uchar *valid_buffer_end() const { return m_valid_buffer_end; }


  void set_buffer(uchar *start, uchar *end) {

    m_buffer_start = start;

    m_buffer_end = end;

  }

  void set_buffer_start(uchar *start) { m_buffer_start = start; }

  void set_buffer_end(uchar *end) {

    assert(m_buffer_end == nullptr || end <= m_buffer_end);

    m_buffer_end = end;

  }

  void set_valid_buffer_end(uchar *end) {

    assert(end <= m_buffer_end);

    m_valid_buffer_end = end;

  }


  void init_current_key() { m_current_key = m_buffer_start; }

  uchar *current_key() const { return m_current_key; }

  void advance_current_key(uint val) { m_current_key += val; }


  void decrement_rowcount(ha_rows val) { m_rowcount -= val; }

  void set_rowcount(ha_rows val) { m_rowcount = val; }

  ha_rows rowcount() const { return m_rowcount; }


  ha_rows mem_count() const { return m_mem_count; }

  void set_mem_count(ha_rows val) { m_mem_count = val; }

  ha_rows decrement_mem_count() { return --m_mem_count; }


  ha_rows max_keys() const { return m_max_keys; }

  void set_max_keys(ha_rows val) { m_max_keys = val; }


  size_t buffer_size() const { return m_buffer_end - m_buffer_start; }


  /**

    Tries to merge *this with *mc, returns true if successful.

    The assumption is that *this is no longer in use,

    and the space it has been allocated can be handed over to a

    buffer which is adjacent to it.

   */

  bool merge_freed_buff(Merge_chunk *mc) const {

    if (mc->m_buffer_end == m_buffer_start) {

      mc->m_buffer_end = m_buffer_end;

      mc->m_max_keys += m_max_keys;

      return true;

    } else if (mc->m_buffer_start == m_buffer_end) {

      mc->m_buffer_start = m_buffer_start;

      mc->m_max_keys += m_max_keys;

      return true;

    }

    return false;

  }


 private:

  /// The current key for this chunk.

  uchar *m_current_key = nullptr;


  /// Current position in the file to be sorted.

  my_off_t m_file_position = 0;


  /// Start of main-memory buffer for this chunk.

  uchar *m_buffer_start = nullptr;


  /// End of main-memory buffer for this chunk.

  uchar *m_buffer_end = nullptr;


  /// End of actual, valid data for this chunk.

  uchar *m_valid_buffer_end;


  /// Number of unread rows in this chunk.

  ha_rows m_rowcount = 0;


  /// Number of rows in the main-memory buffer.

  ha_rows m_mem_count = 0;


  /// If we have fixed-size rows: max number of rows in buffer.

  ha_rows m_max_keys = 0;

};


/// Bounds-checked array of merge chunk descriptors.
using Merge_chunk_array = Bounds_checked_array<Merge_chunk>;


/*

  The result of Unique or filesort; can either be stored on disk

  (in which case io_cache points to the file) or in memory in one

  of two ways. See sorted_result_in_fsbuf.


  Note if sort_result points into memory, it does _not_ own the sort buffer;

  Filesort_info does.


  TODO: Clean up so that Filesort / Filesort_info / Filesort_buffer /

  Sort_result have less confusing overlap.

*/

class Sort_result {
 public:
  /// Every member starts out from its in-class default initializer.
  Sort_result() {}

  /// @return true if the sorted result is held in memory, either left in the
  ///         filesort buffer or copied into the sorted_result buffer.
  bool has_result_in_memory() const {
    if (sorted_result_in_fsbuf) return true;
    return sorted_result != nullptr;
  }

  /// @return true if there is a result in memory, or if io_cache is set and
  ///         my_b_inited() reports it as initialized.
  bool has_result() const {
    if (has_result_in_memory()) return true;
    return io_cache != nullptr && my_b_inited(io_cache);
  }

  /// File holding the result when it is stored on disk.
  IO_CACHE *io_cache = nullptr;

  /**
    When the whole result fits in memory, the merge phase is skipped.
    The result is then either left in the parent Filesort_info's
    filesort_buffer (flagged by sorted_result_in_fsbuf), or the sort keys
    are stripped away and the sorted result is copied into a new buffer.
    Unique always uses the latter.
    That new buffer is [sorted_result ... sorted_result_end]
    @see save_index()
   */
  bool sorted_result_in_fsbuf = false;
  unique_ptr_my_free<uchar> sorted_result{nullptr};
  uchar *sorted_result_end = nullptr;

  ha_rows found_records = 0;  ///< How many records in sort.
};


/**

  A class wrapping misc buffers used for sorting.

 */

class Filesort_info {
  /// Buffer for sorting keys. All buffer operations below forward to it.
  Filesort_buffer filesort_buffer;

 public:
  Merge_chunk_array merge_chunks;  ///< Array of chunk descriptors

  Addon_fields *addon_fields = nullptr;  ///< Addon field descriptors.

  bool m_using_varlen_keys = false;
  uint m_sort_length = 0;

  /// Members take their values from the in-class default initializers.
  Filesort_info() {}

  // Not copyable.
  Filesort_info(const Filesort_info &) = delete;
  Filesort_info &operator=(const Filesort_info &) = delete;

  // --- Sort key configuration -------------------------------------------

  /// Records the sort length and whether variable-length keys are used.
  void set_sort_length(uint val, bool is_varlen) {
    m_using_varlen_keys = is_varlen;
    m_sort_length = val;
  }

  /// @return the sort length last stored by set_sort_length().
  uint sort_length() const { return m_sort_length; }

  /// @return whether variable-length keys are in use.
  bool using_varlen_keys() const { return m_using_varlen_keys; }

  // --- Addon fields and chunk descriptors --------------------------------

  /// Are we using "addon fields"?
  bool using_addon_fields() const {
    const bool have_addons = (addon_fields != nullptr);
    return have_addons;
  }

  /**
    Unpacks the values that were appended to the sorted fields, copying them
    from a buffer back to their regular positions given by the Field::ptr
    pointers.
    @param tables  Tables in the join; for NULL row flags.
    @param buff    Buffer which to unpack the value from.
  */
  template <bool Packed_addon_fields>
  inline void unpack_addon_fields(const Mem_root_array<TABLE *> &tables,
                                  uchar *buff);

  /**
    Reads 'count' chunk descriptors into the merge_chunks array.
    On error, the merge_chunks array will be empty.
    @param chunk_file File containing the descriptors.
    @param count      Number of chunks to read.
  */
  void read_chunk_descriptors(IO_CACHE *chunk_file, uint count);

  // --- Buffer sizing and lifetime (forwarded to filesort_buffer) ---------

  /// Forwards the memory limit and record length to the sort buffer.
  void set_max_size(size_t max_size, size_t record_length) {
    filesort_buffer.set_max_size(max_size, record_length);
  }

  /// @return the sort buffer's maximum size in bytes.
  size_t max_size_in_bytes() const {
    const size_t limit = filesort_buffer.max_size_in_bytes();
    return limit;
  }

  /// @return the sort buffer's peak memory usage.
  size_t peak_memory_used() const {
    const size_t peak = filesort_buffer.peak_memory_used();
    return peak;
  }

  /// Clears the sort buffer's peak memory statistic.
  void clear_peak_memory_used() { filesort_buffer.clear_peak_memory_used(); }

  /// Forwards to Filesort_buffer::reset().
  void reset() { filesort_buffer.reset(); }

  /// Forwards to Filesort_buffer::free_sort_buffer().
  void free_sort_buffer() { filesort_buffer.free_sort_buffer(); }

  /// Forwards to Filesort_buffer::preallocate_records().
  /// @return whatever the underlying call returns.
  bool preallocate_records(size_t num_records) {
    const bool result = filesort_buffer.preallocate_records(num_records);
    return result;
  }

  // --- Filling, sorting and reading records (forwarded) ------------------

  /// @return the location where the next record should be stored.
  Bounds_checked_array<uchar> get_next_record_pointer(size_t min_size) {
    return filesort_buffer.get_next_record_pointer(min_size);
  }

  /// Forwards to Filesort_buffer::commit_used_memory().
  void commit_used_memory(size_t num_bytes) {
    filesort_buffer.commit_used_memory(num_bytes);
  }

  /** Sort filesort_buffer
    @return Number of records, after any deduplication
   */
  size_t sort_buffer(Sort_param *param, size_t num_input_rows,
                     size_t max_output_rows) {
    const size_t num_output_rows =
        filesort_buffer.sort_buffer(param, num_input_rows, max_output_rows);
    return num_output_rows;
  }

  /// @return sorted record number idx from the sort buffer.
  uchar *get_sorted_record(uint idx) {
    uchar *record = filesort_buffer.get_sorted_record(idx);
    return record;
  }

  /// @return the sort buffer's array of record pointers.
  uchar **get_sort_keys() {
    uchar **keys = filesort_buffer.get_sort_keys();
    return keys;
  }

  /// Forwards to Filesort_buffer::get_contiguous_buffer().
  Bounds_checked_array<uchar> get_contiguous_buffer() {
    return filesort_buffer.get_contiguous_buffer();
  }
};


/// Bounds-checked view of a uchar buffer used for sorting.
using Sort_buffer = Bounds_checked_array<uchar>;


/**

  Put all room used by freed buffer to use in adjacent buffer.


  Note, that we can't simply distribute memory evenly between all buffers,

  because new areas must not overlap with old ones.

*/

/// Walks the heap in iteration order and hands the buffer of old_top over to
/// the first element for which Merge_chunk::merge_freed_buff() succeeds.
/// Reaching the end of the heap without success trips an assert.
/// @param old_top  Chunk whose buffer space is being given away.
/// @param heap     Container of candidate chunks; must provide begin()/end().
template <typename Heap_type>
void reuse_freed_buff(Merge_chunk *old_top, Heap_type *heap) {
  typename Heap_type::iterator candidate = heap->begin();
  typename Heap_type::iterator heap_end = heap->end();
  while (candidate != heap_end) {
    if (old_top->merge_freed_buff(*candidate)) {
      return;  // Space handed over; nothing more to do.
    }
    ++candidate;
  }
  // No heap element accepted the freed buffer.
  assert(0);
}


#endif /* SQL_SORT_INCLUDED */

nullptr
Kerberos Client Authentication nullptr
Definition: auth_kerberos_client_plugin.cc:247

Addon_fields
This class wraps information about usage of addon fields.
Definition: sort_param.h:129

Bounds_checked_array< Merge_chunk >

Filesort_buffer
Buffer used for storing records to be sorted.
Definition: filesort_utils.h:81

Filesort_buffer::get_sort_keys
uchar ** get_sort_keys()
Get the list of record pointers as a contiguous array.
Definition: filesort_utils.h:191

Filesort_buffer::reset
void reset()
Prepares the buffer for the next batch of records to process.
Definition: filesort_utils.cc:249

Filesort_buffer::preallocate_records
bool preallocate_records(size_t num_records)
Removes any existing rows and allocates num_records maximum-sized rows (call get_sorted_record() to g...
Definition: filesort_utils.cc:277

Filesort_buffer::get_next_record_pointer
Bounds_checked_array< uchar > get_next_record_pointer(size_t min_size)
Where should the next record be stored?
Definition: filesort_utils.h:116

Filesort_buffer::peak_memory_used
size_t peak_memory_used() const
How much memory has been allocated (counting both the sort buffer and the record pointers) at most si...
Definition: filesort_utils.h:153

Filesort_buffer::clear_peak_memory_used
void clear_peak_memory_used()
See peak_memory_used.
Definition: filesort_utils.h:159

Filesort_buffer::sort_buffer
size_t sort_buffer(Sort_param *param, size_t num_input_rows, size_t max_output_rows)
Sort me...
Definition: filesort_utils.cc:131

Filesort_buffer::free_sort_buffer
void free_sort_buffer()
Frees all memory.
Definition: filesort_utils.cc:415

Filesort_buffer::commit_used_memory
void commit_used_memory(size_t num_bytes)
Definition: filesort_utils.h:129

Filesort_buffer::get_contiguous_buffer
Bounds_checked_array< uchar > get_contiguous_buffer()
Clears all rows, then returns a contiguous buffer of maximum size.
Definition: filesort_utils.cc:437

Filesort_buffer::max_size_in_bytes
size_t max_size_in_bytes() const
Definition: filesort_utils.h:145

Filesort_buffer::set_max_size
void set_max_size(size_t max_size, size_t record_length)
Set the memory limit for the sort buffer before starting to add records.
Definition: filesort_utils.h:171

Filesort_buffer::get_sorted_record
uchar * get_sorted_record(size_t ix)
Gets sorted record number ix.
Definition: filesort_utils.h:200

Filesort_info
A class wrapping misc buffers used for sorting.
Definition: sql_sort.h:189

Filesort_info::free_sort_buffer
void free_sort_buffer()
Definition: sql_sort.h:261

Filesort_info::addon_fields
Addon_fields * addon_fields
Addon field descriptors.
Definition: sql_sort.h:196

Filesort_info::preallocate_records
bool preallocate_records(size_t num_records)
Definition: sql_sort.h:263

Filesort_info::clear_peak_memory_used
void clear_peak_memory_used()
Definition: sql_sort.h:237

Filesort_info::operator=
Filesort_info & operator=(const Filesort_info &)=delete

Filesort_info::get_sort_keys
uchar ** get_sort_keys()
Definition: sql_sort.h:251

Filesort_info::commit_used_memory
void commit_used_memory(size_t num_bytes)
Definition: sql_sort.h:243

Filesort_info::unpack_addon_fields
void unpack_addon_fields(const Mem_root_array< TABLE * > &tables, uchar *buff)
Copies (unpacks) values appended to sorted fields from a buffer back to their regular positions speci...
Definition: sorting_iterator.cc:550

Filesort_info::Filesort_info
Filesort_info()
Definition: sql_sort.h:204

Filesort_info::using_addon_fields
bool using_addon_fields() const
Are we using "addon fields"?
Definition: sql_sort.h:233

Filesort_info::read_chunk_descriptors
void read_chunk_descriptors(IO_CACHE *chunk_file, uint count)
Reads 'count' number of chunk descriptors into the merge_chunks array.
Definition: filesort.cc:709

Filesort_info::m_using_varlen_keys
bool m_using_varlen_keys
Definition: sql_sort.h:198

Filesort_info::set_sort_length
void set_sort_length(uint val, bool is_varlen)
Definition: sql_sort.h:276

Filesort_info::using_varlen_keys
bool using_varlen_keys() const
Definition: sql_sort.h:274

Filesort_info::merge_chunks
Merge_chunk_array merge_chunks
Array of chunk descriptors.
Definition: sql_sort.h:194

Filesort_info::filesort_buffer
Filesort_buffer filesort_buffer
Buffer for sorting keys.
Definition: sql_sort.h:191

Filesort_info::m_sort_length
uint m_sort_length
Definition: sql_sort.h:199

Filesort_info::sort_buffer
size_t sort_buffer(Sort_param *param, size_t num_input_rows, size_t max_output_rows)
Sort filesort_buffer.
Definition: sql_sort.h:209

Filesort_info::max_size_in_bytes
size_t max_size_in_bytes() const
Definition: sql_sort.h:269

Filesort_info::get_sorted_record
uchar * get_sorted_record(uint idx)
Definition: sql_sort.h:247

Filesort_info::get_contiguous_buffer
Bounds_checked_array< uchar > get_contiguous_buffer()
Definition: sql_sort.h:253

Filesort_info::reset
void reset()
Definition: sql_sort.h:235

Filesort_info::set_max_size
void set_max_size(size_t max_size, size_t record_length)
Definition: sql_sort.h:257

Filesort_info::sort_length
uint sort_length() const
Definition: sql_sort.h:273

Filesort_info::peak_memory_used
size_t peak_memory_used() const
Definition: sql_sort.h:267

Filesort_info::get_next_record_pointer
Bounds_checked_array< uchar > get_next_record_pointer(size_t min_size)
Definition: sql_sort.h:239

Filesort_info::Filesort_info
Filesort_info(const Filesort_info &)=delete

Mem_root_array
A typesafe replacement for DYNAMIC_ARRAY.
Definition: mem_root_array.h:432

Sort_param
There are several record formats for sorting:
Definition: sort_param.h:302

Sort_result
Definition: sql_sort.h:156

Sort_result::io_cache
IO_CACHE * io_cache
Definition: sql_sort.h:168

Sort_result::has_result
bool has_result() const
Definition: sql_sort.h:164

Sort_result::sorted_result
unique_ptr_my_free< uchar > sorted_result
Definition: sql_sort.h:180

Sort_result::Sort_result
Sort_result()
Definition: sql_sort.h:158

Sort_result::sorted_result_end
uchar * sorted_result_end
Definition: sql_sort.h:181

Sort_result::has_result_in_memory
bool has_result_in_memory() const
Definition: sql_sort.h:160

Sort_result::sorted_result_in_fsbuf
bool sorted_result_in_fsbuf
If the entire result fits in memory, we skip the merge phase.
Definition: sql_sort.h:179

Sort_result::found_records
ha_rows found_records
How many records in sort.
Definition: sql_sort.h:183

filesort_utils.h

my_b_inited
bool my_b_inited(const IO_CACHE *info)
Definition: my_sys.h:486

start
static void start(mysql_harness::PluginFuncEnv *env)
Definition: http_auth_backend_plugin.cc:180

map_helpers.h

unique_ptr_my_free
std::unique_ptr< T, My_free_deleter > unique_ptr_my_free
std::unique_ptr, but with my_free as deleter.
Definition: map_helpers.h:97

mem_root_array.h

my_base.h
This file includes constants used by all storage engines.

ha_rows
my_off_t ha_rows
Definition: my_base.h:1141

my_off_t
ulonglong my_off_t
Definition: my_inttypes.h:72

uchar
unsigned char uchar
Definition: my_inttypes.h:52

my_sys.h
Common header for many mysys elements.

count
static int count
Definition: myisam_ftdump.cc:45

rules_table_service::end
Cursor end()
A past-the-end Cursor.
Definition: rules_table_service.cc:192

MERGEBUFF2
constexpr size_t MERGEBUFF2
Definition: sql_sort.h:41

Merge_chunk_array
Bounds_checked_array< Merge_chunk > Merge_chunk_array
Definition: sql_sort.h:143

MERGEBUFF
constexpr size_t MERGEBUFF
Definition: sql_sort.h:40

VARLEN_PREFIX
constexpr size_t VARLEN_PREFIX
Definition: sql_sort.h:43

reuse_freed_buff
void reuse_freed_buff(Merge_chunk *old_top, Heap_type *heap)
Put all room used by freed buffer to use in adjacent buffer.
Definition: sql_sort.h:291

Sort_buffer
Bounds_checked_array< uchar > Sort_buffer
Definition: sql_sort.h:282

IO_CACHE
Definition: my_sys.h:337

Merge_chunk
Descriptor for a merge chunk to be sort-merged.
Definition: sql_sort.h:57

Merge_chunk::buffer_end
const uchar * buffer_end() const
Definition: sql_sort.h:64

Merge_chunk::m_buffer_start
uchar * m_buffer_start
Start of main-memory buffer for this chunk.
Definition: sql_sort.h:125

Merge_chunk::init_current_key
void init_current_key()
Definition: sql_sort.h:81

Merge_chunk::merge_freed_buff
bool merge_freed_buff(Merge_chunk *mc) const
Tries to merge *this with *mc, returns true if successful.
Definition: sql_sort.h:104

Merge_chunk::m_rowcount
ha_rows m_rowcount
Number of unread rows in this chunk.
Definition: sql_sort.h:134

Merge_chunk::set_mem_count
void set_mem_count(ha_rows val)
Definition: sql_sort.h:90

Merge_chunk::set_buffer_start
void set_buffer_start(uchar *start)
Definition: sql_sort.h:71

Merge_chunk::advance_current_key
void advance_current_key(uint val)
Definition: sql_sort.h:83

Merge_chunk::mem_count
ha_rows mem_count() const
Definition: sql_sort.h:89

Merge_chunk::set_file_position
void set_file_position(my_off_t val)
Definition: sql_sort.h:60

Merge_chunk::set_max_keys
void set_max_keys(ha_rows val)
Definition: sql_sort.h:94

Merge_chunk::advance_file_position
void advance_file_position(my_off_t val)
Definition: sql_sort.h:61

Merge_chunk::m_file_position
my_off_t m_file_position
Current position in the file to be sorted.
Definition: sql_sort.h:122

Merge_chunk::m_valid_buffer_end
uchar * m_valid_buffer_end
End of actual, valid data for this chunk.
Definition: sql_sort.h:131

Merge_chunk::rowcount
ha_rows rowcount() const
Definition: sql_sort.h:87

Merge_chunk::decrement_rowcount
void decrement_rowcount(ha_rows val)
Definition: sql_sort.h:85

Merge_chunk::set_valid_buffer_end
void set_valid_buffer_end(uchar *end)
Definition: sql_sort.h:76

Merge_chunk::set_buffer
void set_buffer(uchar *start, uchar *end)
Definition: sql_sort.h:67

Merge_chunk::file_position
my_off_t file_position() const
Definition: sql_sort.h:59

Merge_chunk::decrement_mem_count
ha_rows decrement_mem_count()
Definition: sql_sort.h:91

Merge_chunk::set_rowcount
void set_rowcount(ha_rows val)
Definition: sql_sort.h:86

Merge_chunk::set_buffer_end
void set_buffer_end(uchar *end)
Definition: sql_sort.h:72

Merge_chunk::buffer_size
size_t buffer_size() const
Definition: sql_sort.h:96

Merge_chunk::max_keys
ha_rows max_keys() const
Definition: sql_sort.h:93

Merge_chunk::m_max_keys
ha_rows m_max_keys
If we have fixed-size rows: max number of rows in buffer.
Definition: sql_sort.h:140

Merge_chunk::valid_buffer_end
const uchar * valid_buffer_end() const
Definition: sql_sort.h:65

Merge_chunk::m_current_key
uchar * m_current_key
The current key for this chunk.
Definition: sql_sort.h:119

Merge_chunk::current_key
uchar * current_key() const
Definition: sql_sort.h:82

Merge_chunk::m_mem_count
ha_rows m_mem_count
Number of rows in the main-memory buffer.
Definition: sql_sort.h:137

Merge_chunk::m_buffer_end
uchar * m_buffer_end
End of main-memory buffer for this chunk.
Definition: sql_sort.h:128

Merge_chunk::buffer_start
uchar * buffer_start()
Definition: sql_sort.h:63

TABLE
Definition: table.h:1425

mc
plugin_messages_callback mc
Definition: webauthn_client_plugin.cc:55