mysql-server/8.4.0/m__ctype_8h_source.html

/* Copyright (c) 2000, 2024, Oracle and/or its affiliates.


   This program is free software; you can redistribute it and/or modify

   it under the terms of the GNU General Public License, version 2.0,

   as published by the Free Software Foundation.


   This program is designed to work with certain software (including

   but not limited to OpenSSL) that is licensed under separate terms,

   as designated in a particular file or component or in included license

   documentation.  The authors of MySQL hereby grant you an additional

   permission to link the program and your derivative works with the

   separately licensed software that they have either included with

   the program or referenced in the documentation.


   This program is distributed in the hope that it will be useful,

   but WITHOUT ANY WARRANTY; without even the implied warranty of

   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

   GNU General Public License, version 2.0, for more details.


   You should have received a copy of the GNU General Public License

   along with this program; if not, write to the Free Software

   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301  USA */


#ifndef INCLUDE_MYSQL_STRINGS_M_CTYPE_H_

#define INCLUDE_MYSQL_STRINGS_M_CTYPE_H_


/**

  @file include/mysql/strings/m_ctype.h

  A better implementation of the UNIX ctype(3) library.

*/


#include <sys/types.h>


#include <cassert>

#include <cstddef>

#include <cstdint>

#include <cstdlib>

#include <cstring>

#include <deque>


#include "mysql/attribute.h"

#include "mysql/my_loglevel.h"

#include "mysql/strings/api.h"

#include "template_utils.h"


// NOTE(review): presumably the buffer size reserved for a character set or
// collation name -- confirm against the users of this constant.
constexpr int MY_CS_NAME_SIZE{32};

// NOTE(review): looks like the (relative, slash-terminated) directory that
// holds character set definition files -- confirm.
constexpr const char *CHARSET_DIR{"charsets/"};

/* Type of MyFlags in my_funcs */
using myf = int;


/**
  Our own counterpart of wchar_t: a type that holds one Unicode code point
  (a "wide character"). unsigned long is always wide enough to represent any
  character in the BMP.
*/
using my_wc_t = unsigned long;


/**
  Store a 16-bit code into two consecutive bytes, most significant byte first.

  @param[out] s     Destination; s[0] and s[1] are written.
  @param      code  Value to store.
*/
static inline void MY_PUT_MB2(unsigned char *s, uint16_t code) {
  const auto high_byte = static_cast<unsigned char>(code >> 8);
  const auto low_byte = static_cast<unsigned char>(code & 0xFF);
  s[0] = high_byte;
  s[1] = low_byte;
}


/**
  Per-character record made of three 32-bit values.

  NOTE(review): going by the field names these are presumably the upper-case
  mapping, the lower-case mapping and a sort value for one code point --
  confirm against the tables that instantiate this struct.
*/
struct MY_UNICASE_CHARACTER {
  uint32_t toupper;
  uint32_t tolower;
  uint32_t sort;
};


/**
  Descriptor of a case-mapping table: a wide-character bound plus a pointer to
  an array of pointers to constant MY_UNICASE_CHARACTER records.

  NOTE(review): presumably `maxchar` is the largest code point covered and
  `page` is indexed by the high-order part of a code point -- confirm.
*/
struct MY_UNICASE_INFO {
  my_wc_t maxchar;
  const MY_UNICASE_CHARACTER **page;
};


struct MY_UCA_INFO;


/**
  Character-type information expressed as one byte plus a pointer to bytes.

  NOTE(review): presumably `pctype` is a type shared by a whole page of
  characters and `ctype` an optional per-character table -- confirm against
  the code that reads this struct.
*/
struct MY_UNI_CTYPE {
  uint8_t pctype;
  uint8_t *ctype;
};


/* Return codes of the mb_wc and wc_mb conversion functions */
/* clang-format off */
static constexpr int MY_CS_ILSEQ     = 0;    /* mb_wc: wrong byte sequence                   */
static constexpr int MY_CS_ILUNI     = 0;    /* wc_mb: cannot encode Unicode to charset      */
static constexpr int MY_CS_TOOSMALL  = -101; /* wc_mb and mb_wc: need at least one byte      */
static constexpr int MY_CS_TOOSMALL2 = -102; /* wc_mb and mb_wc: need at least two bytes     */
static constexpr int MY_CS_TOOSMALL3 = -103; /* wc_mb and mb_wc: need at least three bytes   */

/* The following three are currently not really used */
static constexpr int MY_CS_TOOSMALL4 = -104; /* wc_mb and mb_wc: need at least 4 bytes       */
static constexpr int MY_CS_TOOSMALL5 = -105; /* wc_mb and mb_wc: need at least 5 bytes       */
static constexpr int MY_CS_TOOSMALL6 = -106; /* wc_mb and mb_wc: need at least 6 bytes       */
/* clang-format on */


// NOTE(review): presumably the sequence kinds accepted by the `sq` argument
// of MY_CHARSET_HANDLER::scan -- confirm.
static constexpr int MY_SEQ_INTTAIL{1};
static constexpr int MY_SEQ_SPACES{2};


/* Bit flags stored in CHARSET_INFO::state */
/* clang-format off */
static constexpr uint32_t MY_CHARSET_UNDEFINED     = 0;                 // for unit testing
static constexpr uint32_t MY_CS_COMPILED           = uint32_t{1} << 0;  // compiled-in charsets
static constexpr uint32_t MY_CS_CONFIG_UNUSED      = uint32_t{1} << 1;  // unused bitmask
static constexpr uint32_t MY_CS_INDEX_UNUSED       = uint32_t{1} << 2;  // unused bitmask
static constexpr uint32_t MY_CS_LOADED             = uint32_t{1} << 3;  // charsets that are currently loaded
static constexpr uint32_t MY_CS_BINSORT            = uint32_t{1} << 4;  // binary sort order
static constexpr uint32_t MY_CS_PRIMARY            = uint32_t{1} << 5;  // primary collation
// MY_CS_STRNXFRM: when _not_ set, sort_order gives the same result as
// strnxfrm. All new collations should have this flag set; do not check it
// in new code.
static constexpr uint32_t MY_CS_STRNXFRM           = uint32_t{1} << 6;
static constexpr uint32_t MY_CS_UNICODE            = uint32_t{1} << 7;  // charset is BMP Unicode
static constexpr uint32_t MY_CS_READY              = uint32_t{1} << 8;  // charset is initialized
static constexpr uint32_t MY_CS_AVAILABLE          = uint32_t{1} << 9;  // either compiled-in or loaded
static constexpr uint32_t MY_CS_CSSORT             = uint32_t{1} << 10; // case sensitive sort order
static constexpr uint32_t MY_CS_HIDDEN             = uint32_t{1} << 11; // don't display in SHOW
static constexpr uint32_t MY_CS_PUREASCII          = uint32_t{1} << 12; // charset is pure ascii
static constexpr uint32_t MY_CS_NONASCII           = uint32_t{1} << 13; // not ASCII-compatible
static constexpr uint32_t MY_CS_UNICODE_SUPPLEMENT = uint32_t{1} << 14; // Non-BMP Unicode characters
static constexpr uint32_t MY_CS_LOWER_SORT         = uint32_t{1} << 15; // use lower case as weight
static constexpr uint32_t MY_CS_INLINE             = uint32_t{1} << 16; // CS definition is C++ source

/* Character repertoire flags */
static constexpr uint32_t MY_REPERTOIRE_ASCII     = 1; /* Pure ASCII            U+0000..U+007F */
static constexpr uint32_t MY_REPERTOIRE_EXTENDED  = 2; /* Extended characters:  U+0080..U+FFFF */
static constexpr uint32_t MY_REPERTOIRE_UNICODE30 =    /* ASCII | EXTENDED:     U+0000..U+FFFF */
    MY_REPERTOIRE_ASCII | MY_REPERTOIRE_EXTENDED;

/* Flags for strxfrm */
static constexpr uint32_t MY_STRXFRM_PAD_TO_MAXLEN = 0x00000080; /* pad the tail (for filesort) */

/* clang-format on */


/**
  One entry of an index: a 16-bit [from, to] pair plus a pointer to a constant
  byte table.

  NOTE(review): presumably `tab` holds the charset byte for each Unicode code
  point in the from..to range (CHARSET_INFO::tab_from_uni points at these) --
  confirm.
*/
struct MY_UNI_IDX {
  uint16_t from;
  uint16_t to;
  const uint8_t *tab;
};


/**
  Match descriptor filled in through the `match` argument of
  MY_COLLATION_HANDLER::strstr.

  NOTE(review): presumably `beg`/`end` are byte offsets of the match and
  `mb_len` its length in characters -- confirm against a strstr
  implementation.
*/
struct my_match_t {
  unsigned beg;
  unsigned end;
  unsigned mb_len;
};


struct CHARSET_INFO;


/**
  Carrier used to hand error information back from the collation
  parser/initializer. A default-constructed object has errcode 0 and an
  all-zero errarg buffer.
*/
struct MY_CHARSET_ERRMSG {
  static constexpr int errmsg_size = 192;
  unsigned errcode = 0;           ///< See include/mysys_err.h
  char errarg[errmsg_size] = {};  ///< Error message text
};


/**
  User-specified callback interface for collation parser/initializer.

  The class is abstract (reporter() and read_file() are pure virtual) and all
  four copy/move operations are deleted, so instances can be neither copied
  nor moved.
*/
class MY_CHARSET_LOADER {
 public:
  MY_CHARSET_LOADER() = default;
  virtual ~MY_CHARSET_LOADER();

  MY_CHARSET_LOADER(const MY_CHARSET_LOADER &) = delete;
  MY_CHARSET_LOADER(const MY_CHARSET_LOADER &&) = delete;

  MY_CHARSET_LOADER &operator=(const MY_CHARSET_LOADER &) = delete;
  MY_CHARSET_LOADER &operator=(const MY_CHARSET_LOADER &&) = delete;

  /**
    Intercepts error messages from collation parser/initializer.

    @param loglevel     ERROR_LEVEL or WARNING_LEVEL
    @param errcode      See include/mysys_err.h
  */
  virtual void reporter(enum loglevel loglevel, unsigned errcode, ...) = 0;

  /**
    Loads a file by its OS path into collation parser/initializer.

    @param path         '\0'-terminated file path to load
    @param size         Pointer to a byte count.
                        NOTE(review): this was documented as "Byte size of
                        @p path", but the parameter is a pointer, so it is
                        presumably an output receiving the size of the loaded
                        data -- confirm against the implementations.

    @returns Pointer to file data on success, otherwise nullptr.
             It is the caller's responsibility to release this pointer
             with free().
  */
  virtual void *read_file(const char *path, size_t *size) = 0;

  /**
    Collation parser helper function (not overloadable).

    @param cs   New collation object to register in the collation library

    @return MY_XML_OK on success, otherwise MY_XML_ERROR
  */
  int add_collation(CHARSET_INFO *cs);

  /**
    Allocate-and-forget version of malloc().
  */
  virtual void *once_alloc(size_t);

  /// Default allocation hook: forwards to malloc().
  virtual void *mem_malloc(size_t size) { return malloc(size); }
  /// Default deallocation hook: forwards to free().
  virtual void mem_free(void *ptr) { free(ptr); }

 private:
  // NOTE(review): presumably the blocks handed out by once_alloc(), kept so
  // the destructor can release them -- confirm in the out-of-line definitions.
  std::deque<void *> m_delete_list;
};


/**
  Exported pointer to a function that takes an int and returns an int.

  NOTE(review): by its name this is presumably a hook the string library
  calls to guard against stack exhaustion -- confirm where it is assigned
  and invoked.
*/
extern MYSQL_STRINGS_EXPORT int (*my_string_stack_guard)(int);


/**
  Padding behaviour of a collation (stored in CHARSET_INFO::pad_attribute).
  PAD_SPACE collates as if the inputs were padded with spaces at the end;
  NO_PAD compares the strings unextended.
*/
enum Pad_attribute { PAD_SPACE, NO_PAD };


/* See strings/CHARSET_INFO.txt for information about this structure  */
/**
  Table of function pointers implementing the collation-specific operations
  (comparison, sort-key generation, LIKE support, hashing). CHARSET_INFO::coll
  points at one of these.
*/
struct MY_COLLATION_HANDLER {
  /* Set-up and tear-down hooks for a collation. */
  bool (*init)(CHARSET_INFO *, MY_CHARSET_LOADER *, MY_CHARSET_ERRMSG *);
  void (*uninit)(CHARSET_INFO *, MY_CHARSET_LOADER *);
  /* Collation routines */
  /*
    Compare two (pointer, length) strings.
    NOTE(review): the trailing bool is presumably the "is_prefix" flag that
    the strnncollsp description refers to -- confirm.
  */
  int (*strnncoll)(const CHARSET_INFO *, const uint8_t *, size_t,
                   const uint8_t *, size_t, bool);
  /**
    Compare the two strings under the pad rules given by the collation.

    Thus, for NO PAD collations, this is identical to strnncoll with is_prefix
    set to false. For PAD SPACE collations, the two strings are conceptually
    extended infinitely at the end using space characters (0x20) and then
    compared under the collation's normal comparison rules, so that e.g. 'a' is
    equal to 'a '.
  */
  int (*strnncollsp)(const CHARSET_INFO *, const uint8_t *, size_t,
                     const uint8_t *, size_t);
  /**
    Transform the string into a form such that memcmp() between transformed
    strings yields the correct collation order.

    @param [out] dst Buffer for the transformed string.
    @param dstlen Number of bytes available in dst.
      Must be even.
    @param num_codepoints Treat the string as if it were of type
      CHAR(num_codepoints). In particular, this means that if the
      collation is a pad collation (pad_attribute is PAD_SPACE) and
      string has fewer than "num_codepoints" codepoints, the string
      will be transformed as if it ended in (num_codepoints-n) extra spaces.
      If the string has more than "num_codepoints" codepoints,
      behavior is undefined; may truncate, may crash, or do something
      else entirely. Note that MY_STRXFRM_PAD_TO_MAXLEN overrides this;
      if it is given for a PAD SPACE collation, this value is taken to be
      effectively infinity.
    @param src The source string, in the required character set
      for the collation.
    @param srclen Number of bytes in src.
    @param flags ORed bitmask of MY_STRXFRM_* flags.

    @return Number of bytes written to dst.
  */
  size_t (*strnxfrm)(const CHARSET_INFO *, uint8_t *dst, size_t dstlen,
                     unsigned num_codepoints, const uint8_t *src, size_t srclen,
                     unsigned flags);

  /**
    Return the maximum number of output bytes needed for strnxfrm()
    to output all weights for any string of the given input length.
    You can use this to e.g. size buffers for sort keys.

    @param num_bytes Number of bytes in the input string. Note that for
      multibyte character sets, this _must_ be a pessimistic estimate,
      i.e., one that's cs->mbmaxlen * max_num_codepoints. So for e.g.
      the utf8mb4 string "foo", you will need to give in 12, not 3.
  */
  size_t (*strnxfrmlen)(const CHARSET_INFO *, size_t num_bytes);
  /*
    NOTE(review): presumably computes the smallest and largest strings
    (min_str/max_str, with their lengths) that can match the LIKE pattern s
    -- confirm against an implementation.
  */
  bool (*like_range)(const CHARSET_INFO *, const char *s, size_t s_length,
                     char w_prefix, char w_one, char w_many, size_t res_length,
                     char *min_str, char *max_str, size_t *min_len,
                     size_t *max_len);
  /*
    Wildcard comparison of [str, str_end) against the pattern
    [wildstr, wildend), parameterised by the escape, match-one and match-many
    characters.
  */
  int (*wildcmp)(const CHARSET_INFO *, const char *str, const char *str_end,
                 const char *wildstr, const char *wildend, int escape,
                 int w_one, int w_many);

  /* NOTE(review): presumably a case-insensitive compare of two
     '\0'-terminated strings -- confirm. */
  int (*strcasecmp)(const CHARSET_INFO *, const char *, const char *);

  /* NOTE(review): presumably searches for s inside b and reports up to
     nmatch matches through `match` -- confirm. */
  unsigned (*strstr)(const CHARSET_INFO *, const char *b, size_t b_length,
                     const char *s, size_t s_length, my_match_t *match,
                     unsigned nmatch);

  /**
    Compute a sort hash for the given key. This hash must preserve equality
    under the given collation, so that a=b => H(a)=H(b). Note that this hash
    is used for hash-based partitioning (PARTITION KEY), so you cannot change
    it except when writing a new collation; it needs to be unchanged across
    releases, so that the on-disk format does not change. (It is also used
    for testing equality in the MEMORY storage engine.)

    nr1 and nr2 are both in/out parameters. nr1 is the actual hash value;
    nr2 holds extra state between invocations.
  */
  void (*hash_sort)(const CHARSET_INFO *cs, const uint8_t *key, size_t len,
                    uint64_t *nr1, uint64_t *nr2);
  /* NOTE(review): purpose not visible from this header -- document after
     checking the implementations. */
  bool (*propagate)(const CHARSET_INFO *cs, const uint8_t *str, size_t len);
};


/* Aliases giving short names to the conversion function-pointer types */

/// Signature of the multibyte -> wide character conversion (see
/// MY_CHARSET_HANDLER::mb_wc).
using my_charset_conv_mb_wc = int (*)(const CHARSET_INFO *, my_wc_t *,
                                      const uint8_t *, const uint8_t *);

/// Signature of the wide character -> multibyte conversion (see
/// MY_CHARSET_HANDLER::wc_mb).
using my_charset_conv_wc_mb = int (*)(const CHARSET_INFO *, my_wc_t, uint8_t *,
                                      uint8_t *);

/// Signature of the case conversion routines (see
/// MY_CHARSET_HANDLER::caseup / casedn).
using my_charset_conv_case = size_t (*)(const CHARSET_INFO *, char *, size_t,
                                        char *, size_t);


/* See strings/CHARSET_INFO.txt about information on this structure  */
/**
  Table of function pointers implementing the character-set-specific
  operations (multibyte handling, Unicode conversion, case conversion,
  number parsing/formatting). CHARSET_INFO::cset points at one of these.
*/
struct MY_CHARSET_HANDLER {
  bool (*init)(CHARSET_INFO *, MY_CHARSET_LOADER *loader, MY_CHARSET_ERRMSG *);
  /* Multibyte routines */
  /* May be nullptr; use_mb() tests this pointer to tell whether the charset
     is multibyte. */
  unsigned (*ismbchar)(const CHARSET_INFO *, const char *, const char *);
  unsigned (*mbcharlen)(const CHARSET_INFO *, unsigned c);
  size_t (*numchars)(const CHARSET_INFO *, const char *b, const char *e);

  /**
    Return at which byte codepoint number "pos" begins, relative to
    the start of the string. If the string is shorter than or is
    exactly "pos" codepoints long, returns a value equal to or greater than
    (e-b).
  */
  size_t (*charpos)(const CHARSET_INFO *, const char *b, const char *e,
                    size_t pos);
  size_t (*well_formed_len)(const CHARSET_INFO *, const char *b, const char *e,
                            size_t nchars, int *error);
  /**
    Given a pointer and a length in bytes, returns a new length in bytes where
    all trailing space characters are stripped. This holds even for NO PAD
    collations.

    Exception: The "binary" collation, which is used behind-the-scenes to
    implement the BINARY type (by mapping it to CHAR(n) COLLATE "binary"),
    returns just the length back with no stripping. It's done that way so that
    Field_string (implementing CHAR(n)) returns the full padded width on read
    (as opposed to a normal CHAR, where we usually strip the spaces on read),
    but it's suboptimal, since lengthsp() is also used in a number of other
    places, e.g. stripping trailing spaces from enum values given in by the
    user. If you call this function, be aware of this special exception and
    consider the implications.
  */
  size_t (*lengthsp)(const CHARSET_INFO *, const char *ptr, size_t length);
  size_t (*numcells)(const CHARSET_INFO *, const char *b, const char *e);

  /* Unicode conversion */
  my_charset_conv_mb_wc mb_wc;
  my_charset_conv_wc_mb wc_mb;

  /* CTYPE scanner */
  int (*ctype)(const CHARSET_INFO *cs, int *ctype, const uint8_t *s,
               const uint8_t *e);

  /* Functions for case and sort conversion */
  size_t (*caseup_str)(const CHARSET_INFO *, char *);
  size_t (*casedn_str)(const CHARSET_INFO *, char *);

  my_charset_conv_case caseup;
  my_charset_conv_case casedn;

  /* Charset dependent snprintf() */
  size_t (*snprintf)(const CHARSET_INFO *, char *to, size_t n, const char *fmt,
                     ...) MY_ATTRIBUTE((format(printf, 4, 5)));

  /* Number-to-string conversion routines */
  size_t (*long10_to_str)(const CHARSET_INFO *, char *to, size_t n, int radix,
                          long int val);
  size_t (*longlong10_to_str)(const CHARSET_INFO *, char *to, size_t n,
                              int radix, long long val);

  void (*fill)(const CHARSET_INFO *, char *to, size_t len, int fill);

  /* String-to-number conversion routines */
  long (*strntol)(const CHARSET_INFO *, const char *s, size_t l, int base,
                  const char **e, int *err);
  unsigned long (*strntoul)(const CHARSET_INFO *, const char *s, size_t l,
                            int base, const char **e, int *err);
  long long (*strntoll)(const CHARSET_INFO *, const char *s, size_t l, int base,
                        const char **e, int *err);
  unsigned long long (*strntoull)(const CHARSET_INFO *, const char *s, size_t l,
                                  int base, const char **e, int *err);
  double (*strntod)(const CHARSET_INFO *, const char *s, size_t l,
                    const char **e, int *err);
  long long (*strtoll10)(const CHARSET_INFO *cs, const char *nptr,
                         const char **endptr, int *error);
  unsigned long long (*strntoull10rnd)(const CHARSET_INFO *cs, const char *str,
                                       size_t length, int unsigned_fl,
                                       const char **endptr, int *error);
  /* NOTE(review): `sq` is presumably one of the MY_SEQ_* constants --
     confirm. */
  size_t (*scan)(const CHARSET_INFO *, const char *b, const char *e, int sq);
};


/* See strings/CHARSET_INFO.txt about information on this structure  */
/**
  Description of one collation together with its character set: identifying
  numbers and names, lookup tables, size properties, and the two handler
  tables (cset, coll) that implement its operations.
*/
struct CHARSET_INFO {
  unsigned number;
  unsigned primary_number;
  unsigned binary_number;
  unsigned state; /* bitmask of the "CHARSET_INFO::state flags" (MY_CS_*) */
  const char *csname; /* character set name; compared by my_charset_same() */
  const char *m_coll_name;
  const char *comment;
  const char *tailoring;
  struct Coll_param *coll_param;
  /* Character class table; the my_is*() helpers read entry
     [1 + unsigned byte value] and test it against the MY_CHAR_* bits. */
  const uint8_t *ctype;
  const uint8_t *to_lower; /* byte -> byte table used by my_tolower() */
  const uint8_t *to_upper; /* byte -> byte table used by my_toupper() */
  const uint8_t *sort_order;
  struct MY_UCA_INFO *uca; /* This can be changed in apply_one_rule() */
  const uint16_t *tab_to_uni;
  const MY_UNI_IDX *tab_from_uni;
  const MY_UNICASE_INFO *caseinfo;
  const struct lex_state_maps_st *state_maps; /* parser internal data */
  const uint8_t *ident_map;                   /* parser internal data */
  unsigned strxfrm_multiply;
  uint8_t caseup_multiply;
  uint8_t casedn_multiply;
  unsigned mbminlen; /* is_supported_parser_charset() requires this to be 1 */
  unsigned mbmaxlen;
  /* Number of leading bytes needed to determine the length of a multi-byte
     character: 2 for gb18030 and 1 for all other charsets (see
     my_mbmaxlenlen()). */
  unsigned mbmaxlenlen;
  my_wc_t min_sort_char;
  my_wc_t max_sort_char; /* For LIKE optimization */
  uint8_t pad_char;
  bool escape_with_backslash_is_dangerous;
  uint8_t levels_for_compare;

  MY_CHARSET_HANDLER *cset;   /* character-set level operations */
  MY_COLLATION_HANDLER *coll; /* collation level operations */

  /**
    If this collation is PAD_SPACE, it collates as if all inputs were
    padded with a given number of spaces at the end (see the "num_codepoints"
    argument of strnxfrm). NO_PAD simply compares unextended strings.

    Note that this is fundamentally about the behavior of coll->strnxfrm.
  */
  enum Pad_attribute pad_attribute;
};


/*
  NOTE: A CHARSET_INFO cannot be used before it has been initialized.
  In particular, these globals are not initialized when a unit test starts;
  do not use them indiscriminately from there, and do not add more. Instead,
  obtain initialized collations through my_collation_get_by_name().
*/

extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_bin;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_latin1;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_filename;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_0900_ai_ci;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_0900_bin;

extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_latin1_bin;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf32_unicode_ci;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_general_ci;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_tolower_ci;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_unicode_ci;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_bin;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_bin;
extern MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_general_ci;


/**
  Wildcard comparison taking the same arguments as
  MY_COLLATION_HANDLER::wildcmp.

  @note Deprecated function, please call cs->coll->wildcmp(cs...) instead.
*/
MYSQL_STRINGS_EXPORT int my_wildcmp_mb_bin(const CHARSET_INFO *cs,
                                           const char *str, const char *str_end,
                                           const char *wildstr,
                                           const char *wildend, int escape,
                                           int w_one, int w_many);


/*
  NOTE(review): by analogy with strcspn(3) this presumably returns the length
  of the initial part of [str, end) that contains none of the reject_length
  characters in `reject`, interpreted in charset cs -- confirm against the
  implementation.
*/
MYSQL_STRINGS_EXPORT extern size_t my_strcspn(const CHARSET_INFO *cs,
                                              const char *str, const char *end,
                                              const char *reject,
                                              size_t reject_length);


/*
  NOTE(review): presumably returns the MY_REPERTOIRE_* value describing the
  len bytes at str -- confirm against the implementation.
*/
MYSQL_STRINGS_EXPORT unsigned my_string_repertoire(const CHARSET_INFO *cs,
                                                   const char *str, size_t len);


MYSQL_STRINGS_EXPORT bool my_charset_is_ascii_based(const CHARSET_INFO *cs);

/**
  Detect whether a character set is ASCII compatible, i.e. whether the
  MY_CS_NONASCII bit is clear in its state flags.

  @param cs  Character set to inspect.
  @return    true when MY_CS_NONASCII is not set in cs->state.
*/
inline bool my_charset_is_ascii_based(const CHARSET_INFO *cs) {
  const bool non_ascii = (cs->state & MY_CS_NONASCII) != 0;
  return !non_ascii;
}


/**
  Tell whether two collations belong to the same character set.

  Two objects match when they are the very same object or when their csname
  strings compare equal. In debug builds it is asserted that neither csname
  is the bare name "utf8".

  @param cs1  First collation.
  @param cs2  Second collation.
  @return     true when both refer to the same character set.
*/
inline bool my_charset_same(const CHARSET_INFO *cs1, const CHARSET_INFO *cs2) {
  assert(strcmp(cs1->csname, "utf8") != 0);
  assert(strcmp(cs2->csname, "utf8") != 0);
  if (cs1 == cs2) return true;
  return strcmp(cs1->csname, cs2->csname) == 0;
}


/* NOTE(review): presumably returns the MY_REPERTOIRE_* value of the whole
   character set cs -- confirm against the implementation. */
MYSQL_STRINGS_EXPORT unsigned my_charset_repertoire(const CHARSET_INFO *cs);


/* NOTE(review): presumably maps a MY_STRXFRM_* flag mask to a canonical
   form -- confirm against the implementation. */
MYSQL_STRINGS_EXPORT unsigned my_strxfrm_flag_normalize(unsigned flags);


/*
  NOTE(review): presumably converts from_length bytes at `from` (charset
  from_cs) into the buffer `to` of to_length bytes (charset to_cs), returning
  the number of bytes produced and counting failures in *errors -- confirm
  against the implementation.
*/
MYSQL_STRINGS_EXPORT size_t my_convert(char *to, size_t to_length,
                                       const CHARSET_INFO *to_cs,
                                       const char *from, size_t from_length,
                                       const CHARSET_INFO *from_cs,
                                       unsigned *errors);


/*
  NOTE(review): presumably the pointer-range counterpart of my_mbcharlen():
  the byte length of the character starting at s within [s, e) -- confirm
  against the implementation.
*/
MYSQL_STRINGS_EXPORT unsigned my_mbcharlen_ptr(const CHARSET_INFO *cs,
                                               const char *s, const char *e);


/*
  NOTE(review): presumably decides whether the LIKE pattern
  [wildstr, wildend) can be served by a prefix index and stores the usable
  prefix length in *prefix_len -- confirm against the implementation.
*/
MYSQL_STRINGS_EXPORT bool my_is_prefixidx_cand(const CHARSET_INFO *cs,
                                               const char *wildstr,
                                               const char *wildend, int escape,
                                               int w_many, size_t *prefix_len);


/* Character class bits tested by the my_is*() helpers. */
/* clang-format off */
static constexpr uint8_t MY_CHAR_U   = 0x01; /* Upper case */
static constexpr uint8_t MY_CHAR_L   = 0x02; /* Lower case */
static constexpr uint8_t MY_CHAR_NMR = 0x04; /* Numeral (digit) */
static constexpr uint8_t MY_CHAR_SPC = 0x08; /* Spacing character */
static constexpr uint8_t MY_CHAR_PNT = 0x10; /* Punctuation */
static constexpr uint8_t MY_CHAR_CTR = 0x20; /* Control character */
static constexpr uint8_t MY_CHAR_B   = 0x40; /* Blank */
static constexpr uint8_t MY_CHAR_X   = 0x80; /* heXadecimal digit */
/* clang-format on */


/* The following functions make sense only for one-byte character sets.
They will not fail for multibyte character sets, but will not produce
the expected results. They are of limited use there: e.g. for
utf8mb3/utf8mb4, meaningful results are produced only for values in the
7-bit ASCII range (<= 0x7F). */


/** True when @p ch has none of the bits above the low seven set. */
inline bool my_isascii(char ch) {
  return static_cast<unsigned char>(ch) <= 0x7F;
}


/**
  Look up @p ch in the charset's to_upper table.

  @param cs  Character set whose to_upper table is consulted.
  @param ch  Character to map; its unsigned 8-bit value is the table index.
  @return    The table entry, converted back to char.
*/
inline char my_toupper(const CHARSET_INFO *cs, char ch) {
  const auto index = static_cast<uint8_t>(ch);
  const uint8_t mapped = cs->to_upper[index];
  return static_cast<char>(mapped);
}


/**
  Look up @p ch in the charset's to_lower table.

  @param cs  Character set whose to_lower table is consulted.
  @param ch  Character to map; its unsigned 8-bit value is the table index.
  @return    The table entry, converted back to char.
*/
inline char my_tolower(const CHARSET_INFO *cs, char ch) {
  const auto index = static_cast<uint8_t>(ch);
  const uint8_t mapped = cs->to_lower[index];
  return static_cast<char>(mapped);
}


/**
  True when the ctype entry for @p ch has MY_CHAR_U or MY_CHAR_L set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_isalpha(const CHARSET_INFO *cs, char ch) {
  const int letter_mask = MY_CHAR_U | MY_CHAR_L;
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & letter_mask) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_U set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_isupper(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_U) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_L set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_islower(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_L) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_NMR set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_isdigit(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_NMR) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_X set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_isxdigit(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_X) != 0;
}


/**
  True when the ctype entry for @p ch has any of MY_CHAR_U, MY_CHAR_L or
  MY_CHAR_NMR set. The ctype table is read at offset 1 + the unsigned byte
  value.
*/
inline bool my_isalnum(const CHARSET_INFO *cs, char ch) {
  const int alnum_mask = MY_CHAR_U | MY_CHAR_L | MY_CHAR_NMR;
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & alnum_mask) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_SPC set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_isspace(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_SPC) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_PNT set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_ispunct(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_PNT) != 0;
}


/**
  True when the ctype entry for @p ch has any of MY_CHAR_PNT, MY_CHAR_U,
  MY_CHAR_L or MY_CHAR_NMR set. The ctype table is read at offset
  1 + the unsigned byte value.
*/
inline bool my_isgraph(const CHARSET_INFO *cs, char ch) {
  const int graph_mask = MY_CHAR_PNT | MY_CHAR_U | MY_CHAR_L | MY_CHAR_NMR;
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & graph_mask) != 0;
}


/**
  True when the ctype entry for @p ch has MY_CHAR_CTR set.
  The ctype table is read at offset 1 + the unsigned byte value.
*/
inline bool my_iscntrl(const CHARSET_INFO *cs, char ch) {
  const uint8_t char_class = cs->ctype[static_cast<uint8_t>(ch) + 1];
  return (char_class & MY_CHAR_CTR) != 0;
}


/** True when @p ch is alphanumeric in @p cs (my_isalnum) or is '_'. */
inline bool my_isvar(const CHARSET_INFO *cs, char ch) {
  if (my_isalnum(cs, ch)) return true;
  return ch == '_';
}


/** True when @p ch is alphabetic in @p cs (my_isalpha) or is '_'. */
inline bool my_isvar_start(const CHARSET_INFO *cs, char ch) {
  if (my_isalpha(cs, ch)) return true;
  return ch == '_';
}


// Properties of character sets.

/** True when MY_CS_BINSORT is set in the state flags of @p cs. */
inline bool my_binary_compare(const CHARSET_INFO *cs) {
  const unsigned binsort_bit = cs->state & MY_CS_BINSORT;
  return binsort_bit != 0;
}


/** True when MY_CS_STRNXFRM is set in the state flags of @p cs. */
inline bool use_strnxfrm(const CHARSET_INFO *cs) {
  const unsigned strnxfrm_bit = cs->state & MY_CS_STRNXFRM;
  return strnxfrm_bit != 0;
}


// Interfaces to member functions.

/**
  Convenience wrapper around cs->coll->strnxfrm.

  The destination length is also passed as the num_codepoints argument
  (converted to unsigned), and no MY_STRXFRM_* flags are given.

  @param      cs      Collation to use.
  @param[out] dst     Buffer receiving the transformed string.
  @param      dstlen  Number of bytes available in dst.
  @param      src     Source string.
  @param      srclen  Number of bytes in src.
  @return     Whatever cs->coll->strnxfrm returns (bytes written to dst).
*/
inline size_t my_strnxfrm(const CHARSET_INFO *cs, uint8_t *dst, size_t dstlen,
                          const uint8_t *src, size_t srclen) {
  const auto num_codepoints = static_cast<unsigned>(dstlen);
  const unsigned no_flags = 0;
  return cs->coll->strnxfrm(cs, dst, dstlen, num_codepoints, src, srclen,
                            no_flags);
}


/**
  Convenience wrapper around cs->coll->strnncoll that always passes false as
  the trailing bool argument.
*/
inline int my_strnncoll(const CHARSET_INFO *cs, const uint8_t *a,
                        size_t a_length, const uint8_t *b, size_t b_length) {
  const auto *collation = cs->coll;
  const bool last_arg = false;
  return collation->strnncoll(cs, a, a_length, b, b_length, last_arg);
}


/** Forwards all arguments unchanged to cs->coll->like_range. */
inline bool my_like_range(const CHARSET_INFO *cs, const char *s,
                          size_t s_length, char w_prefix, char w_one,
                          char w_many, size_t res_length, char *min_str,
                          char *max_str, size_t *min_len, size_t *max_len) {
  const auto *collation = cs->coll;
  return collation->like_range(cs, s, s_length, w_prefix, w_one, w_many,
                               res_length, min_str, max_str, min_len, max_len);
}


/** Forwards all arguments unchanged to cs->coll->wildcmp. */
inline int my_wildcmp(const CHARSET_INFO *cs, const char *str,
                      const char *str_end, const char *wildstr,
                      const char *wildend, int escape, int w_one, int w_many) {
  const auto *collation = cs->coll;
  return collation->wildcmp(cs, str, str_end, wildstr, wildend, escape, w_one,
                            w_many);
}


/** Forwards to cs->coll->strcasecmp with the two strings unchanged. */
inline int my_strcasecmp(const CHARSET_INFO *cs, const char *s1,
                         const char *s2) {
  const auto *collation = cs->coll;
  return collation->strcasecmp(cs, s1, s2);
}


/**
  Forwards to cs->cset->charpos: the byte offset at which codepoint number
  @p pos begins within [beg, end).
*/
inline size_t my_charpos(const CHARSET_INFO *cs, const char *beg,
                         const char *end, size_t pos) {
  const auto *charset = cs->cset;
  return charset->charpos(cs, beg, end, pos);
}


/**
  Overload of my_charpos for unsigned char ranges: the pointers are
  reinterpreted as const char * and passed to cs->cset->charpos.
*/
inline size_t my_charpos(const CHARSET_INFO *cs, const unsigned char *beg,
                         const unsigned char *end, size_t pos) {
  const char *first = pointer_cast<const char *>(beg);
  const char *last = pointer_cast<const char *>(end);
  return cs->cset->charpos(cs, first, last, pos);
}


/** True when the charset handler of @p cs provides an ismbchar function. */
inline bool use_mb(const CHARSET_INFO *cs) {
  const auto *charset = cs->cset;
  return charset->ismbchar != nullptr;
}


/**
  Forwards to cs->cset->ismbchar for the range [str, strend).
  The function pointer is not checked for nullptr here; see use_mb().
*/
inline unsigned my_ismbchar(const CHARSET_INFO *cs, const char *str,
                            const char *strend) {
  const auto *charset = cs->cset;
  return charset->ismbchar(cs, str, strend);
}


/**
  Overload of my_ismbchar for uint8_t ranges: the pointers are reinterpreted
  as const char * and passed to cs->cset->ismbchar.
  The function pointer is not checked for nullptr here; see use_mb().
*/
inline unsigned my_ismbchar(const CHARSET_INFO *cs, const uint8_t *str,
                            const uint8_t *strend) {
  const char *first = pointer_cast<const char *>(str);
  const char *last = pointer_cast<const char *>(strend);
  return cs->cset->ismbchar(cs, first, last);
}


/** Forwards @p first_byte to cs->cset->mbcharlen and returns its result. */
inline unsigned my_mbcharlen(const CHARSET_INFO *cs, unsigned first_byte) {
  const auto *charset = cs->cset;
  return charset->mbcharlen(cs, first_byte);
}


/**
  Get the length of a gb18030 code from its two leading bytes.

  The two bytes are combined into one value (first byte in bits 8..15,
  second byte in bits 0..7) and handed to cs->cset->mbcharlen.

  @param[in] cs charset_info
  @param[in] first_byte first byte of gb18030 code
  @param[in] second_byte second byte of gb18030 code
  @return    the length of gb18030 code starting with given two bytes,
             the length would be 2 or 4 for valid gb18030 code,
             or 0 for invalid gb18030 code
*/
inline unsigned my_mbcharlen_2(const CHARSET_INFO *cs, uint8_t first_byte,
                               uint8_t second_byte) {
  const unsigned high = static_cast<unsigned>(first_byte) << 8;
  const unsigned low = second_byte;
  return cs->cset->mbcharlen(cs, high | low);
}


/**
  Get the maximum number of leading bytes needed to determine the length of a
  multi-byte gb18030 code. Simply reads cs->mbmaxlenlen.

  @param[in] cs charset_info
  @return    number of leading bytes we need, would be 2 for gb18030
             and 1 for all other charsets
*/
inline unsigned my_mbmaxlenlen(const CHARSET_INFO *cs) {
  const unsigned leading_bytes = cs->mbmaxlenlen;
  return leading_bytes;
}


/**
  Judge if the given byte is a possible leading byte for a charset.
  For gb18030, whose mbmaxlenlen is 2, the length of a multi-byte character
  cannot be determined by looking at the first byte only; there a reported
  length of 0 also counts as a possible leading byte.

  @param[in] cs charset_info
  @param[in] leading_byte possible leading byte
  @return    true if it is, otherwise false
*/
inline bool my_ismb1st(const CHARSET_INFO *cs, unsigned leading_byte) {
  if (my_mbcharlen(cs, leading_byte) > 1) return true;
  if (my_mbmaxlenlen(cs) != 2) return false;
  return my_mbcharlen(cs, leading_byte) == 0;
}


/** Forwards @p str to cs->cset->caseup_str and returns its result. */
inline size_t my_caseup_str(const CHARSET_INFO *cs, char *str) {
  const auto *charset = cs->cset;
  return charset->caseup_str(cs, str);
}


/** Forwards @p str to cs->cset->casedn_str and returns its result. */
inline size_t my_casedn_str(const CHARSET_INFO *cs, char *str) {
  const auto *charset = cs->cset;
  return charset->casedn_str(cs, str);
}


/** Forwards all arguments unchanged to cs->cset->strntol. */
inline long my_strntol(const CHARSET_INFO *cs, const char *str, size_t length,
                       int base, const char **end, int *err) {
  const auto *charset = cs->cset;
  return charset->strntol(cs, str, length, base, end, err);
}


/** Forwards all arguments unchanged to cs->cset->strntoul. */
inline unsigned long my_strntoul(const CHARSET_INFO *cs, const char *str,
                                 size_t length, int base, const char **end,
                                 int *err) {
  const auto *charset = cs->cset;
  return charset->strntoul(cs, str, length, base, end, err);
}


/**
  Forwards all arguments unchanged to cs->cset->strntoll; the long long
  result is returned as int64_t.
*/
inline int64_t my_strntoll(const CHARSET_INFO *cs, const char *str,
                           size_t length, int base, const char **end,
                           int *err) {
  const long long parsed = cs->cset->strntoll(cs, str, length, base, end, err);
  return parsed;
}


/**
  Forwards all arguments unchanged to cs->cset->strntoull; the unsigned long
  long result is returned as uint64_t.
*/
inline uint64_t my_strntoull(const CHARSET_INFO *cs, const char *str,
                             size_t length, int base, const char **end,
                             int *err) {
  const unsigned long long parsed =
      cs->cset->strntoull(cs, str, length, base, end, err);
  return parsed;
}


/** Forwards all arguments unchanged to cs->cset->strntod. */
inline double my_strntod(const CHARSET_INFO *cs, const char *str, size_t length,
                         const char **end, int *err) {
  const auto *charset = cs->cset;
  return charset->strntod(cs, str, length, end, err);
}


/** True when the minimum character length (mbminlen) of @p cs is exactly 1. */
inline bool is_supported_parser_charset(const CHARSET_INFO *cs) {
  const unsigned min_char_bytes = cs->mbminlen;
  return min_char_bytes == 1;
}


#endif  // INCLUDE_MYSQL_STRINGS_M_CTYPE_H_

api.h

MYSQL_STRINGS_EXPORT
#define MYSQL_STRINGS_EXPORT
Definition: api.h:47

loader
static Mysys_charset_loader * loader
Definition: charset.cc:185

MY_CHARSET_LOADER
User-specified callback interface for collation parser/initializer.
Definition: m_ctype.h:190

MY_CHARSET_LOADER::~MY_CHARSET_LOADER
virtual ~MY_CHARSET_LOADER()
Definition: ctype.cc:1158

MY_CHARSET_LOADER::mem_malloc
virtual void * mem_malloc(size_t size)
Definition: m_ctype.h:235

MY_CHARSET_LOADER::MY_CHARSET_LOADER
MY_CHARSET_LOADER()=default

MY_CHARSET_LOADER::once_alloc
virtual void * once_alloc(size_t)
Allocate-and-forget version of malloc().
Definition: ctype.cc:1286

MY_CHARSET_LOADER::operator=
MY_CHARSET_LOADER & operator=(const MY_CHARSET_LOADER &&)=delete

MY_CHARSET_LOADER::MY_CHARSET_LOADER
MY_CHARSET_LOADER(const MY_CHARSET_LOADER &)=delete

MY_CHARSET_LOADER::mem_free
virtual void mem_free(void *ptr)
Definition: m_ctype.h:236

MY_CHARSET_LOADER::m_delete_list
std::deque< void * > m_delete_list
Definition: m_ctype.h:239

MY_CHARSET_LOADER::add_collation
int add_collation(CHARSET_INFO *cs)
Collation parser helper function (not overloadable).
Definition: ctype.cc:1164

MY_CHARSET_LOADER::MY_CHARSET_LOADER
MY_CHARSET_LOADER(const MY_CHARSET_LOADER &&)=delete

MY_CHARSET_LOADER::read_file
virtual void * read_file(const char *path, size_t *size)=0
Loads a file by its OS path into collation parser/initializer.

MY_CHARSET_LOADER::operator=
MY_CHARSET_LOADER & operator=(const MY_CHARSET_LOADER &)=delete

MY_CHARSET_LOADER::reporter
virtual void reporter(enum loglevel loglevel, unsigned errcode,...)=0
Intercepts error messages from collation parser/initializer.

flags
static int flags[50]
Definition: hp_test1.cc:40

attribute.h

malloc
#define malloc(A)
Definition: lexyy.cc:914

free
#define free(A)
Definition: lexyy.cc:915

MY_CS_TOOSMALL4
static constexpr int MY_CS_TOOSMALL4
Definition: m_ctype.h:97

MY_SEQ_SPACES
static constexpr int MY_SEQ_SPACES
Definition: m_ctype.h:105

MY_CS_PUREASCII
static constexpr uint32_t MY_CS_PUREASCII
Definition: m_ctype.h:140

MY_CHAR_CTR
static constexpr uint8_t MY_CHAR_CTR
Definition: m_ctype.h:546

MY_PUT_MB2
static void MY_PUT_MB2(unsigned char *s, uint16_t code)
Definition: m_ctype.h:59

MY_CS_TOOSMALL
static constexpr int MY_CS_TOOSMALL
Definition: m_ctype.h:89

MY_CHAR_L
static constexpr uint8_t MY_CHAR_L
Definition: m_ctype.h:542

myf
int myf
Definition: m_ctype.h:50

my_tolower
char my_tolower(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:563

MY_CHAR_NMR
static constexpr uint8_t MY_CHAR_NMR
Definition: m_ctype.h:543

my_strcasecmp
int my_strcasecmp(const CHARSET_INFO *cs, const char *s1, const char *s2)
Definition: m_ctype.h:653

my_like_range
bool my_like_range(const CHARSET_INFO *cs, const char *s, size_t s_length, char w_prefix, char w_one, char w_many, size_t res_length, char *min_str, char *max_str, size_t *min_len, size_t *max_len)
Definition: m_ctype.h:638

MY_REPERTOIRE_UNICODE30
static constexpr uint32_t MY_REPERTOIRE_UNICODE30
Definition: m_ctype.h:156

MY_CS_READY
static constexpr uint32_t MY_CS_READY
Definition: m_ctype.h:132

MY_CS_INLINE
static constexpr uint32_t MY_CS_INLINE
Definition: m_ctype.h:148

MY_CHAR_PNT
static constexpr uint8_t MY_CHAR_PNT
Definition: m_ctype.h:545

my_charset_bin
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_bin
Definition: ctype-bin.cc:509

MY_CS_NONASCII
static constexpr uint32_t MY_CS_NONASCII
Definition: m_ctype.h:142

my_charset_conv_wc_mb
int(* my_charset_conv_wc_mb)(const CHARSET_INFO *, my_wc_t, uint8_t *, uint8_t *)
Definition: m_ctype.h:336

MY_CS_STRNXFRM
static constexpr uint32_t MY_CS_STRNXFRM
Definition: m_ctype.h:124

my_isvar_start
bool my_isvar_start(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:614

MY_CS_NAME_SIZE
constexpr int MY_CS_NAME_SIZE
Definition: m_ctype.h:46

my_charset_utf8mb3_tolower_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_tolower_ci
Definition: ctype-utf8.cc:5830

my_charset_utf8mb4_bin
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_bin
Definition: ctype-utf8.cc:7823

MY_CS_BINSORT
static constexpr uint32_t MY_CS_BINSORT
Definition: m_ctype.h:120

my_isxdigit
bool my_isxdigit(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:584

my_charset_latin1_bin
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_latin1_bin
Definition: ctype-latin1.cc:671

MY_CS_ILUNI
static constexpr int MY_CS_ILUNI
Definition: m_ctype.h:87

my_charset_utf8mb4_0900_ai_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_0900_ai_ci
Definition: ctype-uca.cc:9611

MY_STRXFRM_PAD_TO_MAXLEN
static constexpr uint32_t MY_STRXFRM_PAD_TO_MAXLEN
Definition: m_ctype.h:160

my_isupper
bool my_isupper(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:572

my_strntoll
int64_t my_strntoll(const CHARSET_INFO *cs, const char *str, size_t length, int base, const char **end, int *err)
Definition: m_ctype.h:749

my_charset_utf8mb3_unicode_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_unicode_ci
Definition: ctype-uca.cc:6132

my_charpos
size_t my_charpos(const CHARSET_INFO *cs, const char *beg, const char *end, size_t pos)
Definition: m_ctype.h:658

my_convert
MYSQL_STRINGS_EXPORT size_t my_convert(char *to, size_t to_length, const CHARSET_INFO *to_cs, const char *from, size_t from_length, const CHARSET_INFO *from_cs, unsigned *errors)
Convert a string between two character sets.
Definition: ctype.cc:912

my_strntoull
uint64_t my_strntoull(const CHARSET_INFO *cs, const char *str, size_t length, int base, const char **end, int *err)
Definition: m_ctype.h:755

my_isalnum
bool my_isalnum(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:588

MY_CS_LOWER_SORT
static constexpr uint32_t MY_CS_LOWER_SORT
Definition: m_ctype.h:146

my_wildcmp
int my_wildcmp(const CHARSET_INFO *cs, const char *str, const char *str_end, const char *wildstr, const char *wildend, int escape, int w_one, int w_many)
Definition: m_ctype.h:646

my_casedn_str
size_t my_casedn_str(const CHARSET_INFO *cs, char *str)
Definition: m_ctype.h:734

MY_CHAR_SPC
static constexpr uint8_t MY_CHAR_SPC
Definition: m_ctype.h:544

my_is_prefixidx_cand
MYSQL_STRINGS_EXPORT bool my_is_prefixidx_cand(const CHARSET_INFO *cs, const char *wildstr, const char *wildend, int escape, int w_many, size_t *prefix_len)
Identify whether the given LIKE pattern looks like a prefix pattern, which can become a candidate for index...
Definition: ctype.cc:999

my_ispunct
bool my_ispunct(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:597

MY_CS_UNICODE_SUPPLEMENT
static constexpr uint32_t MY_CS_UNICODE_SUPPLEMENT
Definition: m_ctype.h:144

my_isvar
bool my_isvar(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:610

my_strntoul
unsigned long my_strntoul(const CHARSET_INFO *cs, const char *str, size_t length, int base, const char **end, int *err)
Definition: m_ctype.h:743

my_isdigit
bool my_isdigit(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:580

MY_CS_TOOSMALL3
static constexpr int MY_CS_TOOSMALL3
Definition: m_ctype.h:93

my_mbcharlen_2
unsigned my_mbcharlen_2(const CHARSET_INFO *cs, uint8_t first_byte, uint8_t second_byte)
Get the length of gb18030 code by the given two leading bytes.
Definition: m_ctype.h:698

my_charset_conv_case
size_t(* my_charset_conv_case)(const CHARSET_INFO *, char *, size_t, char *, size_t)
Definition: m_ctype.h:338

my_string_repertoire
MYSQL_STRINGS_EXPORT unsigned my_string_repertoire(const CHARSET_INFO *cs, const char *str, size_t len)
Definition: ctype.cc:778

my_charset_conv_mb_wc
int(* my_charset_conv_mb_wc)(const CHARSET_INFO *, my_wc_t *, const uint8_t *, const uint8_t *)
Definition: m_ctype.h:334

MY_CS_AVAILABLE
static constexpr uint32_t MY_CS_AVAILABLE
Definition: m_ctype.h:134

my_isspace
bool my_isspace(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:593

my_strntod
double my_strntod(const CHARSET_INFO *cs, const char *str, size_t length, const char **end, int *err)
Definition: m_ctype.h:761

use_strnxfrm
bool use_strnxfrm(const CHARSET_INFO *cs)
Definition: m_ctype.h:623

MY_REPERTOIRE_EXTENDED
static constexpr uint32_t MY_REPERTOIRE_EXTENDED
Definition: m_ctype.h:154

my_wc_t
unsigned long my_wc_t
Our own version of wchar_t, i.e., a type that holds a single Unicode code point ("wide character").
Definition: m_ctype.h:57

MY_SEQ_INTTAIL
static constexpr int MY_SEQ_INTTAIL
Definition: m_ctype.h:104

my_iscntrl
bool my_iscntrl(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:606

my_charset_latin1
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_latin1
Definition: ctype-latin1.cc:366

my_mbcharlen
unsigned my_mbcharlen(const CHARSET_INFO *cs, unsigned first_byte)
Definition: m_ctype.h:684

MY_CHARSET_UNDEFINED
static constexpr uint32_t MY_CHARSET_UNDEFINED
Definition: m_ctype.h:110

MY_CS_TOOSMALL5
static constexpr int MY_CS_TOOSMALL5
Definition: m_ctype.h:99

MY_CS_UNICODE
static constexpr uint32_t MY_CS_UNICODE
Definition: m_ctype.h:130

my_ismbchar
unsigned my_ismbchar(const CHARSET_INFO *cs, const char *str, const char *strend)
Definition: m_ctype.h:673

my_isascii
bool my_isascii(char ch)
Definition: m_ctype.h:557

my_charset_utf8mb4_general_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_general_ci
Definition: ctype-utf8.cc:7787

MY_CS_HIDDEN
static constexpr uint32_t MY_CS_HIDDEN
Definition: m_ctype.h:138

my_strcspn
MYSQL_STRINGS_EXPORT size_t my_strcspn(const CHARSET_INFO *cs, const char *str, const char *end, const char *reject, size_t reject_length)
Calculate the length of the initial segment of 'str' which consists entirely of characters not in 'reject'.
Definition: my_strchr.cc:64

my_mbcharlen_ptr
MYSQL_STRINGS_EXPORT unsigned my_mbcharlen_ptr(const CHARSET_INFO *cs, const char *s, const char *e)
Get the length of the first code in given sequence of chars.
Definition: ctype.cc:971

my_ismb1st
bool my_ismb1st(const CHARSET_INFO *cs, unsigned leading_byte)
Judge if the given byte is a possible leading byte for a charset.
Definition: m_ctype.h:725

MY_CS_ILSEQ
static constexpr int MY_CS_ILSEQ
Definition: m_ctype.h:85

my_charset_utf8mb4_0900_bin
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb4_0900_bin
Definition: ctype-uca.cc:11482

my_charset_same
bool my_charset_same(const CHARSET_INFO *cs1, const CHARSET_INFO *cs2)
Definition: m_ctype.h:516

my_strnxfrm
size_t my_strnxfrm(const CHARSET_INFO *cs, uint8_t *dst, size_t dstlen, const uint8_t *src, size_t srclen)
Definition: m_ctype.h:628

my_string_stack_guard
MYSQL_STRINGS_EXPORT int(* my_string_stack_guard)(int)
Definition: collations_internal.cc:43

MY_CS_CONFIG_UNUSED
static constexpr uint32_t MY_CS_CONFIG_UNUSED
Definition: m_ctype.h:114

my_strntol
long my_strntol(const CHARSET_INFO *cs, const char *str, size_t length, int base, const char **end, int *err)
Definition: m_ctype.h:738

MY_CS_LOADED
static constexpr uint32_t MY_CS_LOADED
Definition: m_ctype.h:118

MY_CS_INDEX_UNUSED
static constexpr uint32_t MY_CS_INDEX_UNUSED
Definition: m_ctype.h:116

my_charset_utf8mb3_bin
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_bin
Definition: ctype-utf8.cc:5900

CHARSET_DIR
constexpr const char * CHARSET_DIR
Definition: m_ctype.h:48

use_mb
bool use_mb(const CHARSET_INFO *cs)
Definition: m_ctype.h:669

my_charset_repertoire
MYSQL_STRINGS_EXPORT unsigned my_charset_repertoire(const CHARSET_INFO *cs)
Definition: ctype.cc:800

my_mbmaxlenlen
unsigned my_mbmaxlenlen(const CHARSET_INFO *cs)
Get the maximum length of leading bytes needed to determine the length of a multi-byte gb18030 code.
Definition: m_ctype.h:712

my_isalpha
bool my_isalpha(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:567

my_caseup_str
size_t my_caseup_str(const CHARSET_INFO *cs, char *str)
Definition: m_ctype.h:730

MY_REPERTOIRE_ASCII
static constexpr uint32_t MY_REPERTOIRE_ASCII
Definition: m_ctype.h:152

is_supported_parser_charset
bool is_supported_parser_charset(const CHARSET_INFO *cs)
Definition: m_ctype.h:766

my_charset_utf8mb3_general_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf8mb3_general_ci
Definition: ctype-utf8.cc:5795

my_strxfrm_flag_normalize
MYSQL_STRINGS_EXPORT unsigned my_strxfrm_flag_normalize(unsigned flags)
Definition: ctype-simple.cc:1497

my_charset_is_ascii_based
MYSQL_STRINGS_EXPORT bool my_charset_is_ascii_based(const CHARSET_INFO *cs)
Detect whether a character set is ASCII compatible.
Definition: m_ctype.h:512

MY_CHAR_X
static constexpr uint8_t MY_CHAR_X
Definition: m_ctype.h:548

MY_CS_TOOSMALL2
static constexpr int MY_CS_TOOSMALL2
Definition: m_ctype.h:91

my_wildcmp_mb_bin
MYSQL_STRINGS_EXPORT int my_wildcmp_mb_bin(const CHARSET_INFO *cs, const char *str, const char *str_end, const char *wildstr, const char *wildend, int escape, int w_one, int w_many)
Definition: ctype-mb.cc:1040

my_islower
bool my_islower(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:576

MY_CS_PRIMARY
static constexpr uint32_t MY_CS_PRIMARY
Definition: m_ctype.h:122

my_binary_compare
bool my_binary_compare(const CHARSET_INFO *cs)
Definition: m_ctype.h:619

MY_CS_COMPILED
static constexpr uint32_t MY_CS_COMPILED
Definition: m_ctype.h:112

MY_CHAR_B
static constexpr uint8_t MY_CHAR_B
Definition: m_ctype.h:547

my_strnncoll
int my_strnncoll(const CHARSET_INFO *cs, const uint8_t *a, size_t a_length, const uint8_t *b, size_t b_length)
Definition: m_ctype.h:633

my_isgraph
bool my_isgraph(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:601

my_charset_filename
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_filename
Definition: ctype-utf8.cc:7057

MY_CS_CSSORT
static constexpr uint32_t MY_CS_CSSORT
Definition: m_ctype.h:136

my_toupper
char my_toupper(const CHARSET_INFO *cs, char ch)
Definition: m_ctype.h:559

my_charset_utf32_unicode_ci
MYSQL_STRINGS_EXPORT CHARSET_INFO my_charset_utf32_unicode_ci
Definition: ctype-uca.cc:7837

Pad_attribute
Pad_attribute
Definition: m_ctype.h:244

NO_PAD
@ NO_PAD
Definition: m_ctype.h:244

PAD_SPACE
@ PAD_SPACE
Definition: m_ctype.h:244

MY_CS_TOOSMALL6
static constexpr int MY_CS_TOOSMALL6
Definition: m_ctype.h:101

MY_CHAR_U
static constexpr uint8_t MY_CHAR_U
Definition: m_ctype.h:541

strend
static const char * strend(const char *s)
Definition: m_string.h:69

my_loglevel.h
Definition of the global "loglevel" enumeration.

loglevel
loglevel
Definition: my_loglevel.h:41

path
static char * path
Definition: mysqldump.cc:149

anonymous_namespace{config_generator.cc}::str
std::string str(const mysqlrouter::ConfigGenerator::Options::Endpoint &ep)
Definition: config_generator.cc:1073

cs
Definition: commit_order_queue.h:34

dd::system_views::escape
static std::string escape(const std::string &str)
Escapes (only) apostrophes.
Definition: st_units_of_measure.cc:39

gis::length
bool length(const dd::Spatial_reference_system *srs, const Geometry *g1, double *length, bool *null) noexcept
Computes the length of linestrings and multilinestrings.
Definition: length.cc:76

json_binary::err
static Value err()
Create a Value object that represents an error condition.
Definition: json_binary.cc:927

mysqlrouter::size
size_t size(const char *const c)
Definition: base64.h:46

rules_table_service::end
Cursor end()
A past-the-end Cursor.
Definition: rules_table_service.cc:192

key
required string key
Definition: replication_asynchronous_connection_failover.proto:60

CHARSET_INFO
Definition: m_ctype.h:423

CHARSET_INFO::casedn_multiply
uint8_t casedn_multiply
Definition: m_ctype.h:445

CHARSET_INFO::pad_char
uint8_t pad_char
Definition: m_ctype.h:451

CHARSET_INFO::state_maps
const struct lex_state_maps_st * state_maps
Definition: m_ctype.h:441

CHARSET_INFO::tab_to_uni
const uint16_t * tab_to_uni
Definition: m_ctype.h:438

CHARSET_INFO::binary_number
unsigned binary_number
Definition: m_ctype.h:426

CHARSET_INFO::ctype
const uint8_t * ctype
Definition: m_ctype.h:433

CHARSET_INFO::csname
const char * csname
Definition: m_ctype.h:428

CHARSET_INFO::max_sort_char
my_wc_t max_sort_char
Definition: m_ctype.h:450

CHARSET_INFO::caseinfo
const MY_UNICASE_INFO * caseinfo
Definition: m_ctype.h:440

CHARSET_INFO::escape_with_backslash_is_dangerous
bool escape_with_backslash_is_dangerous
Definition: m_ctype.h:452

CHARSET_INFO::number
unsigned number
Definition: m_ctype.h:424

CHARSET_INFO::to_lower
const uint8_t * to_lower
Definition: m_ctype.h:434

CHARSET_INFO::caseup_multiply
uint8_t caseup_multiply
Definition: m_ctype.h:444

CHARSET_INFO::mbmaxlenlen
unsigned mbmaxlenlen
Definition: m_ctype.h:448

CHARSET_INFO::mbmaxlen
unsigned mbmaxlen
Definition: m_ctype.h:447

CHARSET_INFO::strxfrm_multiply
unsigned strxfrm_multiply
Definition: m_ctype.h:443

CHARSET_INFO::coll
MY_COLLATION_HANDLER * coll
Definition: m_ctype.h:456

CHARSET_INFO::sort_order
const uint8_t * sort_order
Definition: m_ctype.h:436

CHARSET_INFO::cset
MY_CHARSET_HANDLER * cset
Definition: m_ctype.h:455

CHARSET_INFO::m_coll_name
const char * m_coll_name
Definition: m_ctype.h:429

CHARSET_INFO::ident_map
const uint8_t * ident_map
Definition: m_ctype.h:442

CHARSET_INFO::levels_for_compare
uint8_t levels_for_compare
Definition: m_ctype.h:453

CHARSET_INFO::mbminlen
unsigned mbminlen
Definition: m_ctype.h:446

CHARSET_INFO::tab_from_uni
const MY_UNI_IDX * tab_from_uni
Definition: m_ctype.h:439

CHARSET_INFO::coll_param
struct Coll_param * coll_param
Definition: m_ctype.h:432

CHARSET_INFO::uca
struct MY_UCA_INFO * uca
Definition: m_ctype.h:437

CHARSET_INFO::to_upper
const uint8_t * to_upper
Definition: m_ctype.h:435

CHARSET_INFO::min_sort_char
my_wc_t min_sort_char
Definition: m_ctype.h:449

CHARSET_INFO::primary_number
unsigned primary_number
Definition: m_ctype.h:425

CHARSET_INFO::pad_attribute
enum Pad_attribute pad_attribute
If this collation is PAD_SPACE, it collates as if all inputs were padded with a given number of space...
Definition: m_ctype.h:465

CHARSET_INFO::tailoring
const char * tailoring
Definition: m_ctype.h:431

CHARSET_INFO::state
unsigned state
Definition: m_ctype.h:427

CHARSET_INFO::comment
const char * comment
Definition: m_ctype.h:430

Coll_param
Definition: str_uca_type.h:74

MY_CHARSET_ERRMSG
Helper structure to return error messages from collation parser/initializer.
Definition: m_ctype.h:181

MY_CHARSET_ERRMSG::errcode
unsigned errcode
See include/mysys_err.h.
Definition: m_ctype.h:183

MY_CHARSET_ERRMSG::errarg
char errarg[errmsg_size]
Error message text.
Definition: m_ctype.h:184

MY_CHARSET_ERRMSG::errmsg_size
static constexpr int errmsg_size
Definition: m_ctype.h:182

MY_CHARSET_HANDLER
Definition: m_ctype.h:342

MY_CHARSET_HANDLER::lengthsp
size_t(* lengthsp)(const CHARSET_INFO *, const char *ptr, size_t length)
Given a pointer and a length in bytes, returns a new length in bytes where all trailing space charact...
Definition: m_ctype.h:374

MY_CHARSET_HANDLER::strntod
double(* strntod)(const CHARSET_INFO *, const char *s, size_t l, const char **e, int *err)
Definition: m_ctype.h:412

MY_CHARSET_HANDLER::strtoll10
long long(* strtoll10)(const CHARSET_INFO *cs, const char *nptr, const char **endptr, int *error)
Definition: m_ctype.h:414

MY_CHARSET_HANDLER::ctype
int(* ctype)(const CHARSET_INFO *cs, int *ctype, const uint8_t *s, const uint8_t *e)
Definition: m_ctype.h:382

MY_CHARSET_HANDLER::well_formed_len
size_t(* well_formed_len)(const CHARSET_INFO *, const char *b, const char *e, size_t nchars, int *error)
Definition: m_ctype.h:357

MY_CHARSET_HANDLER::caseup_str
size_t(* caseup_str)(const CHARSET_INFO *, char *)
Definition: m_ctype.h:386

MY_CHARSET_HANDLER::strntoull10rnd
unsigned long long(* strntoull10rnd)(const CHARSET_INFO *cs, const char *str, size_t length, int unsigned_fl, const char **endptr, int *error)
Definition: m_ctype.h:416

MY_CHARSET_HANDLER::ismbchar
unsigned(* ismbchar)(const CHARSET_INFO *, const char *, const char *)
Definition: m_ctype.h:345

MY_CHARSET_HANDLER::strntoull
unsigned long long(* strntoull)(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: m_ctype.h:410

MY_CHARSET_HANDLER::strntoul
unsigned long(* strntoul)(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: m_ctype.h:406

MY_CHARSET_HANDLER::init
bool(* init)(CHARSET_INFO *, MY_CHARSET_LOADER *loader, MY_CHARSET_ERRMSG *)
Definition: m_ctype.h:343

MY_CHARSET_HANDLER::strntol
long(* strntol)(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: m_ctype.h:404

MY_CHARSET_HANDLER::charpos
size_t(* charpos)(const CHARSET_INFO *, const char *b, const char *e, size_t pos)
Return at which byte codepoint number "pos" begins, relative to the start of the string.
Definition: m_ctype.h:355

MY_CHARSET_HANDLER::longlong10_to_str
size_t(* longlong10_to_str)(const CHARSET_INFO *, char *to, size_t n, int radix, long long val)
Definition: m_ctype.h:398

MY_CHARSET_HANDLER::numchars
size_t(* numchars)(const CHARSET_INFO *, const char *b, const char *e)
Definition: m_ctype.h:347

MY_CHARSET_HANDLER::numcells
size_t(* numcells)(const CHARSET_INFO *, const char *b, const char *e)
Definition: m_ctype.h:375

MY_CHARSET_HANDLER::fill
void(* fill)(const CHARSET_INFO *, char *to, size_t len, int fill)
Definition: m_ctype.h:401

MY_CHARSET_HANDLER::wc_mb
my_charset_conv_wc_mb wc_mb
Definition: m_ctype.h:379

MY_CHARSET_HANDLER::scan
size_t(* scan)(const CHARSET_INFO *, const char *b, const char *e, int sq)
Definition: m_ctype.h:419

MY_CHARSET_HANDLER::strntoll
long long(* strntoll)(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: m_ctype.h:408

MY_CHARSET_HANDLER::mb_wc
my_charset_conv_mb_wc mb_wc
Definition: m_ctype.h:378

MY_CHARSET_HANDLER::mbcharlen
unsigned(* mbcharlen)(const CHARSET_INFO *, unsigned c)
Definition: m_ctype.h:346

MY_CHARSET_HANDLER::caseup
my_charset_conv_case caseup
Definition: m_ctype.h:389

MY_CHARSET_HANDLER::casedn_str
size_t(* casedn_str)(const CHARSET_INFO *, char *)
Definition: m_ctype.h:387

MY_CHARSET_HANDLER::long10_to_str
size_t(* long10_to_str)(const CHARSET_INFO *, char *to, size_t n, int radix, long int val)
Definition: m_ctype.h:396

MY_CHARSET_HANDLER::casedn
my_charset_conv_case casedn
Definition: m_ctype.h:390

MY_CHARSET_HANDLER::snprintf
size_t(* snprintf)(const CHARSET_INFO *, char *to, size_t n, const char *fmt,...)
Definition: m_ctype.h:393

MY_COLLATION_HANDLER
Definition: m_ctype.h:247

MY_COLLATION_HANDLER::strcasecmp
int(* strcasecmp)(const CHARSET_INFO *, const char *, const char *)
Definition: m_ctype.h:311

MY_COLLATION_HANDLER::strnxfrm
size_t(* strnxfrm)(const CHARSET_INFO *, uint8_t *dst, size_t dstlen, unsigned num_codepoints, const uint8_t *src, size_t srclen, unsigned flags)
Transform the string into a form such that memcmp() between transformed strings yields the correct co...
Definition: m_ctype.h:288

MY_COLLATION_HANDLER::strstr
unsigned(* strstr)(const CHARSET_INFO *, const char *b, size_t b_length, const char *s, size_t s_length, my_match_t *match, unsigned nmatch)
Definition: m_ctype.h:313

MY_COLLATION_HANDLER::like_range
bool(* like_range)(const CHARSET_INFO *, const char *s, size_t s_length, char w_prefix, char w_one, char w_many, size_t res_length, char *min_str, char *max_str, size_t *min_len, size_t *max_len)
Definition: m_ctype.h:303

MY_COLLATION_HANDLER::strnncoll
int(* strnncoll)(const CHARSET_INFO *, const uint8_t *, size_t, const uint8_t *, size_t, bool)
Definition: m_ctype.h:251

MY_COLLATION_HANDLER::hash_sort
void(* hash_sort)(const CHARSET_INFO *cs, const uint8_t *key, size_t len, uint64_t *nr1, uint64_t *nr2)
Compute a sort hash for the given key.
Definition: m_ctype.h:328

MY_COLLATION_HANDLER::wildcmp
int(* wildcmp)(const CHARSET_INFO *, const char *str, const char *str_end, const char *wildstr, const char *wildend, int escape, int w_one, int w_many)
Definition: m_ctype.h:307

MY_COLLATION_HANDLER::propagate
bool(* propagate)(const CHARSET_INFO *cs, const uint8_t *str, size_t len)
Definition: m_ctype.h:330

MY_COLLATION_HANDLER::init
bool(* init)(CHARSET_INFO *, MY_CHARSET_LOADER *, MY_CHARSET_ERRMSG *)
Definition: m_ctype.h:248

MY_COLLATION_HANDLER::strnncollsp
int(* strnncollsp)(const CHARSET_INFO *, const uint8_t *, size_t, const uint8_t *, size_t)
Compare the two strings under the pad rules given by the collation.
Definition: m_ctype.h:262

MY_COLLATION_HANDLER::strnxfrmlen
size_t(* strnxfrmlen)(const CHARSET_INFO *, size_t num_bytes)
Return the maximum number of output bytes needed for strnxfrm() to output all weights for any string ...
Definition: m_ctype.h:302

MY_COLLATION_HANDLER::uninit
void(* uninit)(CHARSET_INFO *, MY_CHARSET_LOADER *)
Definition: m_ctype.h:249

MY_UCA_INFO
Definition: str_uca_type.h:125

MY_UNICASE_CHARACTER
Definition: m_ctype.h:64

MY_UNICASE_CHARACTER::tolower
uint32_t tolower
Definition: m_ctype.h:66

MY_UNICASE_CHARACTER::toupper
uint32_t toupper
Definition: m_ctype.h:65

MY_UNICASE_CHARACTER::sort
uint32_t sort
Definition: m_ctype.h:67

MY_UNICASE_INFO
Definition: m_ctype.h:70

MY_UNICASE_INFO::page
const MY_UNICASE_CHARACTER ** page
Definition: m_ctype.h:72

MY_UNICASE_INFO::maxchar
my_wc_t maxchar
Definition: m_ctype.h:71

MY_UNI_CTYPE
Definition: m_ctype.h:77

MY_UNI_CTYPE::ctype
uint8_t * ctype
Definition: m_ctype.h:79

MY_UNI_CTYPE::pctype
uint8_t pctype
Definition: m_ctype.h:78

MY_UNI_IDX
Definition: m_ctype.h:164

MY_UNI_IDX::to
uint16_t to
Definition: m_ctype.h:166

MY_UNI_IDX::from
uint16_t from
Definition: m_ctype.h:165

MY_UNI_IDX::tab
const uint8_t * tab
Definition: m_ctype.h:167

lex_state_maps_st
Definition: sql_chars.h:90

my_match_t
Definition: m_ctype.h:170

my_match_t::mb_len
unsigned mb_len
Definition: m_ctype.h:173

my_match_t::beg
unsigned beg
Definition: m_ctype.h:171

my_match_t::end
unsigned end
Definition: m_ctype.h:172

template_utils.h

privilege_status::error
@ error

n
int n
Definition: xcom_base.cc:509