MySQL 8.4.3
Source Code Documentation
ctype-sjis.cc File Reference
#include <cstddef>
#include <cstdint>
#include "my_compiler.h"
#include "mysql/strings/m_ctype.h"
#include "strings/m_ctype_internals.h"
#include "template_utils.h"

Macros

#define issjishead(c)    ((0x81 <= (c) && (c) <= 0x9f) || ((0xe0 <= (c)) && (c) <= 0xfc))
 
#define issjistail(c)    ((0x40 <= (c) && (c) <= 0x7e) || (0x80 <= (c) && (c) <= 0xfc))
 
#define sjiscode(c, d)    ((((unsigned)(uint8_t)(c)) << 8) | (unsigned)(uint8_t)(d))
 

Functions

static unsigned ismbchar_sjis (const CHARSET_INFO *cs, const char *p, const char *e)
 
static unsigned mbcharlen_sjis (const CHARSET_INFO *cs, unsigned c)
 
static int my_strnncoll_sjis_internal (const CHARSET_INFO *cs, const uint8_t **a_res, size_t a_length, const uint8_t **b_res, size_t b_length)
 
static int my_strnncoll_sjis (const CHARSET_INFO *cs, const uint8_t *a, size_t a_length, const uint8_t *b, size_t b_length, bool b_is_prefix)
 
static int my_strnncollsp_sjis (const CHARSET_INFO *cs, const uint8_t *a, size_t a_length, const uint8_t *b, size_t b_length)
 
static int my_mb_wc_sjis (const CHARSET_INFO *cs, my_wc_t *pwc, const uint8_t *s, const uint8_t *e)
 Scans an SJIS character from the input string and converts to Unicode code point. More...
 
static int my_wc_mb_sjis (const CHARSET_INFO *cs, my_wc_t wc, uint8_t *s, uint8_t *e)
 Puts the given Unicode character into an SJIS string. More...
 
static size_t my_numcells_sjis (const CHARSET_INFO *cs, const char *str, const char *str_end)
 
static size_t my_well_formed_len_sjis (const CHARSET_INFO *cs, const char *b, const char *e, size_t pos, int *error)
 

Variables

static const uint8_t ctype_sjis [257]
 
static const uint8_t to_lower_sjis []
 
static const uint8_t to_upper_sjis []
 
static const uint8_t sort_order_sjis []
 
static const MY_UNICASE_CHARACTER c81 [256]
 
static const MY_UNICASE_CHARACTER c82 [256]
 
static const MY_UNICASE_CHARACTER c83 [256]
 
static const MY_UNICASE_CHARACTER c84 [256]
 
static const MY_UNICASE_CHARACTER * my_caseinfo_pages_sjis [256]
 
static MY_UNICASE_INFO my_caseinfo_sjis = {0xFFFF, my_caseinfo_pages_sjis}
 
static const uint16_t sjis_to_unicode [65536]
 
static const uint16_t unicode_to_sjis [65536]
 
static MY_COLLATION_HANDLER my_collation_ci_handler
 
static MY_CHARSET_HANDLER my_charset_handler
 
CHARSET_INFO my_charset_sjis_japanese_ci
 
CHARSET_INFO my_charset_sjis_bin
 

Macro Definition Documentation

◆ issjishead

#define issjishead (   c)     ((0x81 <= (c) && (c) <= 0x9f) || ((0xe0 <= (c)) && (c) <= 0xfc))

◆ issjistail

#define issjistail (   c)     ((0x40 <= (c) && (c) <= 0x7e) || (0x80 <= (c) && (c) <= 0xfc))

◆ sjiscode

#define sjiscode (   c,
d 
)     ((((unsigned)(uint8_t)(c)) << 8) | (unsigned)(uint8_t)(d))

Function Documentation

◆ ismbchar_sjis()

static unsigned ismbchar_sjis ( const CHARSET_INFO *  cs,
const char *  p,
const char *  e 
)
static

◆ mbcharlen_sjis()

static unsigned mbcharlen_sjis ( const CHARSET_INFO *  cs,
unsigned  c 
)
static

◆ my_mb_wc_sjis()

static int my_mb_wc_sjis ( const CHARSET_INFO *  cs,
my_wc_t *  pwc,
const uint8_t *  s,
const uint8_t *  e 
)
static

Scans an SJIS character from the input string and converts to Unicode code point.

Parameters
[in] cs: Character set info, unused
[out] pwc: Unicode code point
[in] s: Beginning of the input string
[in] e: End of the input string
Return values
MY_CS_TOOSMALL: If the string was too short to scan a character
1: If a 1-byte character was scanned
2: If a 2-byte character was scanned
-2: If a 2-byte unassigned character was scanned
MY_CS_ILSEQ: If a wrong byte sequence was found

◆ my_numcells_sjis()

static size_t my_numcells_sjis ( const CHARSET_INFO *  cs,
const char *  str,
const char *  str_end 
)
static

◆ my_strnncoll_sjis()

static int my_strnncoll_sjis ( const CHARSET_INFO *  cs,
const uint8_t *  a,
size_t  a_length,
const uint8_t *  b,
size_t  b_length,
bool  b_is_prefix 
)
static

◆ my_strnncoll_sjis_internal()

static int my_strnncoll_sjis_internal ( const CHARSET_INFO *  cs,
const uint8_t **  a_res,
size_t  a_length,
const uint8_t **  b_res,
size_t  b_length 
)
static

◆ my_strnncollsp_sjis()

static int my_strnncollsp_sjis ( const CHARSET_INFO *  cs,
const uint8_t *  a,
size_t  a_length,
const uint8_t *  b,
size_t  b_length 
)
static

◆ my_wc_mb_sjis()

static int my_wc_mb_sjis ( const CHARSET_INFO *  cs,
my_wc_t  wc,
uint8_t *  s,
uint8_t *  e 
)
static

Puts the given Unicode character into an SJIS string.

Parameters
[in] cs: Character set info, unused
[in] wc: Unicode code point
[out] s: Beginning of the output string
[in] e: End of the output string
Return values
MY_CS_TOOSMALL: If the string was too short to put a character
1: If a 1-byte character was put
2: If a 2-byte character was put
MY_CS_ILUNI: If the Unicode character does not exist in SJIS

◆ my_well_formed_len_sjis()

static size_t my_well_formed_len_sjis ( const CHARSET_INFO *  cs,
const char *  b,
const char *  e,
size_t  pos,
int *  error 
)
static

Variable Documentation

◆ c81

const MY_UNICASE_CHARACTER c81[256]
static

◆ c82

const MY_UNICASE_CHARACTER c82[256]
static

◆ c83

const MY_UNICASE_CHARACTER c83[256]
static

◆ c84

const MY_UNICASE_CHARACTER c84[256]
static

◆ ctype_sjis

const uint8_t ctype_sjis[257]
static
Initial value:
= {
0,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0040, 0050, 0050, 0050, 0050, 0050, 0040, 0040,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0110, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0204, 0204, 0204, 0204, 0204, 0204, 0204, 0204,
0204, 0204, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0201, 0201, 0201, 0201, 0201, 0201, 0001,
0001, 0001, 0001, 0001, 0001, 0001, 0001, 0001,
0001, 0001, 0001, 0001, 0001, 0001, 0001, 0001,
0001, 0001, 0001, 0020, 0020, 0020, 0020, 0020,
0020, 0202, 0202, 0202, 0202, 0202, 0202, 0002,
0002, 0002, 0002, 0002, 0002, 0002, 0002, 0002,
0002, 0002, 0002, 0002, 0002, 0002, 0002, 0002,
0002, 0002, 0002, 0020, 0020, 0020, 0020, 0040,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0000, 0000, 0000}

◆ my_caseinfo_pages_sjis

const MY_UNICASE_CHARACTER* my_caseinfo_pages_sjis[256]
static

◆ my_caseinfo_sjis

MY_UNICASE_INFO my_caseinfo_sjis = {0xFFFF, my_caseinfo_pages_sjis}
static

◆ my_charset_handler

MY_CHARSET_HANDLER my_charset_handler
static
Initial value:
= {nullptr,
int my_mb_ctype_mb(const CHARSET_INFO *cs, int *ctype, const uint8_t *s, const uint8_t *e)
Definition: ctype-mb.cc:1322
size_t my_numchars_mb(const CHARSET_INFO *cs, const char *pos, const char *end)
Definition: ctype-mb.cc:315
size_t my_casedn_mb(const CHARSET_INFO *cs, char *src, size_t srclen, char *dst, size_t dstlen)
Definition: ctype-mb.cc:112
size_t my_casedn_str_mb(const CHARSET_INFO *cs, char *str)
Definition: ctype-mb.cc:58
size_t my_caseup_mb(const CHARSET_INFO *cs, char *src, size_t srclen, char *dst, size_t dstlen)
Definition: ctype-mb.cc:85
size_t my_charpos_mb3(const CHARSET_INFO *cs, const char *pos, const char *end, size_t length)
Definition: ctype-mb.cc:326
size_t my_caseup_str_mb(const CHARSET_INFO *cs, char *str)
Definition: ctype-mb.cc:41
long long my_strtoll10_8bit(const CHARSET_INFO *cs, const char *nptr, const char **endptr, int *error)
Definition: ctype-simple.cc:1125
unsigned long long my_strntoull10rnd_8bit(const CHARSET_INFO *cs, const char *str, size_t length, int unsigned_flag, const char **endptr, int *error)
Definition: ctype-simple.cc:1221
double my_strntod_8bit(const CHARSET_INFO *cs, const char *str, size_t length, const char **end, int *err)
Definition: ctype-simple.cc:636
long long my_strntoll_8bit(const CHARSET_INFO *cs, const char *nptr, size_t l, int base, const char **endptr, int *err)
Definition: ctype-simple.cc:461
size_t my_longlong10_to_str_8bit(const CHARSET_INFO *cs, char *dst, size_t len, int radix, long long val)
Definition: ctype-simple.cc:686
size_t my_long10_to_str_8bit(const CHARSET_INFO *cs, char *dst, size_t len, int radix, long int val)
Definition: ctype-simple.cc:650
size_t my_lengthsp_8bit(const CHARSET_INFO *cs, const char *ptr, size_t length)
Definition: ctype-simple.cc:927
unsigned long long my_strntoull_8bit(const CHARSET_INFO *cs, const char *nptr, size_t l, int base, const char **endptr, int *err)
Definition: ctype-simple.cc:539
size_t my_snprintf_8bit(const CHARSET_INFO *cs, char *to, size_t n, const char *fmt,...)
Definition: ctype-simple.cc:278
void my_fill_8bit(const CHARSET_INFO *cs, char *s, size_t l, int fill)
Definition: ctype-simple.cc:898
unsigned long my_strntoul_8bit(const CHARSET_INFO *cs, const char *nptr, size_t l, int base, const char **endptr, int *err)
Definition: ctype-simple.cc:389
long my_strntol_8bit(const CHARSET_INFO *cs, const char *nptr, size_t l, int base, const char **endptr, int *err)
Definition: ctype-simple.cc:311
size_t my_scan_8bit(const CHARSET_INFO *cs, const char *str, const char *end, int sq)
Definition: ctype-simple.cc:876
static int my_wc_mb_sjis(const CHARSET_INFO *cs, my_wc_t wc, uint8_t *s, uint8_t *e)
Puts the given Unicode character into an SJIS string.
Definition: ctype-sjis.cc:17898
static unsigned ismbchar_sjis(const CHARSET_INFO *cs, const char *p, const char *e)
Definition: ctype-sjis.cc:252
static size_t my_well_formed_len_sjis(const CHARSET_INFO *cs, const char *b, const char *e, size_t pos, int *error)
Definition: ctype-sjis.cc:17963
static int my_mb_wc_sjis(const CHARSET_INFO *cs, my_wc_t *pwc, const uint8_t *s, const uint8_t *e)
Scans an SJIS character from the input string and converts to Unicode code point.
Definition: ctype-sjis.cc:17858
static size_t my_numcells_sjis(const CHARSET_INFO *cs, const char *str, const char *str_end)
Definition: ctype-sjis.cc:17938
static unsigned mbcharlen_sjis(const CHARSET_INFO *cs, unsigned c)
Definition: ctype-sjis.cc:259

◆ my_charset_sjis_bin

CHARSET_INFO my_charset_sjis_bin

◆ my_charset_sjis_japanese_ci

CHARSET_INFO my_charset_sjis_japanese_ci

◆ my_collation_ci_handler

MY_COLLATION_HANDLER my_collation_ci_handler
static
Initial value:
= {
nullptr,
nullptr,
unsigned my_instr_mb(const CHARSET_INFO *cs, const char *b, size_t b_length, const char *s, size_t s_length, my_match_t *match, unsigned nmatch)
Definition: ctype-mb.cc:357
int my_wildcmp_mb(const CHARSET_INFO *cs, const char *str, const char *str_end, const char *wildstr, const char *wildend, int escape, int w_one, int w_many)
Definition: ctype-mb.cc:308
size_t my_strnxfrm_mb(const CHARSET_INFO *cs, uint8_t *dst, size_t dstlen, unsigned nweights, const uint8_t *src, size_t srclen, unsigned flags)
Definition: ctype-mb.cc:496
bool my_like_range_mb(const CHARSET_INFO *cs, const char *ptr, size_t ptr_length, char escape, char w_one, char w_many, size_t res_length, char *min_str, char *max_str, size_t *min_length, size_t *max_length)
Definition: ctype-mb.cc:657
bool my_propagate_simple(const CHARSET_INFO *cs, const uint8_t *str, size_t length)
Definition: ctype-simple.cc:1474
int my_strcasecmp_8bit(const CHARSET_INFO *cs, const char *s, const char *t)
Definition: ctype-simple.cc:241
size_t my_strnxfrmlen_simple(const CHARSET_INFO *cs, size_t len)
Definition: ctype-simple.cc:62
void my_hash_sort_simple(const CHARSET_INFO *cs, const uint8_t *key, size_t len, uint64_t *nr1, uint64_t *nr2)
Definition: ctype-simple.cc:288
static int my_strnncoll_sjis(const CHARSET_INFO *cs, const uint8_t *a, size_t a_length, const uint8_t *b, size_t b_length, bool b_is_prefix)
Definition: ctype-sjis.cc:1402
static int my_strnncollsp_sjis(const CHARSET_INFO *cs, const uint8_t *a, size_t a_length, const uint8_t *b, size_t b_length)
Definition: ctype-sjis.cc:1410

◆ sjis_to_unicode

const uint16_t sjis_to_unicode[65536]
static

◆ sort_order_sjis

const uint8_t sort_order_sjis[]
static

◆ to_lower_sjis

const uint8_t to_lower_sjis[]
static

◆ to_upper_sjis

const uint8_t to_upper_sjis[]
static

◆ unicode_to_sjis

const uint16_t unicode_to_sjis[65536]
static