MySQL 8.0.40
Source Code Documentation
ctype-sjis.cc File Reference
#include <stddef.h>
#include <sys/types.h>
#include "m_ctype.h"
#include "my_compiler.h"
#include "my_inttypes.h"
#include "template_utils.h"

Macros

#define issjishead(c)    ((0x81 <= (c) && (c) <= 0x9f) || ((0xe0 <= (c)) && (c) <= 0xfc))
 
#define issjistail(c)    ((0x40 <= (c) && (c) <= 0x7e) || (0x80 <= (c) && (c) <= 0xfc))
 
#define sjiscode(c, d)   ((((uint)(uchar)(c)) << 8) | (uint)(uchar)(d))
 

Functions

static uint ismbchar_sjis (const CHARSET_INFO *cs, const char *p, const char *e)
 
static uint mbcharlen_sjis (const CHARSET_INFO *cs, uint c)
 
static int my_strnncoll_sjis_internal (const CHARSET_INFO *cs, const uchar **a_res, size_t a_length, const uchar **b_res, size_t b_length)
 
static int my_strnncoll_sjis (const CHARSET_INFO *cs, const uchar *a, size_t a_length, const uchar *b, size_t b_length, bool b_is_prefix)
 
static int my_strnncollsp_sjis (const CHARSET_INFO *cs, const uchar *a, size_t a_length, const uchar *b, size_t b_length)
 
static int my_mb_wc_sjis (const CHARSET_INFO *cs, my_wc_t *pwc, const uchar *s, const uchar *e)
 Scans an SJIS character from the input string and converts to Unicode code point. More...
 
static int my_wc_mb_sjis (const CHARSET_INFO *cs, my_wc_t wc, uchar *s, uchar *e)
 Puts the given Unicode character into an SJIS string. More...
 
static size_t my_numcells_sjis (const CHARSET_INFO *cs, const char *str, const char *str_end)
 
static size_t my_well_formed_len_sjis (const CHARSET_INFO *cs, const char *b, const char *e, size_t pos, int *error)
 

Variables

static const uchar ctype_sjis [257]
 
static const uchar to_lower_sjis []
 
static const uchar to_upper_sjis []
 
static const uchar sort_order_sjis []
 
static const MY_UNICASE_CHARACTER c81 [256]
 
static const MY_UNICASE_CHARACTER c82 [256]
 
static const MY_UNICASE_CHARACTER c83 [256]
 
static const MY_UNICASE_CHARACTER c84 [256]
 
static const MY_UNICASE_CHARACTER * my_caseinfo_pages_sjis [256]
 
static MY_UNICASE_INFO my_caseinfo_sjis = {0xFFFF, my_caseinfo_pages_sjis}
 
static const uint16 sjis_to_unicode [65536]
 
static const uint16 unicode_to_sjis [65536]
 
static MY_COLLATION_HANDLER my_collation_ci_handler
 
static MY_CHARSET_HANDLER my_charset_handler
 
CHARSET_INFO my_charset_sjis_japanese_ci
 
CHARSET_INFO my_charset_sjis_bin
 

Macro Definition Documentation

◆ issjishead

#define issjishead (   c)     ((0x81 <= (c) && (c) <= 0x9f) || ((0xe0 <= (c)) && (c) <= 0xfc))

◆ issjistail

#define issjistail (   c)     ((0x40 <= (c) && (c) <= 0x7e) || (0x80 <= (c) && (c) <= 0xfc))

◆ sjiscode

#define sjiscode (   c,
  d 
)    ((((uint)(uchar)(c)) << 8) | (uint)(uchar)(d))

Function Documentation

◆ ismbchar_sjis()

static uint ismbchar_sjis ( const CHARSET_INFO *  cs,
const char *  p,
const char *  e 
)
static

◆ mbcharlen_sjis()

static uint mbcharlen_sjis ( const CHARSET_INFO *  cs,
uint  c 
)
static

◆ my_mb_wc_sjis()

static int my_mb_wc_sjis ( const CHARSET_INFO *  cs,
my_wc_t *  pwc,
const uchar *  s,
const uchar *  e 
)
static

Scans an SJIS character from the input string and converts to Unicode code point.

Parameters
[in]   cs    Character set info, unused
[out]  pwc   Unicode code point
[in]   s     Beginning of the input string
[in]   e     End of the input string
Return values
MY_CS_TOOSMALL   If the string was too short to scan a character
1                If a 1-byte character was scanned
2                If a 2-byte character was scanned
-2               If a 2-byte unassigned character was scanned
MY_CS_ILSEQ      If a wrong byte sequence was found

◆ my_numcells_sjis()

static size_t my_numcells_sjis ( const CHARSET_INFO *  cs,
const char *  str,
const char *  str_end 
)
static

◆ my_strnncoll_sjis()

static int my_strnncoll_sjis ( const CHARSET_INFO *  cs,
const uchar *  a,
size_t  a_length,
const uchar *  b,
size_t  b_length,
bool  b_is_prefix 
)
static

◆ my_strnncoll_sjis_internal()

static int my_strnncoll_sjis_internal ( const CHARSET_INFO *  cs,
const uchar **  a_res,
size_t  a_length,
const uchar **  b_res,
size_t  b_length 
)
static

◆ my_strnncollsp_sjis()

static int my_strnncollsp_sjis ( const CHARSET_INFO *  cs,
const uchar *  a,
size_t  a_length,
const uchar *  b,
size_t  b_length 
)
static

◆ my_wc_mb_sjis()

static int my_wc_mb_sjis ( const CHARSET_INFO *  cs,
my_wc_t  wc,
uchar *  s,
uchar *  e 
)
static

Puts the given Unicode character into an SJIS string.

Parameters
[in]   cs   Character set info, unused
[in]   wc   Unicode code point
[in]   s    Beginning of the output string
[in]   e    End of the output string
Return values
MY_CS_TOOSMALL   If the string was too short to put a character
1                If a 1-byte character was put
2                If a 2-byte character was put
MY_CS_ILUNI      If the Unicode character does not exist in SJIS

◆ my_well_formed_len_sjis()

static size_t my_well_formed_len_sjis ( const CHARSET_INFO *  cs,
const char *  b,
const char *  e,
size_t  pos,
int *  error 
)
static

Variable Documentation

◆ c81

const MY_UNICASE_CHARACTER c81[256]
static

◆ c82

const MY_UNICASE_CHARACTER c82[256]
static

◆ c83

const MY_UNICASE_CHARACTER c83[256]
static

◆ c84

const MY_UNICASE_CHARACTER c84[256]
static

◆ ctype_sjis

const uchar ctype_sjis[257]
static
Initial value:
= {
0,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0040, 0050, 0050, 0050, 0050, 0050, 0040, 0040,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0040, 0040, 0040, 0040, 0040, 0040, 0040, 0040,
0110, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0204, 0204, 0204, 0204, 0204, 0204, 0204, 0204,
0204, 0204, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0201, 0201, 0201, 0201, 0201, 0201, 0001,
0001, 0001, 0001, 0001, 0001, 0001, 0001, 0001,
0001, 0001, 0001, 0001, 0001, 0001, 0001, 0001,
0001, 0001, 0001, 0020, 0020, 0020, 0020, 0020,
0020, 0202, 0202, 0202, 0202, 0202, 0202, 0002,
0002, 0002, 0002, 0002, 0002, 0002, 0002, 0002,
0002, 0002, 0002, 0002, 0002, 0002, 0002, 0002,
0002, 0002, 0002, 0020, 0020, 0020, 0020, 0040,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020, 0020,
0020, 0020, 0020, 0020, 0020, 0000, 0000, 0000}

◆ my_caseinfo_pages_sjis

const MY_UNICASE_CHARACTER* my_caseinfo_pages_sjis[256]
static

◆ my_caseinfo_sjis

MY_UNICASE_INFO my_caseinfo_sjis = {0xFFFF, my_caseinfo_pages_sjis}
static

◆ my_charset_handler

MY_CHARSET_HANDLER my_charset_handler
static
Initial value:
= {nullptr,
static uint ismbchar_sjis(const CHARSET_INFO *cs, const char *p, const char *e)
Definition: ctype-sjis.cc:246
static size_t my_well_formed_len_sjis(const CHARSET_INFO *cs, const char *b, const char *e, size_t pos, int *error)
Definition: ctype-sjis.cc:17952
static int my_wc_mb_sjis(const CHARSET_INFO *cs, my_wc_t wc, uchar *s, uchar *e)
Puts the given Unicode character into an SJIS string.
Definition: ctype-sjis.cc:17887
static int my_mb_wc_sjis(const CHARSET_INFO *cs, my_wc_t *pwc, const uchar *s, const uchar *e)
Scans an SJIS character from the input string and converts to Unicode code point.
Definition: ctype-sjis.cc:17847
static uint mbcharlen_sjis(const CHARSET_INFO *cs, uint c)
Definition: ctype-sjis.cc:252
static size_t my_numcells_sjis(const CHARSET_INFO *cs, const char *str, const char *str_end)
Definition: ctype-sjis.cc:17927
size_t my_casedn_str_mb(const CHARSET_INFO *, char *)
Definition: ctype-mb.cc:61
size_t my_charpos_mb3(const CHARSET_INFO *, const char *b, const char *e, size_t pos)
Definition: ctype-mb.cc:331
double my_strntod_8bit(const CHARSET_INFO *, const char *s, size_t l, const char **e, int *err)
Definition: ctype-simple.cc:646
size_t my_snprintf_8bit(const CHARSET_INFO *, char *to, size_t n, const char *fmt,...)
Definition: ctype-simple.cc:281
ulonglong my_strntoull10rnd_8bit(const CHARSET_INFO *cs, const char *str, size_t length, int unsigned_fl, const char **endptr, int *error)
Definition: ctype-simple.cc:1235
ulong my_strntoul_8bit(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: ctype-simple.cc:397
size_t my_caseup_mb(const CHARSET_INFO *, char *src, size_t srclen, char *dst, size_t dstlen)
Definition: ctype-mb.cc:88
void my_fill_8bit(const CHARSET_INFO *cs, char *to, size_t l, int fill)
Definition: ctype-simple.cc:907
size_t my_casedn_mb(const CHARSET_INFO *, char *src, size_t srclen, char *dst, size_t dstlen)
Definition: ctype-mb.cc:115
size_t my_caseup_str_mb(const CHARSET_INFO *, char *)
Definition: ctype-mb.cc:44
size_t my_longlong10_to_str_8bit(const CHARSET_INFO *, char *to, size_t l, int radix, longlong val)
Definition: ctype-simple.cc:695
size_t my_numchars_mb(const CHARSET_INFO *, const char *b, const char *e)
Definition: ctype-mb.cc:320
int my_mb_ctype_mb(const CHARSET_INFO *, int *, const uchar *, const uchar *)
Definition: ctype-mb.cc:1324
long my_strntol_8bit(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: ctype-simple.cc:318
size_t my_lengthsp_8bit(const CHARSET_INFO *cs, const char *ptr, size_t length)
Definition: ctype-simple.cc:936
longlong my_strtoll10_8bit(const CHARSET_INFO *cs, const char *nptr, const char **endptr, int *error)
Definition: ctype-simple.cc:1139
size_t my_long10_to_str_8bit(const CHARSET_INFO *, char *to, size_t l, int radix, long int val)
Definition: ctype-simple.cc:659
ulonglong my_strntoull_8bit(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: ctype-simple.cc:549
size_t my_scan_8bit(const CHARSET_INFO *cs, const char *b, const char *e, int sq)
Definition: ctype-simple.cc:885
longlong my_strntoll_8bit(const CHARSET_INFO *, const char *s, size_t l, int base, const char **e, int *err)
Definition: ctype-simple.cc:470

◆ my_charset_sjis_bin

CHARSET_INFO my_charset_sjis_bin

◆ my_charset_sjis_japanese_ci

CHARSET_INFO my_charset_sjis_japanese_ci

◆ my_collation_ci_handler

MY_COLLATION_HANDLER my_collation_ci_handler
static
Initial value:
= {
nullptr,
nullptr,
static int my_strnncoll_sjis(const CHARSET_INFO *cs, const uchar *a, size_t a_length, const uchar *b, size_t b_length, bool b_is_prefix)
Definition: ctype-sjis.cc:1392
static int my_strnncollsp_sjis(const CHARSET_INFO *cs, const uchar *a, size_t a_length, const uchar *b, size_t b_length)
Definition: ctype-sjis.cc:1400
int my_strcasecmp_8bit(const CHARSET_INFO *cs, const char *, const char *)
Definition: ctype-simple.cc:245
size_t my_strnxfrmlen_simple(const CHARSET_INFO *, size_t)
Definition: ctype-simple.cc:64
uint my_instr_mb(const CHARSET_INFO *, const char *b, size_t b_length, const char *s, size_t s_length, my_match_t *match, uint nmatch)
Definition: ctype-mb.cc:362
int my_wildcmp_mb(const CHARSET_INFO *, const char *str, const char *str_end, const char *wildstr, const char *wildend, int escape, int w_one, int w_many)
Definition: ctype-mb.cc:313
void my_hash_sort_simple(const CHARSET_INFO *cs, const uchar *key, size_t len, uint64 *nr1, uint64 *nr2)
Definition: ctype-simple.cc:291
size_t my_strnxfrm_mb(const CHARSET_INFO *, uchar *dst, size_t dstlen, uint nweights, const uchar *src, size_t srclen, uint flags)
Definition: ctype-mb.cc:502
bool my_like_range_mb(const CHARSET_INFO *cs, const char *ptr, size_t ptr_length, char escape, char w_one, char w_many, size_t res_length, char *min_str, char *max_str, size_t *min_length, size_t *max_length)
Definition: ctype-mb.cc:661
bool my_propagate_simple(const CHARSET_INFO *cs, const uchar *str, size_t len)
Definition: ctype-simple.cc:1484

◆ sjis_to_unicode

const uint16 sjis_to_unicode[65536]
static

◆ sort_order_sjis

const uchar sort_order_sjis[]
static

◆ to_lower_sjis

const uchar to_lower_sjis[]
static

◆ to_upper_sjis

const uchar to_upper_sjis[]
static

◆ unicode_to_sjis

const uint16 unicode_to_sjis[65536]
static