37 #define UCA_MAX_CHAR_GRP 4
81 #define MY_UCA_MAX_CONTRACTION 6
82 #define MY_UCA_MAX_WEIGHT_SIZE 25
83 #define MY_UCA_WEIGHT_LEVELS 1
174 #define MY_UCA_CNT_FLAG_SIZE 4096
175 #define MY_UCA_CNT_FLAG_MASK 4095
178 #define MY_UCA_CNT_HEAD 1
181 #define MY_UCA_CNT_TAIL 2
196 #define MY_UCA_CNT_MID1 4
213 #define MY_UCA_PREVIOUS_CONTEXT_HEAD 64
216 #define MY_UCA_PREVIOUS_CONTEXT_TAIL 128
218 #define MY_UCA_PSHIFT 8
249 const std::vector<MY_CONTRACTION> *cont_nodes,
my_wc_t wc1,
my_wc_t wc2);
static int flags[50]
Definition: hp_test1.cc:40
ulong my_wc_t
Our own version of wchar_t, i.e., a type that holds a single Unicode code point ("wide character").
Definition: m_ctype.h:59
Some integer typedefs for easier portability.
unsigned char uchar
Definition: my_inttypes.h:52
uint16_t uint16
Definition: my_inttypes.h:65
enum_uca_ver
Definition: str_uca_type.h:38
@ UCA_V520
Definition: str_uca_type.h:38
@ UCA_V400
Definition: str_uca_type.h:38
@ UCA_V900
Definition: str_uca_type.h:38
#define MY_UCA_CNT_TAIL
Whether the given character can be the last in any contraction.
Definition: str_uca_type.h:181
bool my_uca_can_be_contraction_tail(const char *flags, my_wc_t wc)
Check if a code point can be a contraction tail.
Definition: str_uca_type.h:244
bool my_uca_can_be_contraction_head(const char *flags, my_wc_t wc)
Check if a code point can be a contraction head.
Definition: str_uca_type.h:230
enum_char_grp
Definition: str_uca_type.h:40
@ CHARGRP_NONE
Definition: str_uca_type.h:41
@ CHARGRP_ARAB
Definition: str_uca_type.h:45
@ CHARGRP_LATIN
Definition: str_uca_type.h:43
@ CHARGRP_CYRILLIC
Definition: str_uca_type.h:44
@ CHARGRP_KANA
Definition: str_uca_type.h:46
@ CHARGRP_CORE
Definition: str_uca_type.h:42
@ CHARGRP_OTHERS
Definition: str_uca_type.h:47
const uint16 * my_uca_contraction2_weight(const std::vector< MY_CONTRACTION > *cont_nodes, my_wc_t wc1, my_wc_t wc2)
Find a contraction consisting of two code points and return its weight array.
Definition: ctype-uca.cc:946
#define MY_UCA_MAX_WEIGHT_SIZE
Definition: str_uca_type.h:82
#define UCA_MAX_CHAR_GRP
Definition: str_uca_type.h:37
#define MY_UCA_CNT_FLAG_MASK
Definition: str_uca_type.h:175
#define MY_UCA_CNT_HEAD
Whether the given character can be the first in any contraction.
Definition: str_uca_type.h:178
enum_case_first
Definition: str_uca_type.h:67
@ CASE_FIRST_UPPER
Definition: str_uca_type.h:67
@ CASE_FIRST_LOWER
Definition: str_uca_type.h:67
@ CASE_FIRST_OFF
Definition: str_uca_type.h:67
Definition: str_uca_type.h:69
struct Reorder_param * reorder_param
Definition: str_uca_type.h:70
enum enum_case_first case_first
Definition: str_uca_type.h:73
bool norm_enabled
Definition: str_uca_type.h:71
Definition: str_uca_type.h:108
std::vector< MY_CONTRACTION > child_nodes_context
Definition: str_uca_type.h:112
std::vector< MY_CONTRACTION > child_nodes
Definition: str_uca_type.h:111
uint16 weight[MY_UCA_MAX_WEIGHT_SIZE]
Definition: str_uca_type.h:115
my_wc_t ch
Definition: str_uca_type.h:109
size_t contraction_len
Definition: str_uca_type.h:117
bool is_contraction_tail
Definition: str_uca_type.h:116
Definition: str_uca_type.h:120
uint16 extra_ce_ter_base
Definition: str_uca_type.h:171
my_wc_t first_non_ignorable
Definition: str_uca_type.h:144
uint16 extra_ce_pri_base
Definition: str_uca_type.h:169
uint16 ** weights
Definition: str_uca_type.h:126
my_wc_t last_tertiary_ignorable
Definition: str_uca_type.h:151
my_wc_t last_secondary_ignorable
Definition: str_uca_type.h:149
my_wc_t maxchar
Definition: str_uca_type.h:124
char * contraction_flags
Definition: str_uca_type.h:141
my_wc_t last_primary_ignorable
Definition: str_uca_type.h:147
bool have_contractions
Definition: str_uca_type.h:127
my_wc_t first_variable
Definition: str_uca_type.h:154
my_wc_t first_tertiary_ignorable
Definition: str_uca_type.h:150
my_wc_t last_trailing
Definition: str_uca_type.h:153
my_wc_t first_secondary_ignorable
Definition: str_uca_type.h:148
enum enum_uca_ver version
Definition: str_uca_type.h:121
my_wc_t last_non_ignorable
Definition: str_uca_type.h:145
uchar * lengths
Definition: str_uca_type.h:125
my_wc_t last_variable
Definition: str_uca_type.h:155
my_wc_t first_primary_ignorable
Definition: str_uca_type.h:146
my_wc_t first_trailing
Definition: str_uca_type.h:152
std::vector< MY_CONTRACTION > * contraction_nodes
Definition: str_uca_type.h:128
uint16 extra_ce_sec_base
Definition: str_uca_type.h:170
Definition: str_uca_type.h:60
enum enum_char_grp reorder_grp[UCA_MAX_CHAR_GRP]
Definition: str_uca_type.h:61
int wt_rec_num
Definition: str_uca_type.h:63
uint16 max_weight
Definition: str_uca_type.h:64
struct Reorder_wt_rec wt_rec[2 *UCA_MAX_CHAR_GRP]
Definition: str_uca_type.h:62
Definition: str_uca_type.h:55
struct Weight_boundary old_wt_bdy
Definition: str_uca_type.h:56
struct Weight_boundary new_wt_bdy
Definition: str_uca_type.h:57
Definition: str_uca_type.h:50
uint16 end
Definition: str_uca_type.h:52
uint16 begin
Definition: str_uca_type.h:51