/* Copyright (c) 2000, 2018, Oracle and/or its affiliates. All rights reserved. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License, version 2.0, as published by the Free Software Foundation. This program is also distributed with certain software (including but not limited to OpenSSL) that is licensed under separate terms, as designated in a particular file or component or in included license documentation. The authors of MySQL hereby grant you an additional permission to link the program and your derivative works with the separately licensed software that they have included with MySQL. Without limiting anything contained in the foregoing, this file, which is part of C Driver for MySQL (Connector/C), is also subject to the Universal FOSS Exception, version 1.0, a copy of which can be found at http://oss.oracle.com/licenses/universal-foss-exception. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License, version 2.0, for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */ /* Copyright (C) 2003 by Sathit Jittanupat * solving bug crash with long text field string * sorting with different number of space or sign char. within string Copyright (C) 2001 by Korakot Chaovavanich and Apisilp Trunganont Copyright (C) 1998, 1999 by Pruet Boonma Copyright (C) 1998 by Theppitak Karoonboonyanan Copyright (C) 1989, 1991 by Samphan Raruenrom Permission to use, copy, modify, distribute and sell this software and its documentation for any purpose is hereby granted without fee, provided that the above copyright notice appear in all copies. Samphan Raruenrom , Theppitak Karoonboonyanan , Pruet Boonma , Korakot Chaovavanich and Apisilp Trunganont makes no representations about the suitability of this software for any purpose. It is provided "as is" without express or implied warranty. */ /* This file is basicly tis620 character sets with some extra functions for tis-620 handling */ /* * This comment is parsed by configure to create ctype.c, * so don't change it unless you know what you are doing. * * .configure. strxfrm_multiply_tis620=4 */ #include #include #include "m_ctype.h" #include "m_string.h" #include "my_compiler.h" #include "my_inttypes.h" #include "my_macros.h" #include "strings/t_ctype.h" #define M L_MIDDLE #define U L_UPPER #define L L_LOWER #define UU L_UPRUPR #define X L_MIDDLE static const int t_ctype[][TOT_LEVELS] = { /*0x00*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x01*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x02*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x03*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x04*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x05*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x06*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x07*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x08*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x09*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0A*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0B*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0C*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0D*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0E*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x0F*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x10*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x11*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x12*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x13*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x14*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x15*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x16*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x17*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x18*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x19*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1A*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1B*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1C*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1D*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1E*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x1F*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x20*/ {IGNORE, IGNORE, L3_SPACE, IGNORE, M}, /*0x21*/ {IGNORE, IGNORE, L3_EXCLAMATION, IGNORE, M}, /*0x22*/ {IGNORE, IGNORE, L3_QUOTATION, IGNORE, M}, /*0x23*/ {IGNORE, IGNORE, L3_NUMBER, IGNORE, M}, /*0x24*/ {IGNORE, IGNORE, L3_DOLLAR, IGNORE, M}, /*0x25*/ {IGNORE, IGNORE, L3_PERCENT, IGNORE, M}, /*0x26*/ {IGNORE, IGNORE, L3_AMPERSAND, IGNORE, M}, /*0x27*/ {IGNORE, IGNORE, L3_APOSTROPHE, IGNORE, M}, /*0x28*/ {IGNORE, IGNORE, L3_L_PARANTHESIS, IGNORE, M}, /*0x29*/ {IGNORE, IGNORE, L3_R_PARENTHESIS, IGNORE, M}, /*0x2A*/ {IGNORE, IGNORE, L3_ASTERISK, IGNORE, M}, /*0x2B*/ {IGNORE, IGNORE, L3_PLUS, IGNORE, M}, /*0x2C*/ {IGNORE, IGNORE, L3_COMMA, IGNORE, M}, /*0x2D*/ {IGNORE, IGNORE, L3_HYPHEN, IGNORE, M}, /*0x2E*/ {IGNORE, IGNORE, L3_FULL_STOP, IGNORE, M}, /*0x2F*/ {IGNORE, IGNORE, L3_SOLIDUS, IGNORE, M}, /*0x30*/ {L1_08, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x31*/ {L1_18, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x32*/ {L1_28, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x33*/ {L1_38, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x34*/ {L1_48, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x35*/ {L1_58, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x36*/ {L1_68, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x37*/ {L1_78, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x38*/ {L1_88, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x39*/ {L1_98, L2_BLANK, L3_BLANK, L4_BLANK, M}, /*0x3A*/ {IGNORE, IGNORE, L3_COLON, IGNORE, M}, /*0x3B*/ {IGNORE, IGNORE, L3_SEMICOLON, IGNORE, M}, /*0x3C*/ {IGNORE, IGNORE, L3_LESS_THAN, IGNORE, M}, /*0x3D*/ {IGNORE, IGNORE, L3_EQUAL, IGNORE, M}, /*0x3E*/ {IGNORE, IGNORE, L3_GREATER_THAN, IGNORE, M}, /*0x3F*/ {IGNORE, IGNORE, L3_QUESTION, IGNORE, M}, /*0x40*/ {IGNORE, IGNORE, L3_AT, IGNORE, M}, /*0x41*/ {L1_A8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x42*/ {L1_B8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x43*/ {L1_C8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x44*/ {L1_D8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x45*/ {L1_E8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x46*/ {L1_F8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x47*/ {L1_G8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x48*/ {L1_H8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x49*/ {L1_I8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4A*/ {L1_J8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4B*/ {L1_K8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4C*/ {L1_L8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4D*/ {L1_M8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4E*/ {L1_N8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x4F*/ {L1_O8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x50*/ {L1_P8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x51*/ {L1_Q8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x52*/ {L1_R8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x53*/ {L1_S8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x54*/ {L1_T8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x55*/ {L1_U8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x56*/ {L1_V8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x57*/ {L1_W8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x58*/ {L1_X8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x59*/ {L1_Y8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x5A*/ {L1_Z8, L2_BLANK, L3_BLANK, L4_CAP, M}, /*0x5B*/ {IGNORE, IGNORE, L3_L_BRACKET, IGNORE, M}, /*0x5C*/ {IGNORE, IGNORE, L3_BK_SOLIDUS, IGNORE, M}, /*0x5D*/ {IGNORE, IGNORE, L3_R_BRACKET, IGNORE, M}, /*0x5E*/ {IGNORE, IGNORE, L3_CIRCUMFLEX, IGNORE, M}, /*0x5F*/ {IGNORE, IGNORE, L3_LOW_LINE, IGNORE, M}, /*0x60*/ {IGNORE, IGNORE, L3_GRAVE, IGNORE, M}, /*0x61*/ {L1_A8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x62*/ {L1_B8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x63*/ {L1_C8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x64*/ {L1_D8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x65*/ {L1_E8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x66*/ {L1_F8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x67*/ {L1_G8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x68*/ {L1_H8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x69*/ {L1_I8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6A*/ {L1_J8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6B*/ {L1_K8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6C*/ {L1_L8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6D*/ {L1_M8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6E*/ {L1_N8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x6F*/ {L1_O8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x70*/ {L1_P8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x71*/ {L1_Q8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x72*/ {L1_R8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x73*/ {L1_S8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x74*/ {L1_T8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x75*/ {L1_U8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x76*/ {L1_V8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x77*/ {L1_W8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x78*/ {L1_X8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x79*/ {L1_Y8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x7A*/ {L1_Z8, L2_BLANK, L3_BLANK, L4_MIN, M}, /*0x7B*/ {IGNORE, IGNORE, L3_L_BRACE, IGNORE, M}, /*0x7C*/ {IGNORE, IGNORE, L3_V_LINE, IGNORE, M}, /*0x7D*/ {IGNORE, IGNORE, L3_R_BRACE, IGNORE, M}, /*0x7E*/ {IGNORE, IGNORE, L3_TILDE, IGNORE, M}, /*0x7F*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x80*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x81*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x82*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x83*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x84*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x85*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x86*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x87*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x88*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x89*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8A*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8B*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8C*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8D*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8E*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x8F*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x90*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x91*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x92*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x93*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x94*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x95*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x96*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x97*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x98*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x99*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9A*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9B*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9C*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9D*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9E*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0x9F*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xA0*/ {IGNORE, IGNORE, L3_NB_SACE, IGNORE, X}, /*0xA1*/ {L1_KO_KAI, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA2*/ {L1_KHO_KHAI, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA3*/ {L1_KHO_KHUAT, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA4*/ {L1_KHO_KHWAI, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA5*/ {L1_KHO_KHON, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA6*/ {L1_KHO_RAKHANG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA7*/ {L1_NGO_NGU, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA8*/ {L1_CHO_CHAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xA9*/ {L1_CHO_CHING, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAA*/ {L1_CHO_CHANG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAB*/ {L1_SO_SO, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAC*/ {L1_CHO_CHOE, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAD*/ {L1_YO_YING, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAE*/ {L1_DO_CHADA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xAF*/ {L1_TO_PATAK, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB0*/ {L1_THO_THAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB1*/ {L1_THO_NANGMONTHO, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB2*/ {L1_THO_PHUTHAO, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB3*/ {L1_NO_NEN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB4*/ {L1_DO_DEK, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB5*/ {L1_TO_TAO, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB6*/ {L1_THO_THUNG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB7*/ {L1_THO_THAHAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB8*/ {L1_THO_THONG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xB9*/ {L1_NO_NU, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBA*/ {L1_BO_BAIMAI, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBB*/ {L1_PO_PLA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBC*/ {L1_PHO_PHUNG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBD*/ {L1_FO_FA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBE*/ {L1_PHO_PHAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xBF*/ {L1_FO_FAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC0*/ {L1_PHO_SAMPHAO, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC1*/ {L1_MO_MA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC2*/ {L1_YO_YAK, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC3*/ {L1_RO_RUA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC4*/ {L1_RU, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC5*/ {L1_LO_LING, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC6*/ {L1_LU, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC7*/ {L1_WO_WAEN, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC8*/ {L1_SO_SALA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xC9*/ {L1_SO_RUSI, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCA*/ {L1_SO_SUA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCB*/ {L1_HO_HIP, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCC*/ {L1_LO_CHULA, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCD*/ {L1_O_ANG, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCE*/ {L1_HO_NOKHUK, L2_BLANK, L3_BLANK, L4_BLANK, M | _consnt}, /*0xCF*/ {IGNORE, IGNORE, L3_PAIYAN_NOI, IGNORE, M}, /*0xD0*/ {L1_SARA_A, L2_BLANK, L3_BLANK, L4_BLANK, M | _fllwvowel}, /*0xD1*/ {L1_MAI_HAN_AKAT, L2_BLANK, L3_BLANK, L4_BLANK, U | _uprvowel}, /*0xD2*/ {L1_SARA_AA, L2_BLANK, L3_BLANK, L4_BLANK, M | _fllwvowel}, /*0xD3*/ {L1_SARA_AM, L2_BLANK, L3_BLANK, L4_BLANK, M | _fllwvowel}, /*0xD4*/ {L1_SARA_I, L2_BLANK, L3_BLANK, L4_BLANK, U | _uprvowel}, /*0xD5*/ {L1_SARA_II, L2_BLANK, L3_BLANK, L4_BLANK, U | _uprvowel}, /*0xD6*/ {L1_SARA_UE, L2_BLANK, L3_BLANK, L4_BLANK, U | _uprvowel}, /*0xD7*/ {L1_SARA_UEE, L2_BLANK, L3_BLANK, L4_BLANK, U | _uprvowel}, /*0xD8*/ {L1_SARA_U, L2_BLANK, L3_BLANK, L4_BLANK, L | _lwrvowel}, /*0xD9*/ {L1_SARA_UU, L2_BLANK, L3_BLANK, L4_BLANK, L | _lwrvowel}, /*0xDA*/ {IGNORE, L2_PINTHU, L3_BLANK, L4_BLANK, L}, /*0xDB*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xDC*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xDD*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xDE*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xDF*/ {IGNORE, IGNORE, L3_BAHT, IGNORE, M}, /*0xE0*/ {L1_SARA_E, L2_BLANK, L3_BLANK, L4_BLANK, M | _ldvowel}, /*0xE1*/ {L1_SARA_AE, L2_BLANK, L3_BLANK, L4_BLANK, M | _ldvowel}, /*0xE2*/ {L1_SARA_O, L2_BLANK, L3_BLANK, L4_BLANK, M | _ldvowel}, /*0xE3*/ {L1_SARA_AI_MAIMUAN, L2_BLANK, L3_BLANK, L4_BLANK, M | _ldvowel}, /*0xE4*/ {L1_SARA_AI_MAIMALAI, L2_BLANK, L3_BLANK, L4_BLANK, M | _ldvowel}, /*0xE5*/ {L1_SARA_AA, L2_BLANK, L3_BLANK, L4_EXT, M | _fllwvowel}, /*0xE6*/ {IGNORE, IGNORE, L3_MAI_YAMOK, IGNORE, M | _stone}, /*0xE7*/ {IGNORE, L2_TYKHU, L3_BLANK, L4_BLANK, U | _diacrt1 | _stone}, /*0xE8*/ {IGNORE, L2_TONE1, L3_BLANK, L4_BLANK, UU | _tone | _combine | _stone}, /*0xE9*/ {IGNORE, L2_TONE2, L3_BLANK, L4_BLANK, UU | _tone | _combine | _stone}, /*0xEA*/ {IGNORE, L2_TONE3, L3_BLANK, L4_BLANK, UU | _tone | _combine | _stone}, /*0xEB*/ {IGNORE, L2_TONE4, L3_BLANK, L4_BLANK, UU | _tone | _combine | _stone}, /*0xEC*/ {IGNORE, L2_GARAN, L3_BLANK, L4_BLANK, UU | _diacrt2 | _combine | _stone}, /*0xED*/ {L1_NKHIT, L2_BLANK, L3_BLANK, L4_BLANK, U | _diacrt1}, /*0xEE*/ {IGNORE, L2_YAMAK, L3_BLANK, L4_BLANK, U | _diacrt1}, /*0xEF*/ {IGNORE, IGNORE, L3_FONGMAN, IGNORE, M}, /*0xF0*/ {L1_08, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF1*/ {L1_18, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF2*/ {L1_28, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF3*/ {L1_38, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF4*/ {L1_48, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF5*/ {L1_58, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF6*/ {L1_68, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF7*/ {L1_78, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF8*/ {L1_88, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xF9*/ {L1_98, L2_THAII, L3_BLANK, L4_BLANK, M | _tdig}, /*0xFA*/ {IGNORE, IGNORE, L3_ANGKHANKHU, IGNORE, X}, /*0xFB*/ {IGNORE, IGNORE, L3_KHOMUT, IGNORE, X}, /*0xFC*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xFD*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /*0xFE*/ {IGNORE, IGNORE, IGNORE, IGNORE, X}, /* Utilize 0xFF for max_sort_chr in my_like_range_tis620 */ /*0xFF*/ {255 /*IGNORE*/, IGNORE, IGNORE, IGNORE, X}, }; static const uchar ctype_tis620[257] = { 0, /* For standard library */ 32, 32, 32, 32, 32, 32, 32, 32, 32, 40, 40, 40, 40, 40, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 72, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16, 132, 132, 132, 132, 132, 132, 132, 132, 132, 132, 16, 16, 16, 16, 16, 16, 16, 129, 129, 129, 129, 129, 129, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 16, 16, 16, 16, 16, 16, 130, 130, 130, 130, 130, 130, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 16, 16, 16, 16, 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, }; static const uchar to_lower_tis620[] = { '\000', '\001', '\002', '\003', '\004', '\005', '\006', '\007', '\010', '\011', '\012', '\013', '\014', '\015', '\016', '\017', '\020', '\021', '\022', '\023', '\024', '\025', '\026', '\027', '\030', '\031', '\032', '\033', '\034', '\035', '\036', '\037', ' ', '!', '"', '#', '$', '%', '&', '\'', '(', ')', '*', '+', ',', '-', '.', '/', '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', ':', ';', '<', '=', '>', '?', '@', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', '[', '\\', ']', '^', '_', '`', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', '{', '|', '}', '~', '\177', (uchar)'\200', (uchar)'\201', (uchar)'\202', (uchar)'\203', (uchar)'\204', (uchar)'\205', (uchar)'\206', (uchar)'\207', (uchar)'\210', (uchar)'\211', (uchar)'\212', (uchar)'\213', (uchar)'\214', (uchar)'\215', (uchar)'\216', (uchar)'\217', (uchar)'\220', (uchar)'\221', (uchar)'\222', (uchar)'\223', (uchar)'\224', (uchar)'\225', (uchar)'\226', (uchar)'\227', (uchar)'\230', (uchar)'\231', (uchar)'\232', (uchar)'\233', (uchar)'\234', (uchar)'\235', (uchar)'\236', (uchar)'\237', (uchar)'\240', (uchar)'\241', (uchar)'\242', (uchar)'\243', (uchar)'\244', (uchar)'\245', (uchar)'\246', (uchar)'\247', (uchar)'\250', (uchar)'\251', (uchar)'\252', (uchar)'\253', (uchar)'\254', (uchar)'\255', (uchar)'\256', (uchar)'\257', (uchar)'\260', (uchar)'\261', (uchar)'\262', (uchar)'\263', (uchar)'\264', (uchar)'\265', (uchar)'\266', (uchar)'\267', (uchar)'\270', (uchar)'\271', (uchar)'\272', (uchar)'\273', (uchar)'\274', (uchar)'\275', (uchar)'\276', (uchar)'\277', (uchar)'\300', (uchar)'\301', (uchar)'\302', (uchar)'\303', (uchar)'\304', (uchar)'\305', (uchar)'\306', (uchar)'\307', (uchar)'\310', (uchar)'\311', (uchar)'\312', (uchar)'\313', (uchar)'\314', (uchar)'\315', (uchar)'\316', (uchar)'\317', (uchar)'\320', (uchar)'\321', (uchar)'\322', (uchar)'\323', (uchar)'\324', (uchar)'\325', (uchar)'\326', (uchar)'\327', (uchar)'\330', (uchar)'\331', (uchar)'\332', (uchar)'\333', (uchar)'\334', (uchar)'\335', (uchar)'\336', (uchar)'\337', (uchar)'\340', (uchar)'\341', (uchar)'\342', (uchar)'\343', (uchar)'\344', (uchar)'\345', (uchar)'\346', (uchar)'\347', (uchar)'\350', (uchar)'\351', (uchar)'\352', (uchar)'\353', (uchar)'\354', (uchar)'\355', (uchar)'\356', (uchar)'\357', (uchar)'\360', (uchar)'\361', (uchar)'\362', (uchar)'\363', (uchar)'\364', (uchar)'\365', (uchar)'\366', (uchar)'\367', (uchar)'\370', (uchar)'\371', (uchar)'\372', (uchar)'\373', (uchar)'\374', (uchar)'\375', (uchar)'\376', (uchar)'\377', }; static const uchar to_upper_tis620[] = { '\000', '\001', '\002', '\003', '\004', '\005', '\006', '\007', '\010', '\011', '\012', '\013', '\014', '\015', '\016', '\017', '\020', '\021', '\022', '\023', '\024', '\025', '\026', '\027', '\030', '\031', '\032', '\033', '\034', '\035', '\036', '\037', ' ', '!', '"', '#', '$', '%', '&', '\'', '(', ')', '*', '+', ',', '-', '.', '/', '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', ':', ';', '<', '=', '>', '?', '@', 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', '[', '\\', ']', '^', '_', '`', 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', '{', '|', '}', '~', '\177', (uchar)'\200', (uchar)'\201', (uchar)'\202', (uchar)'\203', (uchar)'\204', (uchar)'\205', (uchar)'\206', (uchar)'\207', (uchar)'\210', (uchar)'\211', (uchar)'\212', (uchar)'\213', (uchar)'\214', (uchar)'\215', (uchar)'\216', (uchar)'\217', (uchar)'\220', (uchar)'\221', (uchar)'\222', (uchar)'\223', (uchar)'\224', (uchar)'\225', (uchar)'\226', (uchar)'\227', (uchar)'\230', (uchar)'\231', (uchar)'\232', (uchar)'\233', (uchar)'\234', (uchar)'\235', (uchar)'\236', (uchar)'\237', (uchar)'\240', (uchar)'\241', (uchar)'\242', (uchar)'\243', (uchar)'\244', (uchar)'\245', (uchar)'\246', (uchar)'\247', (uchar)'\250', (uchar)'\251', (uchar)'\252', (uchar)'\253', (uchar)'\254', (uchar)'\255', (uchar)'\256', (uchar)'\257', (uchar)'\260', (uchar)'\261', (uchar)'\262', (uchar)'\263', (uchar)'\264', (uchar)'\265', (uchar)'\266', (uchar)'\267', (uchar)'\270', (uchar)'\271', (uchar)'\272', (uchar)'\273', (uchar)'\274', (uchar)'\275', (uchar)'\276', (uchar)'\277', (uchar)'\300', (uchar)'\301', (uchar)'\302', (uchar)'\303', (uchar)'\304', (uchar)'\305', (uchar)'\306', (uchar)'\307', (uchar)'\310', (uchar)'\311', (uchar)'\312', (uchar)'\313', (uchar)'\314', (uchar)'\315', (uchar)'\316', (uchar)'\317', (uchar)'\320', (uchar)'\321', (uchar)'\322', (uchar)'\323', (uchar)'\324', (uchar)'\325', (uchar)'\326', (uchar)'\327', (uchar)'\330', (uchar)'\331', (uchar)'\332', (uchar)'\333', (uchar)'\334', (uchar)'\335', (uchar)'\336', (uchar)'\337', (uchar)'\340', (uchar)'\341', (uchar)'\342', (uchar)'\343', (uchar)'\344', (uchar)'\345', (uchar)'\346', (uchar)'\347', (uchar)'\350', (uchar)'\351', (uchar)'\352', (uchar)'\353', (uchar)'\354', (uchar)'\355', (uchar)'\356', (uchar)'\357', (uchar)'\360', (uchar)'\361', (uchar)'\362', (uchar)'\363', (uchar)'\364', (uchar)'\365', (uchar)'\366', (uchar)'\367', (uchar)'\370', (uchar)'\371', (uchar)'\372', (uchar)'\373', (uchar)'\374', (uchar)'\375', (uchar)'\376', (uchar)'\377', }; static const uchar sort_order_tis620[] = { '\000', '\001', '\002', '\003', '\004', '\005', '\006', '\007', '\010', '\011', '\012', '\013', '\014', '\015', '\016', '\017', '\020', '\021', '\022', '\023', '\024', '\025', '\026', '\027', '\030', '\031', '\032', '\033', '\034', '\035', '\036', '\037', ' ', '!', '"', '#', '$', '%', '&', '\'', '(', ')', '*', '+', ',', '-', '.', '/', '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', ':', ';', '<', '=', '>', '?', '@', 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', '\\', ']', '[', '^', '_', 'E', 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', '{', '|', '}', 'Y', '\177', (uchar)'\200', (uchar)'\201', (uchar)'\202', (uchar)'\203', (uchar)'\204', (uchar)'\205', (uchar)'\206', (uchar)'\207', (uchar)'\210', (uchar)'\211', (uchar)'\212', (uchar)'\213', (uchar)'\214', (uchar)'\215', (uchar)'\216', (uchar)'\217', (uchar)'\220', (uchar)'\221', (uchar)'\222', (uchar)'\223', (uchar)'\224', (uchar)'\225', (uchar)'\226', (uchar)'\227', (uchar)'\230', (uchar)'\231', (uchar)'\232', (uchar)'\233', (uchar)'\234', (uchar)'\235', (uchar)'\236', (uchar)'\237', (uchar)'\240', (uchar)'\241', (uchar)'\242', (uchar)'\243', (uchar)'\244', (uchar)'\245', (uchar)'\246', (uchar)'\247', (uchar)'\250', (uchar)'\251', (uchar)'\252', (uchar)'\253', (uchar)'\254', (uchar)'\255', (uchar)'\256', (uchar)'\257', (uchar)'\260', (uchar)'\261', (uchar)'\262', (uchar)'\263', (uchar)'\264', (uchar)'\265', (uchar)'\266', (uchar)'\267', (uchar)'\270', (uchar)'\271', (uchar)'\272', (uchar)'\273', (uchar)'\274', (uchar)'\275', (uchar)'\276', (uchar)'\277', (uchar)'\300', (uchar)'\301', (uchar)'\302', (uchar)'\303', (uchar)'\304', (uchar)'\305', (uchar)'\306', (uchar)'\307', (uchar)'\310', (uchar)'\311', (uchar)'\312', (uchar)'\313', (uchar)'\314', (uchar)'\315', (uchar)'\316', (uchar)'\317', (uchar)'\320', (uchar)'\321', (uchar)'\322', (uchar)'\323', (uchar)'\324', (uchar)'\325', (uchar)'\326', (uchar)'\327', (uchar)'\330', (uchar)'\331', (uchar)'\332', (uchar)'\333', (uchar)'\334', (uchar)'\335', (uchar)'\336', (uchar)'\337', (uchar)'\340', (uchar)'\341', (uchar)'\342', (uchar)'\343', (uchar)'\344', (uchar)'\345', (uchar)'\346', (uchar)'\347', (uchar)'\350', (uchar)'\351', (uchar)'\352', (uchar)'\353', (uchar)'\354', (uchar)'\355', (uchar)'\356', (uchar)'\357', (uchar)'\360', (uchar)'\361', (uchar)'\362', (uchar)'\363', (uchar)'\364', (uchar)'\365', (uchar)'\366', (uchar)'\367', (uchar)'\370', (uchar)'\371', (uchar)'\372', (uchar)'\373', (uchar)'\374', (uchar)'\375', (uchar)'\376', (uchar)'\377', }; /* Convert thai string to "Standard C String Function" sortable string SYNOPSIS thai2sortable() tstr String to convert. Does not have to end with \0 len Length of tstr */ static size_t thai2sortable(uchar *tstr, size_t len) { uchar *p; size_t tlen; uchar l2bias; tlen = len; l2bias = 256 - 8; for (p = tstr; tlen > 0; p++, tlen--) { uchar c = *p; if (isthai(c)) { const int *t_ctype0 = t_ctype[c]; if (isconsnt(c)) l2bias -= 8; if (isldvowel(c) && tlen != 1 && isconsnt(p[1])) { /* simply swap between leading-vowel and consonant */ *p = p[1]; p[1] = c; tlen--; p++; continue; } /* if found level 2 char (L2_GARAN,L2_TONE*,L2_TYKHU) move to last */ if (t_ctype0[1] >= L2_GARAN) { /* l2bias use to control position weight of l2char example (*=l2char) XX*X must come before X*XX */ memmove((char *)p, (char *)(p + 1), tlen - 1); tstr[len - 1] = l2bias + t_ctype0[1] - L2_GARAN + 1; p--; continue; } } else { l2bias -= 8; *p = to_lower_tis620[c]; } } return len; } /* strncoll() replacement, compare 2 string, both are converted to sortable string NOTE: We can't cut strings at end \0 as this would break comparision with LIKE characters, where the min range is stored as end \0 Arg: 2 Strings and it compare length Ret: strcmp result */ extern "C" { static int my_strnncoll_tis620(const CHARSET_INFO *cs MY_ATTRIBUTE((unused)), const uchar *s1, size_t len1, const uchar *s2, size_t len2, bool s2_is_prefix) { uchar buf[80]; uchar *tc1, *tc2; int i; if (s2_is_prefix && len1 > len2) len1 = len2; tc1 = buf; if ((len1 + len2 + 2) > (int)sizeof(buf)) tc1 = static_cast(my_str_malloc(len1 + len2 + 2)); tc2 = tc1 + len1 + 1; memcpy(tc1, s1, len1); tc1[len1] = 0; /* if length(s1)> len1, need to put 'end of string' */ memcpy(tc2, s2, len2); tc2[len2] = 0; /* put end of string */ thai2sortable(tc1, len1); thai2sortable(tc2, len2); i = strcmp((char *)tc1, (char *)tc2); if (tc1 != buf) my_str_free(tc1); return i; } static int my_strnncollsp_tis620(const CHARSET_INFO *cs MY_ATTRIBUTE((unused)), const uchar *a0, size_t a_length, const uchar *b0, size_t b_length) { uchar buf[80], *end, *a, *b, *alloced = NULL; size_t length; int res = 0; a = buf; if ((a_length + b_length + 2) > (int)sizeof(buf)) alloced = a = (uchar *)my_str_malloc(a_length + b_length + 2); b = a + a_length + 1; memcpy(a, a0, a_length); a[a_length] = 0; /* if length(a0)> len1, need to put 'end of string' */ memcpy(b, b0, b_length); b[b_length] = 0; /* put end of string */ a_length = thai2sortable(a, a_length); b_length = thai2sortable(b, b_length); end = a + (length = MY_MIN(a_length, b_length)); while (a < end) { if (*a++ != *b++) { res = ((int)a[-1] - (int)b[-1]); goto ret; } } if (a_length != b_length) { int swap = 1; /* Check the next not space character of the longer key. If it's < ' ', then it's smaller than the other key. */ if (a_length < b_length) { /* put shorter key in s */ a_length = b_length; a = b; swap = -1; /* swap sign of result */ res = -res; } for (end = a + a_length - length; a < end; a++) { if (*a != ' ') { res = (*a < ' ') ? -swap : swap; goto ret; } } } ret: if (alloced) my_str_free(alloced); return res; } /* strnxfrm replacment, convert Thai string to sortable string Arg: Destination buffer, source string, dest length and source length Ret: Conveted string size */ static size_t my_strnxfrm_tis620(const CHARSET_INFO *cs, uchar *dst, size_t dstlen, uint nweights, const uchar *src, size_t srclen, uint flags) { size_t dstlen0 = dstlen; size_t min_len = MY_MIN(dstlen, srclen); size_t len = 0; /* We don't use strmake here, since it requires one more character for the terminating '\0', while this function itself and the following calling functions do not require it */ while (len < min_len) { if (!(dst[len] = src[len])) break; len++; } len = thai2sortable(dst, len); set_if_smaller(dstlen, nweights); set_if_smaller(len, dstlen); len = my_strxfrm_pad(cs, dst, dst + len, dst + dstlen, (uint)(dstlen - len), flags); if ((flags & MY_STRXFRM_PAD_TO_MAXLEN) && len < dstlen0) { size_t fill_length = dstlen0 - len; cs->cset->fill(cs, (char *)dst + len, fill_length, cs->pad_char); len = dstlen0; } return len; } } // extern "C" static const unsigned short cs_to_uni[256] = { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0005, 0x0006, 0x0007, 0x0008, 0x0009, 0x000A, 0x000B, 0x000C, 0x000D, 0x000E, 0x000F, 0x0010, 0x0011, 0x0012, 0x0013, 0x0014, 0x0015, 0x0016, 0x0017, 0x0018, 0x0019, 0x001A, 0x001B, 0x001C, 0x001D, 0x001E, 0x001F, 0x0020, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x0027, 0x0028, 0x0029, 0x002A, 0x002B, 0x002C, 0x002D, 0x002E, 0x002F, 0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037, 0x0038, 0x0039, 0x003A, 0x003B, 0x003C, 0x003D, 0x003E, 0x003F, 0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x005B, 0x005C, 0x005D, 0x005E, 0x005F, 0x0060, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067, 0x0068, 0x0069, 0x006A, 0x006B, 0x006C, 0x006D, 0x006E, 0x006F, 0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077, 0x0078, 0x0079, 0x007A, 0x007B, 0x007C, 0x007D, 0x007E, 0x007F, 0x0080, 0x0081, 0x0082, 0x0083, 0x0084, 0x0085, 0x0086, 0x0087, 0x0088, 0x0089, 0x008A, 0x008B, 0x008C, 0x008D, 0x008E, 0x008F, 0x0090, 0x0091, 0x0092, 0x0093, 0x0094, 0x0095, 0x0096, 0x0097, 0x0098, 0x0099, 0x009A, 0x009B, 0x009C, 0x009D, 0x009E, 0x009F, 0xFFFD, 0x0E01, 0x0E02, 0x0E03, 0x0E04, 0x0E05, 0x0E06, 0x0E07, 0x0E08, 0x0E09, 0x0E0A, 0x0E0B, 0x0E0C, 0x0E0D, 0x0E0E, 0x0E0F, 0x0E10, 0x0E11, 0x0E12, 0x0E13, 0x0E14, 0x0E15, 0x0E16, 0x0E17, 0x0E18, 0x0E19, 0x0E1A, 0x0E1B, 0x0E1C, 0x0E1D, 0x0E1E, 0x0E1F, 0x0E20, 0x0E21, 0x0E22, 0x0E23, 0x0E24, 0x0E25, 0x0E26, 0x0E27, 0x0E28, 0x0E29, 0x0E2A, 0x0E2B, 0x0E2C, 0x0E2D, 0x0E2E, 0x0E2F, 0x0E30, 0x0E31, 0x0E32, 0x0E33, 0x0E34, 0x0E35, 0x0E36, 0x0E37, 0x0E38, 0x0E39, 0x0E3A, 0xFFFD, 0xFFFD, 0xFFFD, 0xFFFD, 0x0E3F, 0x0E40, 0x0E41, 0x0E42, 0x0E43, 0x0E44, 0x0E45, 0x0E46, 0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D, 0x0E4E, 0x0E4F, 0x0E50, 0x0E51, 0x0E52, 0x0E53, 0x0E54, 0x0E55, 0x0E56, 0x0E57, 0x0E58, 0x0E59, 0x0E5A, 0x0E5B, 0xFFFD, 0xFFFD, 0xFFFD, 0xFFFD}; static const uchar pl00[256] = { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0005, 0x0006, 0x0007, 0x0008, 0x0009, 0x000A, 0x000B, 0x000C, 0x000D, 0x000E, 0x000F, 0x0010, 0x0011, 0x0012, 0x0013, 0x0014, 0x0015, 0x0016, 0x0017, 0x0018, 0x0019, 0x001A, 0x001B, 0x001C, 0x001D, 0x001E, 0x001F, 0x0020, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x0027, 0x0028, 0x0029, 0x002A, 0x002B, 0x002C, 0x002D, 0x002E, 0x002F, 0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037, 0x0038, 0x0039, 0x003A, 0x003B, 0x003C, 0x003D, 0x003E, 0x003F, 0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x005B, 0x005C, 0x005D, 0x005E, 0x005F, 0x0060, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067, 0x0068, 0x0069, 0x006A, 0x006B, 0x006C, 0x006D, 0x006E, 0x006F, 0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077, 0x0078, 0x0079, 0x007A, 0x007B, 0x007C, 0x007D, 0x007E, 0x007F, 0x0080, 0x0081, 0x0082, 0x0083, 0x0084, 0x0085, 0x0086, 0x0087, 0x0088, 0x0089, 0x008A, 0x008B, 0x008C, 0x008D, 0x008E, 0x008F, 0x0090, 0x0091, 0x0092, 0x0093, 0x0094, 0x0095, 0x0096, 0x0097, 0x0098, 0x0099, 0x009A, 0x009B, 0x009C, 0x009D, 0x009E, 0x009F, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000}; static const uchar pl0E[256] = { 0x0000, 0x00A1, 0x00A2, 0x00A3, 0x00A4, 0x00A5, 0x00A6, 0x00A7, 0x00A8, 0x00A9, 0x00AA, 0x00AB, 0x00AC, 0x00AD, 0x00AE, 0x00AF, 0x00B0, 0x00B1, 0x00B2, 0x00B3, 0x00B4, 0x00B5, 0x00B6, 0x00B7, 0x00B8, 0x00B9, 0x00BA, 0x00BB, 0x00BC, 0x00BD, 0x00BE, 0x00BF, 0x00C0, 0x00C1, 0x00C2, 0x00C3, 0x00C4, 0x00C5, 0x00C6, 0x00C7, 0x00C8, 0x00C9, 0x00CA, 0x00CB, 0x00CC, 0x00CD, 0x00CE, 0x00CF, 0x00D0, 0x00D1, 0x00D2, 0x00D3, 0x00D4, 0x00D5, 0x00D6, 0x00D7, 0x00D8, 0x00D9, 0x00DA, 0x0000, 0x0000, 0x0000, 0x0000, 0x00DF, 0x00E0, 0x00E1, 0x00E2, 0x00E3, 0x00E4, 0x00E5, 0x00E6, 0x00E7, 0x00E8, 0x00E9, 0x00EA, 0x00EB, 0x00EC, 0x00ED, 0x00EE, 0x00EF, 0x00F0, 0x00F1, 0x00F2, 0x00F3, 0x00F4, 0x00F5, 0x00F6, 0x00F7, 0x00F8, 0x00F9, 0x00FA, 0x00FB, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000}; static const uchar plFF[256] = { 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x00FF, 0x0000, 0x0000}; static const uchar *uni_to_cs[256] = { pl00, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, pl0E, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, plFF}; extern "C" { static int my_mb_wc_tis620(const CHARSET_INFO *cs MY_ATTRIBUTE((unused)), my_wc_t *wc, const uchar *str, const uchar *end) { if (str >= end) return MY_CS_TOOSMALL; *wc = cs_to_uni[*str]; return (!wc[0] && str[0]) ? -1 : 1; } static int my_wc_mb_tis620(const CHARSET_INFO *cs MY_ATTRIBUTE((unused)), my_wc_t wc, uchar *str, uchar *end) { const uchar *pl; if (str >= end) return MY_CS_TOOSMALL; pl = uni_to_cs[(wc >> 8) & 0xFF]; str[0] = pl ? pl[wc & 0xFF] : '\0'; return (!str[0] && wc) ? MY_CS_ILUNI : 1; } } // extern "C" static MY_COLLATION_HANDLER my_collation_ci_handler = { nullptr, /* init */ nullptr, my_strnncoll_tis620, my_strnncollsp_tis620, my_strnxfrm_tis620, my_strnxfrmlen_simple, my_like_range_simple, my_wildcmp_8bit, /* wildcmp */ my_strcasecmp_8bit, my_instr_simple, /* QQ: To be fixed */ my_hash_sort_simple, my_propagate_simple}; static MY_CHARSET_HANDLER my_charset_handler = { NULL, /* init */ NULL, /* ismbchar */ my_mbcharlen_8bit, /* mbcharlen */ my_numchars_8bit, my_charpos_8bit, my_well_formed_len_8bit, my_lengthsp_8bit, my_numcells_8bit, my_mb_wc_tis620, /* mb_wc */ my_wc_mb_tis620, /* wc_mb */ my_mb_ctype_8bit, my_caseup_str_8bit, my_casedn_str_8bit, my_caseup_8bit, my_casedn_8bit, my_snprintf_8bit, my_long10_to_str_8bit, my_longlong10_to_str_8bit, my_fill_8bit, my_strntol_8bit, my_strntoul_8bit, my_strntoll_8bit, my_strntoull_8bit, my_strntod_8bit, my_strtoll10_8bit, my_strntoull10rnd_8bit, my_scan_8bit}; CHARSET_INFO my_charset_tis620_thai_ci = { 18, 0, 0, /* number */ MY_CS_COMPILED | MY_CS_PRIMARY | MY_CS_STRNXFRM, /* state */ "tis620", /* cs name */ "tis620_thai_ci", /* name */ "", /* comment */ NULL, /* tailoring */ NULL, /* coll_param */ ctype_tis620, to_lower_tis620, to_upper_tis620, sort_order_tis620, NULL, /* uca */ NULL, /* tab_to_uni */ NULL, /* tab_from_uni */ &my_unicase_default, /* caseinfo */ NULL, /* state_map */ NULL, /* ident_map */ 4, /* strxfrm_multiply */ 1, /* caseup_multiply */ 1, /* casedn_multiply */ 1, /* mbminlen */ 1, /* mbmaxlen */ 1, /* mbmaxlenlen */ 0, /* min_sort_char */ 255, /* max_sort_char */ ' ', /* pad char */ 0, /* escape_with_backslash_is_dangerous */ 1, /* levels_for_compare */ &my_charset_handler, &my_collation_ci_handler, PAD_SPACE}; CHARSET_INFO my_charset_tis620_bin = { 89, 0, 0, /* number */ MY_CS_COMPILED | MY_CS_BINSORT, /* state */ "tis620", /* cs name */ "tis620_bin", /* name */ "", /* comment */ NULL, /* tailoring */ NULL, /* coll_param */ ctype_tis620, to_lower_tis620, to_upper_tis620, NULL, /* sort_order */ NULL, /* uca */ NULL, /* tab_to_uni */ NULL, /* tab_from_uni */ &my_unicase_default, /* caseinfo */ NULL, /* state_map */ NULL, /* ident_map */ 1, /* strxfrm_multiply */ 1, /* caseup_multiply */ 1, /* casedn_multiply */ 1, /* mbminlen */ 1, /* mbmaxlen */ 1, /* mbmaxlenlen */ 0, /* min_sort_char */ 255, /* max_sort_char */ ' ', /* pad char */ 0, /* escape_with_backslash_is_dangerous */ 1, /* levels_for_compare */ &my_charset_handler, &my_collation_8bit_bin_handler, PAD_SPACE};