* include/hbdefs.h
+ added new types HB_WCHAR16 and HB_WCHAR32, existing type HB_WCHAR
is mapped to HB_WCHAR16 (just like before)
* include/hbapicdp.h
* src/harbour.def
* src/rtl/cdpapi.c
+ added new C functions for encoding and decoding UTF-8 string using
which HB_WCHAR32:
int hb_cdpU32CharToUTF8( char * szUTF8, HB_WCHAR32 wc );
HB_BOOL hb_cdpUTF8GetU32( const char * pSrc, HB_SIZE nLen,
HB_SIZE * pnIndex, HB_WCHAR32 * pWC );
HB_BOOL hb_cdpUTF8GetUCS( const char * pSrc, HB_SIZE nLen,
HB_SIZE * pnIndex, HB_WCHAR32 * pWC );
HB_BOOL hb_cdpUTF8GetU16( const char * pSrc, HB_SIZE nLen,
HB_SIZE * pnIndex, HB_WCHAR16 * pWC );
HB_BOOL hb_cdpUTF8Validate( const char * pSrc, HB_SIZE nLen );
They support full UCS and are much more restrictive against errors and
wrong UTF-8 encoding, i.e. now overlong encoding is forbidden.
The wrong characters are translated to 0xFFFD and later if such
character does not exist in final CP to '?' ASCII character.
* declaration of the following UTF-8 C functions have been changed to
operate on HB_WCHAR32 instead of HB_WCHAR:
int hb_cdpUTF8CharSize( HB_WCHAR32 wc );
HB_WCHAR32 hb_cdpUTF8StringPeek( const char * pSrc, HB_SIZE nLen,
HB_SIZE nPos );
* the following C functions have been changed to internally operate on
HB_WCHAR32 instead of HB_WCHAR:
hb_cdpUTF8StringLength()
hb_cdpUTF8StringAt()
hb_cdpUTF8StringSubstr()
* the following C functions have been changed to use new hb_cdpUTF8GetU*()
instead of step by step decoding with hb_cdpUTF8ToU16NextChar()
hb_cdpStrToUTF8Disp()
hb_cdpUTF8AsStrLen()
hb_cdpUTF8ToStr()
hb_cdpStrToU16()
hb_cdpUtf8Char()
* use HB_CDP_ERROR_* macros to mark wrong encoding
* src/rtl/cdpapihb.c
* the following UTF-8 C functions have been changed to operate on
HB_WCHAR32 instead of HB_WCHAR:
hb_utf8Chr()
hb_utf8Asc()
hb_utf8Poke()
hb_utf8Peek()
Other UTF-8 PRG functions have been adopted to HB_WCHAR32 by changes
in corresponding C functions.
* src/codepage/cp_utf8.c
* use new function hb_cdpUTF8GetU16() to decode UTF-8 strings in UTF8EX CP
* src/rtl/arc4.c
+ added new macro HB_NO_SYSCTL which allow to disable sysctl() in Linux
builds for GLIBC < 2.30
536 lines
25 KiB
C
536 lines
25 KiB
C
/*
|
|
* Header file for the CodePages API
|
|
*
|
|
* Copyright 2002 Alexander S.Kresin <alex@belacy.belgorod.su>
|
|
* Copyright 2009 Przemyslaw Czerpak <druzus / at / priv.onet.pl>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2, or (at your option)
|
|
* any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; see the file LICENSE.txt. If not, write to
|
|
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
|
|
* Boston, MA 02110-1301 USA (or visit https://www.gnu.org/licenses/).
|
|
*
|
|
* As a special exception, the Harbour Project gives permission for
|
|
* additional uses of the text contained in its release of Harbour.
|
|
*
|
|
* The exception is that, if you link the Harbour libraries with other
|
|
* files to produce an executable, this does not by itself cause the
|
|
* resulting executable to be covered by the GNU General Public License.
|
|
* Your use of that executable is in no way restricted on account of
|
|
* linking the Harbour library code into it.
|
|
*
|
|
* This exception does not however invalidate any other reasons why
|
|
* the executable file might be covered by the GNU General Public License.
|
|
*
|
|
* This exception applies only to the code released by the Harbour
|
|
* Project under the name Harbour. If you copy code from other
|
|
* Harbour Project or Free Software Foundation releases into a copy of
|
|
* Harbour, as the General Public License permits, the exception does
|
|
* not apply to the code that you add in this way. To avoid misleading
|
|
* anyone as to the status of such modified files, you must delete
|
|
* this exception notice from them.
|
|
*
|
|
* If you write modifications of your own for Harbour, it is your choice
|
|
* whether to permit this exception to apply to your modifications.
|
|
* If you do not wish that, delete this exception notice.
|
|
*
|
|
*/
|
|
|
|
#ifndef HB_APICDP_H_
|
|
#define HB_APICDP_H_
|
|
|
|
#include "hbapi.h"
|
|
#include "hbinit.h"
|
|
|
|
HB_EXTERN_BEGIN
|
|
|
|
/* This hack is needed to force preprocessing if id is also a macro */
|
|
#define HB_CODEPAGE_REQUEST( id ) HB_CODEPAGE_REQUEST_( id )
|
|
#define HB_CODEPAGE_REQUEST_( id ) HB_FUNC_EXTERN( HB_CODEPAGE_##id ); \
|
|
extern void hb_codepage_ForceLink_##id( void ); \
|
|
void hb_codepage_ForceLink_##id( void ) \
|
|
{ \
|
|
HB_FUNC_EXEC( HB_CODEPAGE_##id ); \
|
|
}
|
|
#define HB_CODEPAGE_ANNOUNCE( id ) HB_CODEPAGE_ANNOUNCE_( id )
|
|
#define HB_CODEPAGE_ANNOUNCE_( id ) HB_FUNC( HB_CODEPAGE_##id ) {}
|
|
|
|
|
|
/* forward declaration */
|
|
struct _HB_CODEPAGE;
|
|
|
|
#define _PHB_CODEPAGE struct _HB_CODEPAGE *
|
|
|
|
#define HB_CDPCHAR_GET( c, s, n, i, w ) (c)->wcharGet( c, s, n, i, w )
|
|
#define HB_CDPCHAR_PUT( c, s, n, i, w ) (c)->wcharPut( c, s, n, i, w )
|
|
#define HB_CDPCHAR_LEN( c, w ) (c)->wcharLen( c, w )
|
|
#define HB_CDPCHAR_UPPER( c, w ) (c)->wcharUpper( c, w )
|
|
#define HB_CDPCHAR_LOWER( c, w ) (c)->wcharLower( c, w )
|
|
#define HB_CDPCHAR_FLAGS( c, w ) (c)->wcharFlags( c, w )
|
|
#define HB_CDPCHAR_CMP( c, s1, n1, s2, n2, e ) (c)->wcharCmp( c, s1, n1, s2, n2, e )
|
|
#define HB_CDPCHAR_CMPI( c, s1, n1, s2, n2, e ) (c)->wcharCmpI( c, s1, n1, s2, n2, e )
|
|
|
|
#define HB_CDP_GET_FUNC( func ) HB_BOOL func( _PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nLen, HB_SIZE * pnIndex, HB_WCHAR * wc )
|
|
typedef HB_CDP_GET_FUNC( ( * PHB_CDP_GET_FUNC ) );
|
|
|
|
#define HB_CDP_PUT_FUNC( func ) HB_BOOL func( _PHB_CODEPAGE cdp, char * pDst, HB_SIZE nLen, HB_SIZE * pnIndex, HB_WCHAR wc )
|
|
typedef HB_CDP_PUT_FUNC( ( * PHB_CDP_PUT_FUNC ) );
|
|
|
|
#define HB_CDP_LEN_FUNC( func ) int func( _PHB_CODEPAGE cdp, HB_WCHAR wc )
|
|
typedef HB_CDP_LEN_FUNC( ( * PHB_CDP_LEN_FUNC ) );
|
|
|
|
#define HB_CDP_UPPER_FUNC( func ) HB_WCHAR func( _PHB_CODEPAGE cdp, HB_WCHAR wc )
|
|
typedef HB_CDP_UPPER_FUNC( ( * PHB_CDP_UPPER_FUNC ) );
|
|
|
|
#define HB_CDP_LOWER_FUNC( func ) HB_WCHAR func( _PHB_CODEPAGE cdp, HB_WCHAR wc )
|
|
typedef HB_CDP_LOWER_FUNC( ( * PHB_CDP_LOWER_FUNC ) );
|
|
|
|
#define HB_CDP_FLAGS_FUNC( func ) int func( _PHB_CODEPAGE cdp, HB_WCHAR wc )
|
|
typedef HB_CDP_FLAGS_FUNC( ( * PHB_CDP_FLAGS_FUNC ) );
|
|
|
|
#define HB_CDP_CMP_FUNC( func ) int func( _PHB_CODEPAGE cdp, const char * szFirst, HB_SIZE nLenFirst, const char * szSecond, HB_SIZE nLenSecond, HB_BOOL fExact )
|
|
typedef HB_CDP_CMP_FUNC( ( * PHB_CDP_CMP_FUNC ) );
|
|
|
|
|
|
typedef struct _HB_UNITABLE
|
|
{
|
|
const char * uniID;
|
|
const HB_WCHAR * uniCodes;
|
|
HB_UCHAR * uniTrans;
|
|
HB_WCHAR wcMax;
|
|
} HB_UNITABLE, * PHB_UNITABLE;
|
|
|
|
typedef struct _HB_MULTICHAR
|
|
{
|
|
char cFirst[ 2 ];
|
|
char cLast[ 2 ];
|
|
int sortUp;
|
|
int sortLo;
|
|
HB_WCHAR wcUp;
|
|
HB_WCHAR wcLo;
|
|
} HB_MULTICHAR, * PHB_MULTICHAR;
|
|
|
|
typedef struct _HB_CODEPAGE
|
|
{
|
|
const char * id;
|
|
const char * info;
|
|
PHB_UNITABLE uniTable;
|
|
const HB_UCHAR * flags;
|
|
const HB_UCHAR * upper;
|
|
const HB_UCHAR * lower;
|
|
const HB_UCHAR * sort;
|
|
const HB_UCHAR * acc;
|
|
int nACSort;
|
|
int type;
|
|
PHB_CDP_GET_FUNC wcharGet;
|
|
PHB_CDP_PUT_FUNC wcharPut;
|
|
PHB_CDP_LEN_FUNC wcharLen;
|
|
PHB_CDP_UPPER_FUNC wcharUpper;
|
|
PHB_CDP_LOWER_FUNC wcharLower;
|
|
PHB_CDP_FLAGS_FUNC wcharFlags;
|
|
PHB_CDP_CMP_FUNC wcharCmp;
|
|
PHB_CDP_CMP_FUNC wcharCmpI;
|
|
int nMulti;
|
|
int nMultiUC;
|
|
PHB_MULTICHAR multi;
|
|
void * buffer;
|
|
struct _HB_CODEPAGE * next;
|
|
} HB_CODEPAGE, * PHB_CODEPAGE;
|
|
|
|
#define HB_CPID_437 "cp437"
|
|
#define HB_CPID_737 "cp737"
|
|
#define HB_CPID_775 "cp775"
|
|
#define HB_CPID_850 "cp850"
|
|
#define HB_CPID_852 "cp852"
|
|
#define HB_CPID_855 "cp855"
|
|
#define HB_CPID_857 "cp857"
|
|
#define HB_CPID_858 "cp858"
|
|
#define HB_CPID_860 "cp860"
|
|
#define HB_CPID_861 "cp861"
|
|
#define HB_CPID_862 "cp862"
|
|
#define HB_CPID_863 "cp863"
|
|
#define HB_CPID_864 "cp864"
|
|
#define HB_CPID_865 "cp865"
|
|
#define HB_CPID_866 "cp866"
|
|
#define HB_CPID_869 "cp869"
|
|
#define HB_CPID_874 "cp874"
|
|
#define HB_CPID_1125 "cp1125"
|
|
#define HB_CPID_1250 "cp1250"
|
|
#define HB_CPID_1251 "cp1251"
|
|
#define HB_CPID_1252 "cp1252"
|
|
#define HB_CPID_1253 "cp1253"
|
|
#define HB_CPID_1254 "cp1254"
|
|
#define HB_CPID_1255 "cp1255"
|
|
#define HB_CPID_1256 "cp1256"
|
|
#define HB_CPID_1257 "cp1257"
|
|
#define HB_CPID_1258 "cp1258"
|
|
#define HB_CPID_8859_1 "iso8859-1"
|
|
#define HB_CPID_8859_1B "iso8859-1b"
|
|
#define HB_CPID_8859_2 "iso8859-2"
|
|
#define HB_CPID_8859_3 "iso8859-3"
|
|
#define HB_CPID_8859_4 "iso8859-4"
|
|
#define HB_CPID_8859_5 "iso8859-5"
|
|
#define HB_CPID_8859_6 "iso8859-6"
|
|
#define HB_CPID_8859_7 "iso8859-7"
|
|
#define HB_CPID_8859_8 "iso8859-8"
|
|
#define HB_CPID_8859_9 "iso8859-9"
|
|
#define HB_CPID_8859_10 "iso8859-10"
|
|
#define HB_CPID_8859_11 "iso8859-11"
|
|
#define HB_CPID_8859_13 "iso8859-13"
|
|
#define HB_CPID_8859_14 "iso8859-14"
|
|
#define HB_CPID_8859_15 "iso8859-15"
|
|
#define HB_CPID_8859_16 "iso8859-16"
|
|
#define HB_CPID_KOI_8 "koi-8"
|
|
#define HB_CPID_KOI_8U "koi-8u"
|
|
#define HB_CPID_KAM "kamenicky"
|
|
#define HB_CPID_MAZ "mazovia"
|
|
#define HB_CPID_MIK "bg-mik"
|
|
#define HB_CPID_037 "cp037"
|
|
#define HB_CPID_424 "cp424"
|
|
#define HB_CPID_500 "cp500"
|
|
#define HB_CPID_856 "cp856"
|
|
#define HB_CPID_875 "cp875"
|
|
#define HB_CPID_1006 "cp1006"
|
|
#define HB_CPID_1026 "cp1026"
|
|
#define HB_CPID_10000 "macroman"
|
|
#define HB_CPID_10006 "macgreek"
|
|
#define HB_CPID_10007 "maccyrillic"
|
|
#define HB_CPID_10029 "maccentraleurope"
|
|
#define HB_CPID_10079 "maciceland"
|
|
#define HB_CPID_10081 "macturkish"
|
|
#define HB_CPID_ATARIST "atarist"
|
|
#define HB_CPID_NEXTSTEP "nextstep"
|
|
#define HB_CPID_USASCII "us-ascii"
|
|
#define HB_CPID_646YU "iso646-yu"
|
|
#define HB_CPID_646YUC "iso646-yuc"
|
|
|
|
#define HB_UNITB_437 &hb_uniTbl_437
|
|
#define HB_UNITB_737 &hb_uniTbl_737
|
|
#define HB_UNITB_775 &hb_uniTbl_775
|
|
#define HB_UNITB_850 &hb_uniTbl_850
|
|
#define HB_UNITB_852 &hb_uniTbl_852
|
|
#define HB_UNITB_855 &hb_uniTbl_855
|
|
#define HB_UNITB_857 &hb_uniTbl_857
|
|
#define HB_UNITB_858 &hb_uniTbl_858
|
|
#define HB_UNITB_860 &hb_uniTbl_860
|
|
#define HB_UNITB_861 &hb_uniTbl_861
|
|
#define HB_UNITB_862 &hb_uniTbl_862
|
|
#define HB_UNITB_863 &hb_uniTbl_863
|
|
#define HB_UNITB_864 &hb_uniTbl_864
|
|
#define HB_UNITB_865 &hb_uniTbl_865
|
|
#define HB_UNITB_866 &hb_uniTbl_866
|
|
#define HB_UNITB_869 &hb_uniTbl_869
|
|
#define HB_UNITB_874 &hb_uniTbl_874
|
|
#define HB_UNITB_1125 &hb_uniTbl_1125
|
|
#define HB_UNITB_1250 &hb_uniTbl_1250
|
|
#define HB_UNITB_1251 &hb_uniTbl_1251
|
|
#define HB_UNITB_1252 &hb_uniTbl_1252
|
|
#define HB_UNITB_1253 &hb_uniTbl_1253
|
|
#define HB_UNITB_1254 &hb_uniTbl_1254
|
|
#define HB_UNITB_1255 &hb_uniTbl_1255
|
|
#define HB_UNITB_1256 &hb_uniTbl_1256
|
|
#define HB_UNITB_1257 &hb_uniTbl_1257
|
|
#define HB_UNITB_1258 &hb_uniTbl_1258
|
|
#define HB_UNITB_8859_1 &hb_uniTbl_8859_1
|
|
#define HB_UNITB_8859_1B &hb_uniTbl_8859_1b
|
|
#define HB_UNITB_8859_2 &hb_uniTbl_8859_2
|
|
#define HB_UNITB_8859_3 &hb_uniTbl_8859_3
|
|
#define HB_UNITB_8859_4 &hb_uniTbl_8859_4
|
|
#define HB_UNITB_8859_5 &hb_uniTbl_8859_5
|
|
#define HB_UNITB_8859_6 &hb_uniTbl_8859_6
|
|
#define HB_UNITB_8859_7 &hb_uniTbl_8859_7
|
|
#define HB_UNITB_8859_8 &hb_uniTbl_8859_8
|
|
#define HB_UNITB_8859_9 &hb_uniTbl_8859_9
|
|
#define HB_UNITB_8859_10 &hb_uniTbl_8859_10
|
|
#define HB_UNITB_8859_11 &hb_uniTbl_8859_11
|
|
#define HB_UNITB_8859_13 &hb_uniTbl_8859_13
|
|
#define HB_UNITB_8859_14 &hb_uniTbl_8859_14
|
|
#define HB_UNITB_8859_15 &hb_uniTbl_8859_15
|
|
#define HB_UNITB_8859_16 &hb_uniTbl_8859_16
|
|
#define HB_UNITB_KOI_8 &hb_uniTbl_KOI_8
|
|
#define HB_UNITB_KOI_8U &hb_uniTbl_KOI_8U
|
|
#define HB_UNITB_KAM &hb_uniTbl_kamenicky
|
|
#define HB_UNITB_MAZ &hb_uniTbl_mazovia
|
|
#define HB_UNITB_MIK &hb_uniTbl_MIK
|
|
#define HB_UNITB_037 &hb_uniTbl_037
|
|
#define HB_UNITB_424 &hb_uniTbl_424
|
|
#define HB_UNITB_500 &hb_uniTbl_500
|
|
#define HB_UNITB_856 &hb_uniTbl_856
|
|
#define HB_UNITB_875 &hb_uniTbl_875
|
|
#define HB_UNITB_1006 &hb_uniTbl_1006
|
|
#define HB_UNITB_1026 &hb_uniTbl_1026
|
|
#define HB_UNITB_10000 &hb_uniTbl_10000
|
|
#define HB_UNITB_10006 &hb_uniTbl_10006
|
|
#define HB_UNITB_10007 &hb_uniTbl_10007
|
|
#define HB_UNITB_10029 &hb_uniTbl_10029
|
|
#define HB_UNITB_10079 &hb_uniTbl_10079
|
|
#define HB_UNITB_10081 &hb_uniTbl_10081
|
|
#define HB_UNITB_ATARIST &hb_uniTbl_ATARIST
|
|
#define HB_UNITB_NEXTSTEP &hb_uniTbl_NEXTSTEP
|
|
#define HB_UNITB_USASCII &hb_uniTbl_USASCII
|
|
#define HB_UNITB_646YU &hb_uniTbl_646YU
|
|
#define HB_UNITB_646YUC &hb_uniTbl_646YUC
|
|
#define HB_UNITB_UNDEF NULL /* ((PHB_UNITABLE) (-1)) */
|
|
|
|
extern HB_UNITABLE hb_uniTbl_437;
|
|
extern HB_UNITABLE hb_uniTbl_737;
|
|
extern HB_UNITABLE hb_uniTbl_775;
|
|
extern HB_UNITABLE hb_uniTbl_850;
|
|
extern HB_UNITABLE hb_uniTbl_852;
|
|
extern HB_UNITABLE hb_uniTbl_855;
|
|
extern HB_UNITABLE hb_uniTbl_857;
|
|
extern HB_UNITABLE hb_uniTbl_858;
|
|
extern HB_UNITABLE hb_uniTbl_860;
|
|
extern HB_UNITABLE hb_uniTbl_861;
|
|
extern HB_UNITABLE hb_uniTbl_862;
|
|
extern HB_UNITABLE hb_uniTbl_863;
|
|
extern HB_UNITABLE hb_uniTbl_864;
|
|
extern HB_UNITABLE hb_uniTbl_865;
|
|
extern HB_UNITABLE hb_uniTbl_866;
|
|
extern HB_UNITABLE hb_uniTbl_869;
|
|
extern HB_UNITABLE hb_uniTbl_874;
|
|
extern HB_UNITABLE hb_uniTbl_1125;
|
|
extern HB_UNITABLE hb_uniTbl_1250;
|
|
extern HB_UNITABLE hb_uniTbl_1251;
|
|
extern HB_UNITABLE hb_uniTbl_1252;
|
|
extern HB_UNITABLE hb_uniTbl_1253;
|
|
extern HB_UNITABLE hb_uniTbl_1254;
|
|
extern HB_UNITABLE hb_uniTbl_1255;
|
|
extern HB_UNITABLE hb_uniTbl_1256;
|
|
extern HB_UNITABLE hb_uniTbl_1257;
|
|
extern HB_UNITABLE hb_uniTbl_1258;
|
|
extern HB_UNITABLE hb_uniTbl_8859_1;
|
|
extern HB_UNITABLE hb_uniTbl_8859_1b;
|
|
extern HB_UNITABLE hb_uniTbl_8859_2;
|
|
extern HB_UNITABLE hb_uniTbl_8859_3;
|
|
extern HB_UNITABLE hb_uniTbl_8859_4;
|
|
extern HB_UNITABLE hb_uniTbl_8859_5;
|
|
extern HB_UNITABLE hb_uniTbl_8859_6;
|
|
extern HB_UNITABLE hb_uniTbl_8859_7;
|
|
extern HB_UNITABLE hb_uniTbl_8859_8;
|
|
extern HB_UNITABLE hb_uniTbl_8859_9;
|
|
extern HB_UNITABLE hb_uniTbl_8859_10;
|
|
extern HB_UNITABLE hb_uniTbl_8859_11;
|
|
extern HB_UNITABLE hb_uniTbl_8859_13;
|
|
extern HB_UNITABLE hb_uniTbl_8859_14;
|
|
extern HB_UNITABLE hb_uniTbl_8859_15;
|
|
extern HB_UNITABLE hb_uniTbl_8859_16;
|
|
extern HB_UNITABLE hb_uniTbl_KOI_8;
|
|
extern HB_UNITABLE hb_uniTbl_KOI_8U;
|
|
extern HB_UNITABLE hb_uniTbl_kamenicky;
|
|
extern HB_UNITABLE hb_uniTbl_mazovia;
|
|
extern HB_UNITABLE hb_uniTbl_MIK;
|
|
extern HB_UNITABLE hb_uniTbl_037;
|
|
extern HB_UNITABLE hb_uniTbl_424;
|
|
extern HB_UNITABLE hb_uniTbl_500;
|
|
extern HB_UNITABLE hb_uniTbl_856;
|
|
extern HB_UNITABLE hb_uniTbl_875;
|
|
extern HB_UNITABLE hb_uniTbl_1006;
|
|
extern HB_UNITABLE hb_uniTbl_1026;
|
|
extern HB_UNITABLE hb_uniTbl_10000;
|
|
extern HB_UNITABLE hb_uniTbl_10006;
|
|
extern HB_UNITABLE hb_uniTbl_10007;
|
|
extern HB_UNITABLE hb_uniTbl_10029;
|
|
extern HB_UNITABLE hb_uniTbl_10079;
|
|
extern HB_UNITABLE hb_uniTbl_10081;
|
|
extern HB_UNITABLE hb_uniTbl_ATARIST;
|
|
extern HB_UNITABLE hb_uniTbl_NEXTSTEP;
|
|
extern HB_UNITABLE hb_uniTbl_USASCII;
|
|
extern HB_UNITABLE hb_uniTbl_646YU;
|
|
extern HB_UNITABLE hb_uniTbl_646YUC;
|
|
|
|
extern HB_EXPORT PHB_CODEPAGE hb_vmCDP( void );
|
|
extern HB_EXPORT void hb_vmSetCDP( PHB_CODEPAGE pCDP );
|
|
|
|
|
|
/* character flags */
|
|
#define HB_CDP_DIGIT 0x01
|
|
#define HB_CDP_ALPHA 0x02
|
|
#define HB_CDP_LOWER 0x04
|
|
#define HB_CDP_UPPER 0x08
|
|
#define HB_CDP_MULTI1 0x10
|
|
#define HB_CDP_MULTI2 0x20
|
|
|
|
/* accented character sorting */
|
|
#define HB_CDP_ACSORT_NONE 0 /* no special sorting for accented
|
|
characters */
|
|
#define HB_CDP_ACSORT_EQUAL 1 /* accented characters have the same
|
|
weight as corresponding unaccented
|
|
ones */
|
|
#define HB_CDP_ACSORT_INTERLEAVED 2 /* accented characters sort after
|
|
their unaccented counterparts only
|
|
if the unaccented versions of all
|
|
characters being compared are the
|
|
same ( interleaving ) */
|
|
|
|
/* letter case sensitive sorting */
|
|
#define HB_CDP_CSSORT_UPLO 0 /* upper letters first then lower
|
|
ones */
|
|
#define HB_CDP_CSSORT_MIXED 1 /* upper and lower letters are
|
|
mixed */
|
|
#define HB_CDP_CSSORT_IGNORE 2 /* ignore case */
|
|
|
|
/* byte order */
|
|
#define HB_CDP_ENDIAN_NATIVE 0
|
|
#define HB_CDP_ENDIAN_LITTLE 1
|
|
#define HB_CDP_ENDIAN_BIG 2
|
|
|
|
/* codepage types */
|
|
#define HB_CDP_TYPE_CUSTOM 0x0001
|
|
#define HB_CDP_TYPE_CHARIDX 0x0002
|
|
#define HB_CDP_TYPE_CHARUNI 0x0004
|
|
#define HB_CDP_TYPE_BINSORT 0x0008
|
|
#define HB_CDP_TYPE_UTF8 0x0010
|
|
|
|
/* maximal size of unicode character in 'char' representation for buffers
|
|
* To encode all ISO 10646 Universal Character Set (UCS) values (characters
|
|
* can be encoded in 31-bit code space) in UTF-8 we need 6 bytes.
|
|
* UC2 characters (16-bit) encoded in UTF-8 needs 3 bytes.
|
|
* 8 seems to be a little bit redundant and large enough for all encodings.
|
|
* In theory some other encodings may need more bytes but I do not know any
|
|
* one used in practice. [druzus]
|
|
*/
|
|
#define HB_MAX_CHAR_LEN 8
|
|
|
|
/* UCS maximal character value */
|
|
#define HB_CDP_UNICODE_MAX 0x10FFFF
|
|
|
|
/* UTF-16 surrogates for mapping U+010000 to U+10FFFF characters */
|
|
#define HB_CDP_SURROGATE_FIRST 0xD800
|
|
#define HB_CDP_SURROGATE_LAST 0xDFFF
|
|
#define HB_CDP_SURROGATE_HIGH 0xD800
|
|
#define HB_CDP_SURROGATE_LOW 0xDC00
|
|
|
|
/* character codes to replace sequences with wrong encoding or translation */
|
|
#define HB_CDP_ERROR_UNICHAR 0xFFFD /* <?> */
|
|
#define HB_CDP_ERROR_ASCCHAR 0x3F /* ? */
|
|
|
|
/* codepage uses simple binary sorting */
|
|
#define HB_CDP_ISBINSORT( cdp ) ( ( ( cdp )->type & HB_CDP_TYPE_BINSORT ) != 0 )
|
|
/* codepage uses custom string decoding */
|
|
#define HB_CDP_ISCUSTOM( cdp ) ( ( ( cdp )->type & HB_CDP_TYPE_CUSTOM ) != 0 )
|
|
/* codepage use character indexes instead of bytes ones */
|
|
#define HB_CDP_ISCHARIDX( cdp ) ( ( ( cdp )->type & HB_CDP_TYPE_CHARIDX ) != 0 )
|
|
/* Chr(), Asc() and similar functions operates on Unicode values instead of bytes */
|
|
#define HB_CDP_ISCHARUNI( cdp ) ( ( ( cdp )->type & HB_CDP_TYPE_CHARUNI ) != 0 )
|
|
/* codepage uses UTF-8 encoding */
|
|
#define HB_CDP_ISUTF8( cdp ) ( ( ( cdp )->type & HB_CDP_TYPE_UTF8 ) != 0 )
|
|
|
|
#define hb_cdpGetID( cdp ) ( ( cdp )->id )
|
|
|
|
extern HB_EXPORT HB_BOOL hb_cdpRegisterRaw( PHB_CODEPAGE cdp );
|
|
extern HB_EXPORT HB_BOOL hb_cdpRegisterNew( const char * id,
|
|
const char * info,
|
|
PHB_UNITABLE uniTable,
|
|
const char * pszUpper,
|
|
const char * pszLower,
|
|
unsigned int nACSort,
|
|
unsigned int nCaseSort,
|
|
HB_BOOL fUtf8 );
|
|
extern HB_EXPORT void hb_cdpBuildTransTable( PHB_UNITABLE uniTable );
|
|
extern HB_EXPORT void hb_cdpReleaseAll( void );
|
|
extern HB_EXPORT const char * hb_cdpID( void );
|
|
extern HB_EXPORT HB_BOOL hb_cdpIsUTF8( PHB_CODEPAGE cdp );
|
|
extern HB_EXPORT PHB_CODEPAGE hb_cdpSelect( PHB_CODEPAGE cdp );
|
|
extern HB_EXPORT const char * hb_cdpSelectID( const char * id );
|
|
extern HB_EXPORT PHB_CODEPAGE hb_cdpFind( const char * id );
|
|
extern HB_EXPORT PHB_CODEPAGE hb_cdpFindExt( const char * id );
|
|
extern HB_EXPORT const char ** hb_cdpList( void ); /* Caller must release the pointer */
|
|
|
|
|
|
extern HB_EXPORT HB_BOOL hb_cdpIsDigit( PHB_CODEPAGE cdp, int iChar );
|
|
extern HB_EXPORT HB_BOOL hb_cdpIsAlpha( PHB_CODEPAGE cdp, int iChar );
|
|
extern HB_EXPORT HB_BOOL hb_cdpIsLower( PHB_CODEPAGE cdp, int iChar );
|
|
extern HB_EXPORT HB_BOOL hb_cdpIsUpper( PHB_CODEPAGE cdp, int iChar );
|
|
|
|
extern HB_EXPORT int hb_cdpcmp( const char * szFirst, HB_SIZE nLenFirst, const char * szSecond, HB_SIZE nLenSecond, PHB_CODEPAGE cdp, HB_BOOL fExact );
|
|
extern HB_EXPORT int hb_cdpicmp( const char * szFirst, HB_SIZE nLenFirst, const char * szSecond, HB_SIZE nLenSecond, PHB_CODEPAGE cdp, HB_BOOL fExact );
|
|
extern HB_EXPORT const HB_UCHAR * hb_cdpGetSortTab( PHB_CODEPAGE cdp );
|
|
|
|
extern HB_EXPORT char * hb_cdpDup( const char *, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT char * hb_cdpDupn( const char *, HB_SIZE, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT char * hb_cdpnDup( const char *, HB_SIZE *, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT const char * hb_cdpnDup2( const char *, HB_SIZE, char *, HB_SIZE *, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT const char * hb_cdpnDup3( const char *, HB_SIZE, char *, HB_SIZE *, char **, HB_SIZE *, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT HB_SIZE hb_cdpnDupLen( const char *, HB_SIZE, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
extern HB_EXPORT HB_SIZE hb_cdpnDup2Len( const char *, HB_SIZE, HB_SIZE, PHB_CODEPAGE, PHB_CODEPAGE );
|
|
|
|
extern HB_EXPORT char * hb_cdpnDupUpper( PHB_CODEPAGE cdp, const char * pszText, HB_SIZE * pnSize );
|
|
extern HB_EXPORT char * hb_cdpnDupLower( PHB_CODEPAGE cdp, const char * pszText, HB_SIZE * pnSize );
|
|
extern HB_EXPORT HB_SIZE hb_cdpnDup2Upper( PHB_CODEPAGE cdp, const char * pszText, HB_SIZE nSize, char * buffer, HB_SIZE nBuffLen );
|
|
extern HB_EXPORT HB_SIZE hb_cdpnDup2Lower( PHB_CODEPAGE cdp, const char * pszText, HB_SIZE nSize, char * buffer, HB_SIZE nBuffLen );
|
|
|
|
extern HB_EXPORT HB_SIZE hb_cdpTransLen( const char * pSrc, HB_SIZE nSrc, HB_SIZE nMax, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut );
|
|
extern HB_EXPORT HB_SIZE hb_cdpTransTo( const char * pSrc, HB_SIZE nSrc, char * pDst, HB_SIZE nDst, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut );
|
|
|
|
extern HB_EXPORT HB_WCHAR hb_cdpGetU16Disp( PHB_CODEPAGE cdp, HB_UCHAR ch );
|
|
extern HB_EXPORT HB_SIZE hb_cdpStrToUTF8Disp( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, char * pDst, HB_SIZE nDst );
|
|
extern HB_EXPORT int hb_cdpTranslateDispChar( int iChar, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut );
|
|
extern HB_EXPORT int hb_cdpTranslateChar( int iChar, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut );
|
|
|
|
extern HB_EXPORT HB_UCHAR hb_cdpGetChar( PHB_CODEPAGE cdp, HB_WCHAR wc );
|
|
extern HB_EXPORT HB_WCHAR hb_cdpGetU16( PHB_CODEPAGE cdp, HB_UCHAR ch );
|
|
extern HB_EXPORT HB_UCHAR hb_cdpGetUC( PHB_CODEPAGE cdp, HB_WCHAR wc, HB_UCHAR ucDef );
|
|
extern HB_EXPORT HB_WCHAR hb_cdpGetWC( PHB_CODEPAGE cdp, HB_UCHAR ch, HB_WCHAR wcDef );
|
|
|
|
extern HB_EXPORT HB_BOOL hb_cdpGetFromUTF8( PHB_CODEPAGE cdp, HB_UCHAR ch, int * n, HB_WCHAR * pwc );
|
|
|
|
extern HB_EXPORT HB_SIZE hb_cdpUTF8StringLength( const char * pSrc, HB_SIZE nLen );
|
|
extern HB_EXPORT HB_SIZE hb_cdpUTF8StringAt( const char * szNeedle, HB_SIZE nLenN, const char * szHaystack, HB_SIZE nLenH, HB_SIZE nStart, HB_SIZE nEnd, HB_BOOL fReverse );
|
|
extern HB_EXPORT HB_WCHAR32 hb_cdpUTF8StringPeek( const char * pSrc, HB_SIZE nLen, HB_SIZE nPos );
|
|
extern HB_EXPORT char * hb_cdpUTF8StringSubstr( const char * pSrc, HB_SIZE nLen, HB_SIZE nFrom, HB_SIZE nCount, HB_SIZE * pnDest );
|
|
|
|
extern HB_EXPORT HB_SIZE hb_cdpUTF8AsStrLen( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, HB_SIZE nMax );
|
|
extern HB_EXPORT HB_SIZE hb_cdpUTF8ToStr( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, char * pDst, HB_SIZE nDst );
|
|
extern HB_EXPORT HB_SIZE hb_cdpStrAsUTF8Len( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, HB_SIZE nMax );
|
|
extern HB_EXPORT HB_SIZE hb_cdpStrToUTF8( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, char * pDst, HB_SIZE nDst );
|
|
|
|
extern HB_EXPORT HB_SIZE hb_cdpU16AsStrLen( PHB_CODEPAGE cdp, const HB_WCHAR * pSrc, HB_SIZE nSrc, HB_SIZE nMax );
|
|
extern HB_EXPORT HB_SIZE hb_cdpU16ToStr( PHB_CODEPAGE cdp, int iEndian, const HB_WCHAR * pSrc, HB_SIZE nSrc, char * pDst, HB_SIZE nDst );
|
|
extern HB_EXPORT HB_SIZE hb_cdpStrAsU16Len( PHB_CODEPAGE cdp, const char * pSrc, HB_SIZE nSrc, HB_SIZE nMax );
|
|
extern HB_EXPORT HB_SIZE hb_cdpStrToU16( PHB_CODEPAGE cdp, int iEndian, const char * pSrc, HB_SIZE nSrc, HB_WCHAR * pDst, HB_SIZE nDst );
|
|
extern HB_EXPORT HB_WCHAR * hb_cdpStrDupU16( PHB_CODEPAGE cdp, int iEndian, const char * pSrc );
|
|
extern HB_EXPORT HB_WCHAR * hb_cdpStrDupnU16( PHB_CODEPAGE cdp, int iEndian, const char * pSrc, HB_SIZE nSrc );
|
|
extern HB_EXPORT HB_WCHAR * hb_cdpnStrDupU16( PHB_CODEPAGE cdp, int iEndian, const char * pSrc, HB_SIZE nSrc, HB_SIZE * pnDst );
|
|
|
|
extern HB_EXPORT HB_WCHAR hb_cdpGetU16Ctrl( HB_WCHAR wc );
|
|
|
|
extern HB_EXPORT int hb_cdpUTF8CharSize( HB_WCHAR32 wc );
|
|
extern HB_EXPORT int hb_cdpU32CharToUTF8( char * szUTF8, HB_WCHAR32 wc );
|
|
extern HB_EXPORT int hb_cdpU16CharToUTF8( char * szUTF8, HB_WCHAR wc );
|
|
extern HB_EXPORT HB_BOOL hb_cdpUTF8ToU16NextChar( HB_UCHAR ucChar, int * n, HB_WCHAR * pwc );
|
|
extern HB_EXPORT HB_BOOL hb_cdpUTF8GetU32( const char * pSrc, HB_SIZE nLen, HB_SIZE * pnIndex, HB_WCHAR32 * pWC );
|
|
extern HB_EXPORT HB_BOOL hb_cdpUTF8GetUCS( const char * pSrc, HB_SIZE nLen, HB_SIZE * pnIndex, HB_WCHAR32 * pWC );
|
|
extern HB_EXPORT HB_BOOL hb_cdpUTF8GetU16( const char * pSrc, HB_SIZE nLen, HB_SIZE * pnIndex, HB_WCHAR16 * pWC );
|
|
extern HB_EXPORT HB_BOOL hb_cdpUTF8Validate( const char * pSrc, HB_SIZE nLen );
|
|
|
|
extern HB_EXPORT PHB_ITEM hb_itemDeserializeCP( const char ** pBufferPtr, HB_SIZE * pnSize, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut );
|
|
extern HB_EXPORT char * hb_itemSerializeCP( PHB_ITEM pItem, int iFlags, PHB_CODEPAGE cdpIn, PHB_CODEPAGE cdpOut, HB_SIZE * pnSize );
|
|
|
|
extern HB_EXPORT HB_WCHAR hb_cdpUpperWC( PHB_CODEPAGE cdp, HB_WCHAR wc );
|
|
|
|
/* functions operating on character indexes */
|
|
extern HB_EXPORT HB_SIZE hb_cdpTextLen( PHB_CODEPAGE cdp, const char * pText, HB_SIZE nSize );
|
|
extern HB_EXPORT HB_SIZE hb_cdpTextPos( PHB_CODEPAGE cdp, const char * pText, HB_SIZE nSize, HB_SIZE nIndex );
|
|
extern HB_EXPORT HB_SIZE hb_cdpTextPosEx( PHB_CODEPAGE cdp, const char * pText, HB_SIZE nSize, HB_SIZE * pnIndex );
|
|
|
|
extern HB_EXPORT HB_WCHAR hb_cdpTextGetU16( PHB_CODEPAGE cdp, const char * szText, HB_SIZE nLen );
|
|
extern HB_EXPORT HB_SIZE hb_cdpTextPutU16( PHB_CODEPAGE cdp, char * szText, HB_SIZE nSize, HB_WCHAR wc );
|
|
extern HB_EXPORT HB_BOOL hb_cdpCharEq( PHB_CODEPAGE cdp, const char * szText1, HB_SIZE nLen1, HB_SIZE * pnPos1,
|
|
const char * szText2, HB_SIZE nLen2, HB_SIZE * pnPos2 );
|
|
extern HB_EXPORT HB_BOOL hb_cdpCharCaseEq( PHB_CODEPAGE cdp, const char * szText1, HB_SIZE nLen1, HB_SIZE * pnPos1,
|
|
const char * szText2, HB_SIZE nLen2, HB_SIZE * pnPos2 );
|
|
|
|
HB_EXTERN_END
|
|
|
|
#endif /* HB_APICDP_H_ */
|