* common.mak
* source/hbpcre/Makefile
* source/hbpcre/chartabs.c -- changes
* source/hbpcre/config.h
* source/hbpcre/pcre.h
* source/hbpcre/pcrecomp.c
* source/hbpcre/pcreconf.c
* source/hbpcre/pcredfa.c
* source/hbpcre/pcreexec.c
* source/hbpcre/pcrefind.c
* source/hbpcre/pcrefinf.c
* source/hbpcre/pcreget.c
* source/hbpcre/pcreinal.h
* source/hbpcre/pcreinfo.c
* source/hbpcre/pcremktb.c
* source/hbpcre/pcreoutf.c
* source/hbpcre/pcrerefc.c
* source/hbpcre/pcrestud.c
* source/hbpcre/pcretabs.c
* source/hbpcre/pcretryf.c
* source/hbpcre/pcrever.c
* source/hbpcre/pcrevutf.c
* source/hbpcre/pcrexcls.c
* source/hbpcre/ucp.h
* source/hbpcre/ucpinter.h
- source/hbpcre/pcreglob.c -- renames
+ source/hbpcre/_hbpcreg.c
- source/hbpcre/pcreprni.c
+ source/hbpcre/pcreprni.h
- source/hbpcre/ucptable.c
+ source/hbpcre/ucptable.h
+ source/hbpcre/_hbconf.h -- new files
+ source/hbpcre/pcrenewl.c
- source/hbpcre/dftables.c -- deletion
+ Updated to PCRE 7.7 (from 6.3)
; Original code not (yet) modified, so some warnings
may appear in foreign code.
; Please test.
+ source/hbpcre/cnv_hb2o.bat
+ source/hbpcre/cnv_o2hb.bat
+ Added batch files to make the conversion from
original PCRE source files into Harbour.
134 lines
3.0 KiB
C
134 lines
3.0 KiB
C
/*************************************************
*          Unicode Property Table handler        *
*************************************************/

#ifndef _UCP_H
#define _UCP_H

/* This file contains definitions of the property values that are returned by
the function _pcre_ucp_findprop(). New values that are added for new releases
of Unicode should always be at the end of each enum, for backwards
compatibility.

None of the enumerators below has an explicit initializer, so each enum is
numbered consecutively from 0 in declaration order. Inserting, removing or
reordering entries therefore changes the numeric value of every enumerator
that follows. */

/* These are the general character categories. */

enum {
  ucp_C,     /* Other */
  ucp_L,     /* Letter */
  ucp_M,     /* Mark */
  ucp_N,     /* Number */
  ucp_P,     /* Punctuation */
  ucp_S,     /* Symbol */
  ucp_Z      /* Separator */
};

/* These are the particular character types. Each name is a general category
letter (see the enum above) followed by a lower case subtype letter. */

enum {
  ucp_Cc,    /* Control */
  ucp_Cf,    /* Format */
  ucp_Cn,    /* Unassigned */
  ucp_Co,    /* Private use */
  ucp_Cs,    /* Surrogate */
  ucp_Ll,    /* Lower case letter */
  ucp_Lm,    /* Modifier letter */
  ucp_Lo,    /* Other letter */
  ucp_Lt,    /* Title case letter */
  ucp_Lu,    /* Upper case letter */
  ucp_Mc,    /* Spacing mark */
  ucp_Me,    /* Enclosing mark */
  ucp_Mn,    /* Non-spacing mark */
  ucp_Nd,    /* Decimal number */
  ucp_Nl,    /* Letter number */
  ucp_No,    /* Other number */
  ucp_Pc,    /* Connector punctuation */
  ucp_Pd,    /* Dash punctuation */
  ucp_Pe,    /* Close punctuation */
  ucp_Pf,    /* Final punctuation */
  ucp_Pi,    /* Initial punctuation */
  ucp_Po,    /* Other punctuation */
  ucp_Ps,    /* Open punctuation */
  ucp_Sc,    /* Currency symbol */
  ucp_Sk,    /* Modifier symbol */
  ucp_Sm,    /* Mathematical symbol */
  ucp_So,    /* Other symbol */
  ucp_Zl,    /* Line separator */
  ucp_Zp,    /* Paragraph separator */
  ucp_Zs     /* Space separator */
};

/* These are the script identifications. The list is alphabetical up to
ucp_Yi; the scripts marked "New for Unicode 5.0.0" were appended after it
rather than merged into the alphabetical order, in line with the rule that new
values go at the end. */

enum {
  ucp_Arabic,
  ucp_Armenian,
  ucp_Bengali,
  ucp_Bopomofo,
  ucp_Braille,
  ucp_Buginese,
  ucp_Buhid,
  ucp_Canadian_Aboriginal,
  ucp_Cherokee,
  ucp_Common,
  ucp_Coptic,
  ucp_Cypriot,
  ucp_Cyrillic,
  ucp_Deseret,
  ucp_Devanagari,
  ucp_Ethiopic,
  ucp_Georgian,
  ucp_Glagolitic,
  ucp_Gothic,
  ucp_Greek,
  ucp_Gujarati,
  ucp_Gurmukhi,
  ucp_Han,
  ucp_Hangul,
  ucp_Hanunoo,
  ucp_Hebrew,
  ucp_Hiragana,
  ucp_Inherited,
  ucp_Kannada,
  ucp_Katakana,
  ucp_Kharoshthi,
  ucp_Khmer,
  ucp_Lao,
  ucp_Latin,
  ucp_Limbu,
  ucp_Linear_B,
  ucp_Malayalam,
  ucp_Mongolian,
  ucp_Myanmar,
  ucp_New_Tai_Lue,
  ucp_Ogham,
  ucp_Old_Italic,
  ucp_Old_Persian,
  ucp_Oriya,
  ucp_Osmanya,
  ucp_Runic,
  ucp_Shavian,
  ucp_Sinhala,
  ucp_Syloti_Nagri,
  ucp_Syriac,
  ucp_Tagalog,
  ucp_Tagbanwa,
  ucp_Tai_Le,
  ucp_Tamil,
  ucp_Telugu,
  ucp_Thaana,
  ucp_Thai,
  ucp_Tibetan,
  ucp_Tifinagh,
  ucp_Ugaritic,
  ucp_Yi,
  ucp_Balinese,      /* New for Unicode 5.0.0 */
  ucp_Cuneiform,     /* New for Unicode 5.0.0 */
  ucp_Nko,           /* New for Unicode 5.0.0 */
  ucp_Phags_Pa,      /* New for Unicode 5.0.0 */
  ucp_Phoenician     /* New for Unicode 5.0.0 */
};

#endif

/* End of ucp.h */