/* * $Id$ */ /* * Harbour Project source code: * CT3 string functions * - TOKENINIT() * - TOKENEXIT() * - TOKENNEXT() * - TOKENNUM() * - TOKENAT() * - SAVETOKEN() * - RESTTOKEN() * - TOKENEND() * * Copyright 2001 IntTec GmbH, Neunlindenstr 32, 79106 Freiburg, Germany * Author: Martin Vogel * * www - http://harbour-project.org * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2, or (at your option) * any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this software; see the file COPYING. If not, write to * the Free Software Foundation, Inc., 59 Temple Place, Suite 330, * Boston, MA 02111-1307 USA (or visit the web site http://www.gnu.org/). * * As a special exception, the Harbour Project gives permission for * additional uses of the text contained in its release of Harbour. * * The exception is that, if you link the Harbour libraries with other * files to produce an executable, this does not by itself cause the * resulting executable to be covered by the GNU General Public License. * Your use of that executable is in no way restricted on account of * linking the Harbour library code into it. * * This exception does not however invalidate any other reasons why * the executable file might be covered by the GNU General Public License. * * This exception applies only to the code released by the Harbour * Project under the name Harbour. If you copy code from other * Harbour Project or Free Software Foundation releases into a copy of * Harbour, as the General Public License permits, the exception does * not apply to the code that you add in this way. To avoid misleading * anyone as to the status of such modified files, you must delete * this exception notice from them. * * If you write modifications of your own for Harbour, it is your choice * whether to permit this exception to apply to your modifications. * If you do not wish that, delete this exception notice. * */ #include "ct.h" #include "hbvm.h" /* ==================================================================== */ /* static functions for token environment management */ /* ==================================================================== */ #define TOKEN_ENVIRONMENT_STEP 100 typedef struct _TOKEN_POSITION { HB_SIZE sStartPos; /* relative 0-based index of first char of token */ HB_SIZE sEndPos; /* relative 0-based index of first char BEHIND token, so that length = sEndPos-sStartPos */ } TOKEN_POSITION; typedef TOKEN_POSITION * TOKEN_ENVIRONMENT; /* -------------------------------------------------------------------- */ /* alloc new token environment */ /* -------------------------------------------------------------------- */ static TOKEN_ENVIRONMENT sTokEnvNew( void ) { TOKEN_ENVIRONMENT env = ( TOKEN_ENVIRONMENT ) hb_xalloc( sizeof( TOKEN_POSITION ) * ( 2 + TOKEN_ENVIRONMENT_STEP ) ); if( env == NULL ) return NULL; /* use the first element to store current length and use of token env */ env[ 0 ].sStartPos = 0; /* 0-based index to next free, unused element */ env[ 0 ].sEndPos = TOKEN_ENVIRONMENT_STEP; /* but there are 100 elements ready for use */ /* use second element to store actual index with tokennext() */ env[ 1 ].sStartPos = 0; /* 0-based index value that is to be used NEXT */ return env; } /* -------------------------------------------------------------------- */ /* add a tokenizing position to a token environment */ /* -------------------------------------------------------------------- */ static int sTokEnvAddPos( TOKEN_ENVIRONMENT * pEnv, TOKEN_POSITION * pPos ) { HB_SIZE index; TOKEN_ENVIRONMENT env = *pEnv; /* new memory needed ? */ if( env[ 0 ].sStartPos == env[ 0 ].sEndPos ) { env = *pEnv = ( TOKEN_ENVIRONMENT ) hb_xrealloc( env, sizeof( TOKEN_POSITION ) * ( 2 + env[ 0 ].sEndPos + TOKEN_ENVIRONMENT_STEP ) ); env[ 0 ].sEndPos += TOKEN_ENVIRONMENT_STEP; } index = env[ 0 ].sStartPos + 2; /* +2 because of extra elements */ env[ index ].sStartPos = pPos->sStartPos; env[ index ].sEndPos = pPos->sEndPos; env[ 0 ].sStartPos++; return 1; } /* -------------------------------------------------------------------- */ /* check to see if token pointer is at end of environment */ /* -------------------------------------------------------------------- */ static int sTokEnvEnd( TOKEN_ENVIRONMENT env ) { return env[ 1 ].sStartPos >= env[ 0 ].sStartPos; } /* -------------------------------------------------------------------- */ /* get size of token environment in memory */ /* -------------------------------------------------------------------- */ static HB_SIZE sTokEnvGetSize( TOKEN_ENVIRONMENT env ) { return sizeof( TOKEN_POSITION ) * ( 2 + env[ 0 ].sEndPos ); } /* -------------------------------------------------------------------- */ /* get position element pointed to by tokenizing pointer */ /* -------------------------------------------------------------------- */ static TOKEN_POSITION * sTokEnvGetPos( TOKEN_ENVIRONMENT env ) { if( env[ 1 ].sStartPos >= env[ 0 ].sStartPos ) return NULL; return env + 2 + ( env[ 1 ].sStartPos ); /* "+2" because of extra elements */ } /* -------------------------------------------------------------------- */ /* get position element pointed to by given 0-based index */ /* -------------------------------------------------------------------- */ static TOKEN_POSITION * sTokEnvGetPosIndex( TOKEN_ENVIRONMENT env, HB_SIZE index ) { if( index >= env[ 0 ].sStartPos ) return NULL; return env + 2 + index; /* "+2" because of extra elements */ } /* -------------------------------------------------------------------- */ /* increment tokenizing pointer by one */ /* -------------------------------------------------------------------- */ static int sTokEnvIncPtr( TOKEN_ENVIRONMENT env ) { if( env[ 1 ].sStartPos >= env[ 0 ].sStartPos ) return 0; else { env[ 1 ].sStartPos++; return 1; } } /* -------------------------------------------------------------------- */ /* set tokenizing pointer to 0-based value */ /* -------------------------------------------------------------------- */ static int sTokEnvSetPtr( TOKEN_ENVIRONMENT env, HB_SIZE sCnt ) { if( sCnt >= env[ 0 ].sStartPos ) return 0; else { env[ 1 ].sStartPos = sCnt; return 1; } } /* -------------------------------------------------------------------- */ /* decrement tokenizing pointer by one */ /* -------------------------------------------------------------------- */ /* sTokEnvDecPtr currently not used ! */ /* static int sTokEnvDecPtr( TOKEN_ENVIRONMENT env ) { if( env[ 1 ].sStartPos <= 0 ) return 0; else { env[ 1 ].sStartPos--; return 1; } } */ /* -------------------------------------------------------------------- */ /* get value of tokenizing pointer */ /* -------------------------------------------------------------------- */ static HB_SIZE sTokEnvGetPtr( TOKEN_ENVIRONMENT env ) { return env[ 1 ].sStartPos; } /* -------------------------------------------------------------------- */ /* get token count */ /* -------------------------------------------------------------------- */ static HB_SIZE sTokEnvGetCnt( TOKEN_ENVIRONMENT env ) { return env[ 0 ].sStartPos; } /* -------------------------------------------------------------------- */ /* free token environment */ /* -------------------------------------------------------------------- */ static void sTokEnvDel( TOKEN_ENVIRONMENT env ) { hb_xfree( env ); } /* ==================================================================== */ /* HARBOUR functions */ /* ==================================================================== */ /* static data */ static const char * spcSeparatorStr = "\x00" "\x09" "\x0A" "\x0C" "\x1A" "\x20" "\x8A" "\x8C" ",.;:!\?/\\<>()#&%+-*"; static const HB_SIZE ssSeparatorStrLen = 26; /* TODO: make thread safe */ static TOKEN_ENVIRONMENT s_sTokenEnvironment = NULL; static HB_BOOL s_fInit = HB_FALSE; static void sTokExit( void * cargo ) { HB_SYMBOL_UNUSED( cargo ); if( s_sTokenEnvironment ) { sTokEnvDel( s_sTokenEnvironment ); s_sTokenEnvironment = NULL; } } static void sTokSet( TOKEN_ENVIRONMENT env ) { if( !s_fInit && env ) { hb_vmAtExit( sTokExit, NULL ); s_fInit = HB_TRUE; } if( s_sTokenEnvironment ) sTokEnvDel( s_sTokenEnvironment ); s_sTokenEnvironment = env; } HB_FUNC( TOKENINIT ) { if( HB_ISCHAR( 1 ) ) { const char * pcString = hb_parc( 1 ); HB_SIZE sStrLen = hb_parclen( 1 ); const char * pcSeparatorStr; HB_SIZE sSeparatorStrLen; HB_SIZE nSkipCnt, nSkip; const char * pcSubStr, * pc; HB_SIZE sSubStrLen; TOKEN_ENVIRONMENT sTokenEnvironment; TOKEN_POSITION sTokenPosition; /* separator string */ sSeparatorStrLen = hb_parclen( 2 ); if( sSeparatorStrLen > 0 ) pcSeparatorStr = hb_parc( 2 ); else { pcSeparatorStr = ( const char * ) spcSeparatorStr; sSeparatorStrLen = ssSeparatorStrLen; } /* skip width */ if( HB_ISNUM( 3 ) ) nSkip = hb_parns( 3 ); else nSkip = HB_SIZE_MAX; if( nSkip == 0 ) nSkip = HB_SIZE_MAX; /* allocate new token environment */ if( ( sTokenEnvironment = sTokEnvNew() ) == NULL ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_MEM, CT_ERROR_TOKENINIT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retl( HB_FALSE ); return; } pcSubStr = pcString; sSubStrLen = sStrLen; /* scan start condition */ pc = pcSubStr - 1; for( ;; ) { HB_SIZE sMatchedPos = sSeparatorStrLen; /* nSkip */ nSkipCnt = 0; do { sSubStrLen -= ( pc - pcSubStr ) + 1; pcSubStr = pc + 1; pc = ct_at_charset_forward( pcSubStr, sSubStrLen, pcSeparatorStr, sSeparatorStrLen, &sMatchedPos ); nSkipCnt++; } while( nSkipCnt < nSkip && pc == pcSubStr ); if( sSubStrLen == 0 ) break; sTokenPosition.sStartPos = pcSubStr - pcString; if( pc == NULL ) sTokenPosition.sEndPos = pcSubStr - pcString + sSubStrLen; else sTokenPosition.sEndPos = pc - pcString; if( !sTokEnvAddPos( &sTokenEnvironment, &sTokenPosition ) ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_MEM, CT_ERROR_TOKENINIT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } sTokEnvDel( sTokenEnvironment ); hb_retl( HB_FALSE ); return; } if( pc == NULL ) break; } /* for( ;; ) */ /* save token environment to 4th parameter OR to the static */ if( HB_ISBYREF( 4 ) ) { hb_storclen( ( char * ) sTokenEnvironment, sTokEnvGetSize( sTokenEnvironment ), 4 ); sTokEnvDel( sTokenEnvironment ); } else { sTokSet( sTokenEnvironment ); } hb_retl( HB_TRUE ); } else /* HB_ISCHAR( 1 ) */ { /* if there is a token environment stored in either the 4th parameter or in the static variable -> rewind to first token */ TOKEN_ENVIRONMENT sTokenEnvironment; if( HB_ISCHAR( 4 ) && HB_ISBYREF( 4 ) ) sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_parc( 4 ); else sTokenEnvironment = s_sTokenEnvironment; if( sTokenEnvironment != NULL ) { /* rewind to first token */ hb_retl( sTokEnvSetPtr( sTokenEnvironment, 0 ) ); if( HB_ISCHAR( 4 ) && HB_ISBYREF( 4 ) ) hb_storclen( ( char * ) sTokenEnvironment, sTokEnvGetSize( sTokenEnvironment ), 4 ); } else { /* nothing to rewind -> return .f. */ PHB_ITEM pSubst = NULL; int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { pSubst = ct_error_subst( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENINIT, NULL, HB_ERR_FUNCNAME, 0, EF_CANSUBSTITUTE, HB_ERR_ARGS_BASEPARAMS ); } if( pSubst != NULL ) hb_itemReturnRelease( pSubst ); else hb_retl( HB_FALSE ); } } } HB_FUNC( TOKENNEXT ) { if( HB_ISCHAR( 1 ) ) { const char * pcString = hb_parc( 1 ); HB_SIZE sStrLen = hb_parclen( 1 ); TOKEN_ENVIRONMENT sTokenEnvironment; TOKEN_POSITION * psTokenPosition; /* token environment by parameter ... */ if( HB_ISCHAR( 3 ) && HB_ISBYREF( 3 ) ) { HB_SIZE sStrLen3 = hb_parclen( 3 ); if( sStrLen3 < sizeof( TOKEN_POSITION ) * 2 ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENNEXT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retc_null(); return; } sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_xgrab( sStrLen3 ); hb_xmemcpy( ( char * ) sTokenEnvironment, hb_parc( 3 ), sStrLen3 ); } else { /* ... or static ? */ if( s_sTokenEnvironment == NULL ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENNEXT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retc_null(); return; } sTokenEnvironment = s_sTokenEnvironment; } /* nth token or next token ? */ if( HB_ISNUM( 2 ) ) { psTokenPosition = sTokEnvGetPosIndex( sTokenEnvironment, hb_parns( 2 ) - 1 ); /* no increment here */ } else { psTokenPosition = sTokEnvGetPos( sTokenEnvironment ); /* increment counter */ sTokEnvIncPtr( sTokenEnvironment ); } if( ( psTokenPosition == NULL ) || ( sStrLen <= psTokenPosition->sStartPos ) ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENNEXT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } if( HB_ISCHAR( 3 ) && HB_ISBYREF( 3 ) ) { hb_storclen( ( char * ) sTokenEnvironment, sTokEnvGetSize( sTokenEnvironment ), 3 ); hb_xfree( ( char * ) sTokenEnvironment ); } hb_retc_null(); return; } if( sStrLen < psTokenPosition->sEndPos ) hb_retclen( pcString + psTokenPosition->sStartPos, sStrLen - ( psTokenPosition->sStartPos ) ); else hb_retclen( pcString + psTokenPosition->sStartPos, ( psTokenPosition->sEndPos ) - ( psTokenPosition->sStartPos ) ); if( HB_ISCHAR( 3 ) && HB_ISBYREF( 3 ) ) { hb_storclen( ( char * ) sTokenEnvironment, sTokEnvGetSize( sTokenEnvironment ), 3 ); hb_xfree( ( char * ) sTokenEnvironment ); } } else { /* no string given, no token returns */ PHB_ITEM pSubst = NULL; int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { pSubst = ct_error_subst( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENNEXT, NULL, HB_ERR_FUNCNAME, 0, EF_CANSUBSTITUTE, HB_ERR_ARGS_BASEPARAMS ); } if( pSubst != NULL ) hb_itemReturnRelease( pSubst ); else hb_retc_null(); } } HB_FUNC( TOKENNUM ) { TOKEN_ENVIRONMENT sTokenEnvironment; if( HB_ISCHAR( 1 ) && HB_ISBYREF( 1 ) ) sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_parc( 1 ); else sTokenEnvironment = s_sTokenEnvironment; if( ( void * ) sTokenEnvironment != NULL ) hb_retns( sTokEnvGetCnt( sTokenEnvironment ) ); else { PHB_ITEM pSubst = NULL; int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { pSubst = ct_error_subst( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENNUM, NULL, HB_ERR_FUNCNAME, 0, EF_CANSUBSTITUTE, HB_ERR_ARGS_BASEPARAMS ); } if( pSubst != NULL ) hb_itemReturnRelease( pSubst ); else hb_retns( 0 ); } } HB_FUNC( TOKENEND ) { TOKEN_ENVIRONMENT sTokenEnvironment; if( HB_ISCHAR( 1 ) && HB_ISBYREF( 1 ) ) sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_parc( 1 ); else sTokenEnvironment = s_sTokenEnvironment; if( ( void * ) sTokenEnvironment != NULL ) hb_retl( sTokEnvEnd( sTokenEnvironment ) ); else { PHB_ITEM pSubst = NULL; int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { pSubst = ct_error_subst( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENEND, NULL, HB_ERR_FUNCNAME, 0, EF_CANSUBSTITUTE, HB_ERR_ARGS_BASEPARAMS ); } if( pSubst != NULL ) hb_itemReturnRelease( pSubst ); else /* it is CTIII behaviour to return .T. if there's no string TOKENINIT'ed */ hb_retl( HB_TRUE ); } } HB_FUNC( TOKENEXIT ) { if( s_sTokenEnvironment != NULL ) { sTokExit( NULL ); hb_retl( HB_TRUE ); } else hb_retl( HB_FALSE ); } HB_FUNC( TOKENAT ) { int iSeparatorPos = 0; HB_SIZE sCurrentIndex; TOKEN_ENVIRONMENT sTokenEnvironment; TOKEN_POSITION *psTokenPosition; if( HB_ISLOG( 1 ) ) iSeparatorPos = hb_parl( 1 ); if( HB_ISCHAR( 3 ) && HB_ISBYREF( 3 ) ) sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_parc( 3 ); else sTokenEnvironment = s_sTokenEnvironment; if( ( void * ) sTokenEnvironment == NULL ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENAT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retns( 0 ); return; } if( HB_ISNUM( 2 ) ) sCurrentIndex = hb_parns( 2 ) - 1; else sCurrentIndex = sTokEnvGetPtr( sTokenEnvironment ); psTokenPosition = sTokEnvGetPosIndex( sTokenEnvironment, sCurrentIndex ); if( psTokenPosition == NULL ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_TOKENAT, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retns( 0 ); return; } if( iSeparatorPos ) hb_retns( psTokenPosition->sEndPos + 1 ); else hb_retns( psTokenPosition->sStartPos + 1 ); } HB_FUNC( SAVETOKEN ) { if( s_sTokenEnvironment != NULL ) hb_retclen( ( char * ) s_sTokenEnvironment, sTokEnvGetSize( s_sTokenEnvironment ) ); else hb_retc_null(); } HB_FUNC( RESTTOKEN ) { TOKEN_ENVIRONMENT sTokenEnvironment = NULL; HB_SIZE sStrLen = 1; if( HB_ISCHAR( 1 ) ) { sStrLen = hb_parclen( 1 ); if( sStrLen >= sizeof( TOKEN_POSITION ) ) { TOKEN_ENVIRONMENT env = ( TOKEN_ENVIRONMENT ) hb_parc( 1 ); if( sTokEnvGetSize( env ) == sStrLen ) { /* alloc memory for new environment */ sTokenEnvironment = ( TOKEN_ENVIRONMENT ) hb_xalloc( sStrLen ); if( sTokenEnvironment == NULL ) { int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { ct_error( ( HB_USHORT ) iArgErrorMode, EG_MEM, CT_ERROR_RESTTOKEN, NULL, HB_ERR_FUNCNAME, 0, EF_CANDEFAULT, HB_ERR_ARGS_BASEPARAMS ); } hb_retc_null(); return; } hb_xmemcpy( sTokenEnvironment, env, sStrLen ); } } } if( sTokenEnvironment != NULL || sStrLen == 0 ) { /* return current environment, then delete it */ if( s_sTokenEnvironment != NULL ) hb_retclen( ( char * ) s_sTokenEnvironment, sTokEnvGetSize( s_sTokenEnvironment ) ); else hb_retc_null(); sTokSet( sTokenEnvironment ); } else { PHB_ITEM pSubst = NULL; int iArgErrorMode = ct_getargerrormode(); if( iArgErrorMode != CT_ARGERR_IGNORE ) { pSubst = ct_error_subst( ( HB_USHORT ) iArgErrorMode, EG_ARG, CT_ERROR_RESTTOKEN, NULL, HB_ERR_FUNCNAME, 0, EF_CANSUBSTITUTE, HB_ERR_ARGS_BASEPARAMS ); } if( pSubst != NULL ) hb_itemReturnRelease( pSubst ); else hb_retc_null(); } }