Files
harbour-core/harbour/contrib/xhb/fparse.c
Viktor Szakats 003fd7c41e 2010-01-14 18:01 UTC+0100 Viktor Szakats (harbour.01 syenar.hu)
* src/rtl/strclear.c
    + HB_STRCLEAR() return value will now precisely inform about
      successful clear operation. Thanks to Mindaugas.

  * src/vm/hashfunc.c
  * src/vm/macro.c
  * src/vm/strapi.c
  * src/vm/runner.c
  * src/vm/estack.c
  * src/vm/codebloc.c
  * src/vm/hashes.c
  * src/vm/maindll.c
  * src/vm/dynsym.c
  * src/vm/debug.c
  * src/vm/itemapi.c
  * src/vm/garbage.c
  * src/vm/asort.c
  * src/vm/hvm.c
  * src/vm/cmdarg.c
  * src/vm/mainstd.c
  * src/vm/maindllp.c
  * src/vm/arrays.c
  * src/vm/task.c
  * src/vm/fm.c
  * src/vm/proc.c
  * src/vm/thread.c
  * src/vm/memvars.c
  * src/vm/arrayshb.c
  * src/vm/eval.c
  * src/vm/extend.c
  * src/vm/dynlibhb.c
  * src/vm/set.c
  * src/vm/classes.c
  * src/debug/dbgentry.c
  * src/common/hbgete.c
  * src/common/hbffind.c
  * src/common/hbver.c
  * src/common/hbprintf.c
  * src/common/hbfsapi.c
  * src/common/hbstr.c
  * src/common/expropt1.c
  * src/common/expropt2.c
  * src/common/hbdate.c
  * src/common/strwild.c
  * src/common/hbhash.c
  * src/rtl/gtdos/gtdos.c
  * src/rtl/fscopy.c
  * src/rtl/run.c
  * src/rtl/gtwin/gtwin.c
  * src/rtl/gtxwc/gtxwc.h
  * src/rtl/gtxwc/gtxwc.c
  * src/rtl/math.c
  * src/rtl/empty.c
  * src/rtl/gtcrs/gtcrs.c
  * src/rtl/trim.c
  * src/rtl/filehb.c
  * src/rtl/hbtoken.c
  * src/rtl/fstemp.c
  * src/rtl/gtchrmap.c
  * src/rtl/strmatch.c
  * src/rtl/gtstd/gtstd.c
  * src/rtl/gttrm/gttrm.c
  * src/rtl/padr.c
  * src/rtl/hbstrfmt.c
  * src/rtl/transfrm.c
  * src/rtl/fserr.c
  * src/rtl/minmax.c
  * src/rtl/hbfeof.c
  * src/rtl/dates.c
  * src/rtl/padc.c
  * src/rtl/gtcgi/gtcgi.c
  * src/rtl/errapi.c
  * src/rtl/version.c
  * src/rtl/hbregexc.c
  * src/rtl/hbrandom.c
  * src/rtl/strtran.c
  * src/rtl/hbprocfn.c
  * src/rtl/hbsocket.c
  * src/rtl/hbinet.c
  * src/rtl/copyfile.c
  * src/rtl/errintlo.c
  * src/rtl/gtapi.c
  * src/rtl/filesys.c
  * src/rtl/padl.c
  * src/rtl/hbregex.c
  * src/rtl/hbbit.c
  * src/rtl/isprint.c
  * src/rtl/saverest.c
  * src/rtl/diskspac.c
  * src/rtl/console.c
  * src/rtl/spfiles.c
  * src/rtl/gtos2/gtos2.c
  * src/rtl/philes.c
  * src/rtl/hbbffnc.c
  * src/rtl/hbgtcore.c
  * src/rtl/cdpapi.c
  * src/rtl/dirdrive.c
  * src/rtl/hbi18n1.c
  * src/rtl/gtclip.c
  * src/rtl/mlcfunc.c
  * src/rtl/gtapiu.c
  * src/rtl/accept.c
  * src/rtl/idle.c
  * src/rtl/itemseri.c
  * src/rtl/hbrunfun.c
  * src/rtl/setcolor.c
  * src/rtl/setkey.c
  * src/rtl/gtsln/mousesln.c
  * src/rtl/gtsln/gtsln.c
  * src/rtl/gtsln/kbsln.c
  * src/rtl/gtsln/gtsln.h
  * src/rtl/disksphb.c
  * src/rtl/strc.c
  * src/rtl/gtpca/gtpca.c
  * src/rtl/gtgui/gtgui.c
  * src/rtl/hbhex.c
  * src/rtl/trace.c
  * src/rtl/gt_tpl/gt_tpl.c
  * src/rtl/inkeyapi.c
  * src/rtl/filebuf.c
  * src/rtl/gete.c
  * src/rtl/setcurs.c
  * src/rtl/hbproces.c
  * src/rtl/langapi.c
  * src/rtl/gtwvt/gtwvt.h
  * src/rtl/gtwvt/gtwvt.c
  * src/rtl/mouse53.c
  * src/rtl/fssize.c
  * src/rtl/hbbyte.c
  * src/rtl/mouseapi.c
  * src/rtl/memofile.c
  * src/rtl/valtostr.c
  * src/rtl/file.c
  * src/rtl/val.c
  * src/rtl/rat.c
  * src/rdd/hbsix/sxcompr.c
  * include/hbvmpub.h
  * include/hbset.h
  * include/hbapicdp.h
  * include/hbstack.h
  * include/hbapilng.h
  * include/hbgtcore.h
  * include/hbapifs.h
  * include/hbthread.h
  * include/hbxvm.h
  * include/hbmacro.h
  * include/hbtypes.h
  * include/hbapi.h
  * include/hbapiitm.h
  * include/hbznet.h
  * include/hbvm.h
  * include/hbapidbg.h
  * include/hbcomp.h
  * include/hbsxfunc.h
  * include/hbcompdf.h
  * include/hbmather.h
  * include/hbapistr.h
  * include/hbwmain.c
  * include/hbexpra.c
  * include/hbexprop.h
  * include/hbsocket.h
  * include/hbapigt.h
  * include/hbapicls.h
  * include/hbhash.h
  * include/hbregex.h
  * include/hbexprb.c
  * include/hbdate.h
  * contrib/gtalleg/gtalleg.c
  * contrib/xhb/hboutdbg.c
  * contrib/xhb/hbserv.h
  * contrib/xhb/bkgtsks.c
  * contrib/xhb/dbf2txt.c
  * contrib/xhb/xhbis.c
  * contrib/xhb/fparse.c
  * contrib/xhb/xhb.h
  * contrib/xhb/xhbsave.c
  * contrib/xhb/xhbmsgs.c
  * contrib/xhb/freadlin.c
  * contrib/xhb/txtline.c
  * contrib/xhb/dbgfxc.c
  * contrib/xhb/xhberrc.c
  * contrib/xhb/filestat.c
  * contrib/xhb/xhbcopyf.c
  * contrib/xhb/hbnxs.h
  * contrib/xhb/hbserv.c
  * contrib/xhb/cstructc.c
  * contrib/xhb/xhbfunc.c
  * contrib/hbmzip/hbmzip.c
  * contrib/gtqtc/gtqtc.cpp
  * contrib/gtwvg/gtwvg.c
  * contrib/gtwvg/gtwvg.h
  * contrib/gtwvg/wvggui.c
  * contrib/gtwvg/wvgcuig.c
  * contrib/gtwvg/wvggui.h
  * contrib/gtwvg/wvgwin.c
  * contrib/gtwvg/wvgutils.c
  * contrib/gtwvg/wvgcore.c
  * contrib/gtwvg/wvgwing.c
  * contrib/hbmisc/hb_f.c
  * contrib/hbmisc/dates2.c
  * contrib/hbwin/hbwapi.h
  * contrib/hbbtree/tests/ctest.c
    * BOOL  -> HB_BOOL
    * TRUE  -> HB_TRUE
    * FALSE -> HB_FALSE
    ; If possible, please try to verify my changes, at least in your own area
      of interest or expertise. Look for HB_BOOL/HB_TRUE/HB_FALSE usage in
      WINAPI calls; if you see such a thing, it's wrong. Also, some implicit
      HB_BOOL <-> WINAPI BOOL conversions may need to be cleaned up.
    ; I didn't touch PP, RDD, SDD and compiler parts yet.
    ; In a few places it's possible that some in-line comments are misaligned
      after this operation.
2010-01-14 17:59:30 +00:00

688 lines
16 KiB
C

/*
* $Id$
*/
/*
* Harbour Project source code:
*
* FPARSE()
* FPARSEEX()
* FPARSELINE()
* FLINECOUNT()
* FCHARCOUNT()
* FWORDCOUNT()
*
* Copyright 2004 Andi Jahja <xharbour@cbn.net.id>
* www - http://www.harbour-project.org
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2, or (at your option)
* any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this software; see the file COPYING. If not, write to
* the Free Software Foundation, Inc., 59 Temple Place, Suite 330,
* Boston, MA 02111-1307 USA (or visit the web site http://www.gnu.org/).
*
* As a special exception, the Harbour Project gives permission for
* additional uses of the text contained in its release of Harbour.
*
* The exception is that, if you link the Harbour libraries with other
* files to produce an executable, this does not by itself cause the
* resulting executable to be covered by the GNU General Public License.
* Your use of that executable is in no way restricted on account of
* linking the Harbour library code into it.
*
* This exception does not however invalidate any other reasons why
* the executable file might be covered by the GNU General Public License.
*
* This exception applies only to the code released by the Harbour
* Project under the name Harbour. If you copy code from other
* Harbour Project or Free Software Foundation releases into a copy of
* Harbour, as the General Public License permits, the exception does
* not apply to the code that you add in this way. To avoid misleading
* anyone as to the status of such modified files, you must delete
* this exception notice from them.
*
* If you write modifications of your own for Harbour, it is your choice
* whether to permit this exception to apply to your modifications.
* If you do not wish that, delete this exception notice.
*
*/
/*
FPARSE( cFile, cDelimiter ) -> array
Purpose:
Parse a delimited text file.
Parameters:
cFile - file to process
cDelimiter - delimiter, default is comma
Returns:
Upon success -> Two dimensional array, of which each element contains
the results of parsing
Upon error -> An empty array
*/
#include "hbapi.h"
#include "hbapifs.h"
#include "hbapiitm.h"
#include "hbfast.h"
/* adjustable, but this should be sufficient in normal situations */
#define MAX_READ 4096
/*----------------------------------------------------------------------------*/
/*
 * hb_ParseLine() - split one line of delimited text into fields and append
 * every field, as a string item, to the array held by pReturn.
 *
 *   pReturn    - array item that receives the fields (hb_arrayAddForward)
 *   szText     - NUL terminated line; when it is NULL or empty nothing is
 *                appended and *iWord is left untouched
 *   iDelimiter - field separator, compared against the plain char values
 *                of szText
 *   iWord      - receives the number of fields appended by this call
 *
 * Text enclosed in double quotes is copied without looking for the
 * delimiter.  A line whose last character is the delimiter gets one extra
 * trailing empty field.
 *
 * NOTE(review): szText[ i ] is a plain char, so on platforms where char is
 * signed a delimiter passed as a positive value >= 0x80 presumably never
 * matches - confirm against the callers before relying on such delimiters.
 */
void hb_ParseLine( PHB_ITEM pReturn, const char * szText, int iDelimiter, int * iWord )
{
   if ( szText )
   {
      int iLen = strlen( szText );

      if ( iLen > 0 )
      {
         PHB_ITEM pTemp = hb_itemNew( NULL );
         int i = 0, word_count = 0 ;
         /* a single field can never be longer than the whole line */
         char *szResult = (char*) hb_xgrab( iLen + 1 );

         while( i < iLen )
         {
            /* index of the last character stored in szResult */
            int ui = 0;

            /* the work buffer is blanked (not zeroed) for every field, so
               each branch below must write its own terminator */
            hb_xmemset( szResult, ' ', iLen + 1 );

            /* an '"' found, loop until the next one is found */
            if ( szText[ i ] == '"' )
            {
               /* an '"' after '"' ? */
               if ( szText[ i + 1 ] != '"' )
               {
                  szResult [ ui ] = szText[ i + 1 ];
               }
               else
               {
                  szResult [ ui ] = '\0';
               }

               ++ i;

               while( ++ i < iLen )
               {
                  if ( szText[ i - 1 ] == '"' )
                  {
                     szResult [ ui + 1 ] = '\0';
                     break;
                  }
                  else
                  {
                     if ( szText[ i ] == '"' )
                     {
                        szResult [ ui + 1 ] = '\0';
                     }
                     else
                     {
                        szResult [ ++ ui ] = szText[ i ];
                     }
                  }
               }

               word_count ++;
               /* When the closing '"' is missing the loop above runs off
                  the end of the line without terminating the field, and
                  the blank-filled buffer would be read past its end.
                  Terminate here exactly like the other two branches do;
                  this is a no-op whenever the loop already stored the
                  terminator at this position. */
               szResult [ ui + 1 ] = '\0';
               hb_arrayAddForward( pReturn, hb_itemPutC( pTemp, szResult ));
            }
            /* delimiter found */
            else if ( szText[ i ] == iDelimiter )
            {
               /* first delimiter found but no word yet */
               if ( word_count == 0 )
               {
                  /* add an empty string */
                  szResult [ ui ] = '\0';
               }
               else
               {
                  /* we already have the first word */
                  /* check the previous character */
                  if ( szText [ i - 1 ] == iDelimiter )
                  {
                     /* delimiter after delimiter */
                     /* just add an empty string */
                     szResult [ ui ] = '\0';
                  }
                  else
                  {
                     /* ",,0" */
                     /* it is not a delimiter */
                     /* move to next character */
                     ++ i;
                     szResult [ ui ] = szText[ i ];

                     while( ++ i < iLen )
                     {
                        if ( szText[ i ] == iDelimiter )
                        {
                           break;
                        }
                        else
                        {
                           szResult [ ++ ui ] = szText[ i ];
                        }
                     }
                  }
               }

               word_count ++;
               szResult [ ui + 1 ] = '\0';
               hb_arrayAddForward( pReturn, hb_itemPutC( pTemp, szResult ));
            }
            else
            {
               /* ordinary character: copy up to the next delimiter */
               szResult [ ui ] = szText[ i ];

               while( ++ i < iLen )
               {
                  if ( szText[ i ] == iDelimiter )
                  {
                     szResult [ ui + 1 ] = '\0';
                     break;
                  }
                  else if ( szText[ i ] == '"' )
                  {
                     /* quoted part inside the field: copied without
                        testing for the delimiter */
                     szResult [ ui ] = szText[ i + 1 ];
                     ++ i;

                     while( ++ i < iLen )
                     {
                        if ( szText[ i - 1 ] == '"' )
                        {
                           szResult [ ui + 1 ] = '\0';
                           break;
                        }
                        else
                        {
                           if ( szText[ i ] == '"' )
                           {
                              szResult [ ui + 1 ] = '\0';
                              break;
                           }
                           else
                           {
                              szResult [ ++ ui ] = szText[ i ];
                           }
                        }
                     }
                  }
                  else
                  {
                     szResult [ ++ ui ] = szText[ i ];
                  }
               }

               word_count ++;
               szResult [ ui + 1 ] = '\0';
               hb_arrayAddForward( pReturn, hb_itemPutC( pTemp, szResult ));
            }

            i ++;
         }

         /* last character in passed string is a delimiter */
         /* just add an empty string */
         if ( szText[ iLen - 1 ] == iDelimiter )
         {
            word_count ++;
            hb_arrayAddForward( pReturn, hb_itemPutC( pTemp, NULL ) );
         }

         /* store number of words */
         *iWord = word_count;

         /* clean up */
         hb_xfree( szResult );
         hb_itemRelease( pTemp );
      }
   }
}
/*----------------------------------------------------------------------------*/
/*
 * hb_tokensplit() - split `string` into tokens separated by `delimiter`.
 *
 *   string     - NUL terminated text to split; it is only read
 *   delimiter  - separator byte; runs of consecutive delimiters act as a
 *                single separator, so empty tokens are never produced
 *   iCharCount - size hint for the token buffer; must be at least
 *                strlen( string )
 *   iWord      - receives the number of tokens found
 *
 * Returns a NULL terminated array of pointers to the tokens.  All tokens
 * are stored back to back in one buffer whose address is kept in the slot
 * just before the returned pointer, so the caller releases the result with
 *    hb_xfree( result[ -1 ] ); hb_xfree( result - 1 );
 */
static char ** hb_tokensplit ( char *string, BYTE delimiter, int iCharCount, int *iWord )
{
   char *buffer, *bufptr;
   char **token_list;
   char last_char = '\0';
   int word_count = 0, word_nbr;

   buffer = (char *) hb_xgrab ( iCharCount + 1 );
   bufptr = buffer;

   while ( *string )
   {
      /* compare as BYTE: a plain char may be signed, in which case a
         delimiter >= 0x80 would never be equal to *string */
      if ( (BYTE) *string == delimiter )
      {
         while ( (BYTE) *string == delimiter )
         {
            string ++;
         }
         /* close the current token, unless the line starts with delimiters */
         if (bufptr > buffer)
         {
            word_count ++;
            last_char = *bufptr++ = '\0';
         }
      }
      else
      {
         last_char = *bufptr++ = *string++;
      }
   }

   /* The final token is still open when the text does not end with a
      delimiter.  Test against '\0' rather than "> 0": with a signed char a
      token ending in a byte >= 0x80 is negative and was silently dropped. */
   if ( last_char != '\0' )
   {
      word_count++;
   }
   *bufptr = '\0';

   /* one extra leading slot for the buffer address, one trailing for NULL */
   token_list = (char **) hb_xgrab (sizeof (char *) * (word_count + 2));
   token_list [0] = buffer;
   token_list++;

   bufptr = buffer;
   for (word_nbr = 0; word_nbr < word_count; word_nbr++)
   {
      token_list [word_nbr] = bufptr;
      bufptr += strlen (bufptr) + 1;
   }
   token_list [word_count] = NULL;

   *iWord = word_count;
   return token_list;
}
/*----------------------------------------------------------------------------*/
/*
 * file_read() - fetch the next line from `stream` into `string`.
 *
 * `string` must have room for MAX_READ + 1 bytes.  Carriage returns are
 * dropped.  Reading stops at a line feed, at EOF, at a Ctrl-Z (26) byte or
 * as soon as MAX_READ characters have been stored.  The stored length is
 * written to *iCharCount and the text is NUL terminated.
 *
 * Returns false only when the read ended on EOF or Ctrl-Z with nothing
 * stored; true otherwise.
 */
static HB_BOOL file_read( FILE *stream, char *string, int *iCharCount )
{
   int nStored = 0;

   memset( string, ' ', MAX_READ );

   while( nStored < MAX_READ )
   {
      int c = fgetc( stream );

      if( c == '\n' || c == EOF || c == 26 )
      {
         /* end of line or end of data */
         *iCharCount = nStored;
         string[ nStored ] = '\0';
         return c == '\n' || nStored;
      }

      if( c != '\r' )
         string[ nStored++ ] = ( char ) c;
   }

   /* buffer is full: hand back what we have, the rest of the physical
      line is delivered by the following call(s) */
   *iCharCount = nStored;
   string[ MAX_READ ] = '\0';
   return HB_TRUE;
}
/*----------------------------------------------------------------------------*/
/*
 * FPARSE( cFile, [cDelimiter] ) -> aLines
 *
 * Reads cFile line by line and splits every line with hb_tokensplit().
 * Returns an array holding one sub-array of tokens per line.  The
 * delimiter is the first byte of cDelimiter, or a comma when the second
 * parameter is not a string.  An empty array is returned when the file
 * name is missing, empty, or the file cannot be opened.
 */
HB_FUNC( FPARSE )
{
   PHB_ITEM pSrc = hb_param( 1, HB_IT_STRING );
   PHB_ITEM pDelim = hb_param( 2, HB_IT_STRING );
   FILE * hSource = NULL;

   /* only try to open when a non-empty file name was passed */
   if( pSrc && hb_itemGetCLen( pSrc ) != 0 )
      hSource = hb_fopen( hb_itemGetCPtr( pSrc ), "r" );

   if( hSource )
   {
      /* comma, chr(44), is the default delimiter */
      BYTE cSeparator = pDelim ? ( BYTE ) hb_itemGetCPtr( pDelim )[ 0 ] : ( BYTE ) 44;
      PHB_ITEM pLines = hb_itemArrayNew( 0 );
      PHB_ITEM pFields = hb_itemNew( NULL );
      char * szLine = ( char * ) hb_xgrab( MAX_READ + 1 );
      int iLineLen = 0;

      while( file_read( hSource, szLine, &iLineLen ) )
      {
         int iFields = 0;
         int iPos = 0;
         char ** ppField = hb_tokensplit( szLine, cSeparator, iLineLen, &iFields );

         /* rebuild the per-line array and fill it with the tokens */
         hb_arrayNew( pFields, iFields );
         while( ppField[ iPos ] )
         {
            hb_arraySetC( pFields, iPos + 1, ppField[ iPos ] );
            ++iPos;
         }
         hb_arrayAddForward( pLines, pFields );

         /* the slot in front of the token list holds the token buffer */
         hb_xfree( ppField[ -1 ] );
         hb_xfree( ppField - 1 );
      }

      hb_itemReturnRelease( pLines );
      hb_itemRelease( pFields );
      hb_xfree( szLine );
      fclose( hSource );
   }
   else
      hb_reta( 0 );
}
/*----------------------------------------------------------------------------*/
/*
 * FPARSEEX( cFile, [cDelimiter] ) -> aLines
 *
 * Same file loop as FPARSE(), but every line is split by hb_ParseLine().
 * Returns an array holding one sub-array of fields per line.  The
 * delimiter is the first byte of cDelimiter, or a comma when the second
 * parameter is not a string.  An empty array is returned when the file
 * name is missing, empty, or the file cannot be opened.
 */
HB_FUNC( FPARSEEX )
{
   PHB_ITEM pSrc = hb_param( 1, HB_IT_STRING );
   PHB_ITEM pDelim = hb_param( 2, HB_IT_STRING );
   FILE * hSource = NULL;

   /* only try to open when a non-empty file name was passed */
   if( pSrc && hb_itemGetCLen( pSrc ) != 0 )
      hSource = hb_fopen( hb_itemGetCPtr( pSrc ), "r" );

   if( hSource )
   {
      /* comma, chr(44), is the default delimiter */
      BYTE cSeparator = pDelim ? ( BYTE ) hb_itemGetCPtr( pDelim )[ 0 ] : ( BYTE ) 44;
      PHB_ITEM pLines = hb_itemArrayNew( 0 );
      PHB_ITEM pFields = hb_itemNew( NULL );
      char * szLine = ( char * ) hb_xgrab( MAX_READ + 1 );
      int iLineLen = 0;

      while( file_read( hSource, szLine, &iLineLen ) )
      {
         int iFields = 0;

         /* start every line with a fresh, empty field array */
         hb_arrayNew( pFields, 0 );
         hb_ParseLine( pFields, szLine, cSeparator, &iFields );
         hb_arrayAddForward( pLines, pFields );
      }

      hb_itemReturnRelease( pLines );
      hb_itemRelease( pFields );
      hb_xfree( szLine );
      fclose( hSource );
   }
   else
      hb_reta( 0 );
}
/*----------------------------------------------------------------------------*/
/*
 * FWORDCOUNT( cFile ) -> nWords
 *
 * Adds up, over all lines of cFile, the number of space separated tokens
 * reported by hb_tokensplit().  Returns 0 when the file name is missing,
 * empty, or the file cannot be opened.
 */
HB_FUNC( FWORDCOUNT )
{
   PHB_ITEM pSrc = hb_param( 1, HB_IT_STRING );
   FILE * hSource = NULL;

   /* only try to open when a non-empty file name was passed */
   if( pSrc && hb_itemGetCLen( pSrc ) != 0 )
      hSource = hb_fopen( hb_itemGetCPtr( pSrc ), "r" );

   if( ! hSource )
      hb_retni( 0 );
   else
   {
      BYTE cBlank = ' ';
      ULONG ulTotal = 0;
      int iLineLen = 0;
      char * szLine = ( char * ) hb_xgrab( MAX_READ + 1 );

      while( file_read( hSource, szLine, &iLineLen ) )
      {
         int iWords = 0;
         char ** ppWord = hb_tokensplit( szLine, cBlank, iLineLen, &iWords );

         ulTotal = ulTotal + iWords;

         /* only the count is needed: drop the token buffer and the list */
         hb_xfree( ppWord[ -1 ] );
         hb_xfree( ppWord - 1 );
      }

      hb_retnl( ulTotal );

      hb_xfree( szLine );
      fclose( hSource );
   }
}
/*----------------------------------------------------------------------------*/
/*
 * FLINECOUNT( cFile ) -> nLines
 *
 * Returns the number of line feed characters found in cFile, or 0 when
 * the file name is missing, empty, or the file cannot be opened.
 */
HB_FUNC( FLINECOUNT )
{
   PHB_ITEM pSrc = hb_param( 1, HB_IT_STRING );
   FILE * hSource = NULL;

   /* only try to open when a non-empty file name was passed */
   if( pSrc && hb_itemGetCLen( pSrc ) != 0 )
      hSource = hb_fopen( hb_itemGetCPtr( pSrc ), "r" );

   if( ! hSource )
      hb_retni( 0 );
   else
   {
      ULONG ulLines = 0;
      int c;

      /* scan the whole file, one character at a time */
      for( c = fgetc( hSource ); c != EOF; c = fgetc( hSource ) )
      {
         if( c == '\n' )
            ++ulLines;
      }

      hb_retnl( ulLines );
      fclose( hSource );
   }
}
/*----------------------------------------------------------------------------*/
/*
 * FCHARCOUNT( cFile ) -> nChars
 *
 * Returns the number of characters in cFile that are not a line feed,
 * carriage return, space or tab.  Returns 0 when the file name is
 * missing, empty, or the file cannot be opened.
 */
HB_FUNC( FCHARCOUNT )
{
   PHB_ITEM pSrc = hb_param( 1, HB_IT_STRING );
   FILE * hSource = NULL;

   /* only try to open when a non-empty file name was passed */
   if( pSrc && hb_itemGetCLen( pSrc ) != 0 )
      hSource = hb_fopen( hb_itemGetCPtr( pSrc ), "r" );

   if( ! hSource )
      hb_retni( 0 );
   else
   {
      ULONG ulChars = 0;
      int c;

      for( c = fgetc( hSource ); c != EOF; c = fgetc( hSource ) )
      {
         /* the four white space characters are not counted */
         if( c != '\n' && c != '\r' && c != ' ' && c != '\t' )
            ++ulChars;
      }

      hb_retnl( ulChars );
      fclose( hSource );
   }
}
/*----------------------------------------------------------------------------*/
HB_FUNC( FPARSELINE )
{
PHB_ITEM pArray;
int iWords = 0;
const char * szText;
pArray = hb_itemArrayNew( 0 );
szText = hb_parc( 1 );
if( szText )
{
const char * szDelim = hb_parc( 2 );
hb_ParseLine( pArray, szText, szDelim ? ( unsigned char ) *szDelim : ',', &iWords );
}
hb_itemReturnRelease( pArray );
hb_stornl( iWords, 3 );
}