219 lines
6.7 KiB
C
219 lines
6.7 KiB
C
|
const char ssplit_rcs[] = "$Id: ssplit.c,v 1.9 2007/11/03 14:35:45 fabiankeil Exp $";
|
|||
|
/*********************************************************************
|
|||
|
*
|
|||
|
* File : $Source: /cvsroot/ijbswa/current/ssplit.c,v $
|
|||
|
*
|
|||
|
* Purpose : A function to split a string at specified delimiters.
|
|||
|
*
|
|||
|
* Copyright : Written by and Copyright (C) 2001 the SourceForge
|
|||
|
* Privoxy team. http://www.privoxy.org/
|
|||
|
*
|
|||
|
* Based on the Internet Junkbuster originally written
|
|||
|
* by and Copyright (C) 1997 Anonymous Coders and
|
|||
|
* Junkbusters Corporation. http://www.junkbusters.com
|
|||
|
*
|
|||
|
* This program is free software; you can redistribute it
|
|||
|
* and/or modify it under the terms of the GNU General
|
|||
|
* Public License as published by the Free Software
|
|||
|
* Foundation; either version 2 of the License, or (at
|
|||
|
* your option) any later version.
|
|||
|
*
|
|||
|
* This program is distributed in the hope that it will
|
|||
|
* be useful, but WITHOUT ANY WARRANTY; without even the
|
|||
|
* implied warranty of MERCHANTABILITY or FITNESS FOR A
|
|||
|
* PARTICULAR PURPOSE. See the GNU General Public
|
|||
|
* License for more details.
|
|||
|
*
|
|||
|
* The GNU General Public License should be included with
|
|||
|
* this file. If not, you can view it at
|
|||
|
* http://www.gnu.org/copyleft/gpl.html
|
|||
|
* or write to the Free Software Foundation, Inc., 59
|
|||
|
* Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|||
|
*
|
|||
|
* Revisions :
|
|||
|
* $Log: ssplit.c,v $
|
|||
|
* Revision 1.9 2007/11/03 14:35:45 fabiankeil
|
|||
|
* Fix spelling in Purpose line. Patch submitted by Simon Ruderich.
|
|||
|
*
|
|||
|
* Revision 1.8 2006/07/18 14:48:47 david__schmidt
|
|||
|
* Reorganizing the repository: swapping out what was HEAD (the old 3.1 branch)
|
|||
|
* with what was really the latest development (the v_3_0_branch branch)
|
|||
|
*
|
|||
|
* Revision 1.6 2002/03/26 22:29:55 swa
|
|||
|
* we have a new homepage!
|
|||
|
*
|
|||
|
* Revision 1.5 2002/03/24 13:25:43 swa
|
|||
|
* name change related issues
|
|||
|
*
|
|||
|
* Revision 1.4 2001/11/13 00:16:38 jongfoster
|
|||
|
* Replacing references to malloc.h with the standard stdlib.h
|
|||
|
* (See ANSI or K&R 2nd Ed)
|
|||
|
*
|
|||
|
* Revision 1.3 2001/05/29 08:54:25 jongfoster
|
|||
|
* Rewrote the innards of ssplit() to be easier to understand,
|
|||
|
* faster, and to use less memory. Didn't change the interface
|
|||
|
* except to give the parameters meaningful names.
|
|||
|
*
|
|||
|
* Revision 1.2 2001/05/17 23:01:01 oes
|
|||
|
* - Cleaned CRLF's from the sources and related files
|
|||
|
*
|
|||
|
* Revision 1.1.1.1 2001/05/15 13:59:04 oes
|
|||
|
* Initial import of version 2.9.3 source tree
|
|||
|
*
|
|||
|
*
|
|||
|
*********************************************************************/
|
|||
|
|
|||
|
|
|||
|
#include "config.h"
|
|||
|
|
|||
|
#include <string.h>
|
|||
|
#include <stdlib.h>
|
|||
|
|
|||
|
#include "ssplit.h"
|
|||
|
#include "miscutil.h"
|
|||
|
|
|||
|
const char ssplit_h_rcs[] = SSPLIT_H_VERSION;
|
|||
|
|
|||
|
/* Define this for lots of debugging information to stdout */
|
|||
|
#undef SSPLIT_VERBOSE
|
|||
|
/* #define SSPLIT_VERBOSE 1 */
|
|||
|
|
|||
|
|
|||
|
/*********************************************************************
|
|||
|
*
|
|||
|
* Function : ssplit
|
|||
|
*
|
|||
|
* Description : Split a string using delimiters in `delim'. Results
|
|||
|
* go into `vec'.
|
|||
|
*
|
|||
|
* Parameters :
|
|||
|
* 1 : str = string to split. Will be split in place
|
|||
|
* (i.e. do not free until you've finished with vec,
|
|||
|
* previous contents will be trashed by the call).
|
|||
|
* 2 : delim = array of delimiters (if NULL, uses " \t").
|
|||
|
* 3 : vec[] = results vector (aka. array) [out]
|
|||
|
* 4 : vec_len = number of usable slots in the vector (aka. array size)
|
|||
|
* 5 : dont_save_empty_fields = zero if consecutive delimiters
|
|||
|
* give a null output field(s), nonzero if they are just
|
|||
|
* to be considered as single delimeter
|
|||
|
* 6 : ignore_leading = nonzero to ignore leading field
|
|||
|
* separators.
|
|||
|
*
|
|||
|
* Returns : -1 => Error: vec_len is too small to hold all the
|
|||
|
* data, or str == NULL.
|
|||
|
* >=0 => the number of fields put in `vec'.
|
|||
|
* On error, vec and str may still have been overwritten.
|
|||
|
*
|
|||
|
*********************************************************************/
|
|||
|
int ssplit(char *str, const char *delim, char *vec[], int vec_len,
|
|||
|
int dont_save_empty_fields, int ignore_leading)
|
|||
|
{
|
|||
|
unsigned char is_delim[256];
|
|||
|
unsigned char char_type;
|
|||
|
int vec_count = 0;
|
|||
|
|
|||
|
if (!str)
|
|||
|
{
|
|||
|
return(-1);
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
/* Build is_delim array */
|
|||
|
|
|||
|
memset(is_delim, '\0', sizeof(is_delim));
|
|||
|
|
|||
|
if (!delim)
|
|||
|
{
|
|||
|
delim = " \t"; /* default field separators */
|
|||
|
}
|
|||
|
|
|||
|
while (*delim)
|
|||
|
{
|
|||
|
is_delim[(unsigned)(unsigned char)*delim++] = 1; /* separator */
|
|||
|
}
|
|||
|
|
|||
|
is_delim[(unsigned)(unsigned char)'\0'] = 2; /* terminator */
|
|||
|
is_delim[(unsigned)(unsigned char)'\n'] = 2; /* terminator */
|
|||
|
|
|||
|
|
|||
|
/* Parse string */
|
|||
|
|
|||
|
if (ignore_leading)
|
|||
|
{
|
|||
|
/* skip leading separators */
|
|||
|
while (is_delim[(unsigned)(unsigned char)*str] == 1)
|
|||
|
{
|
|||
|
str++;
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
/* first pointer is the beginning of string */
|
|||
|
/* Check if we want to save this field */
|
|||
|
if ( (!dont_save_empty_fields)
|
|||
|
|| (is_delim[(unsigned)(unsigned char)*str] == 0) )
|
|||
|
{
|
|||
|
/*
|
|||
|
* We want empty fields, or the first character in this
|
|||
|
* field is not a delimiter or the end of string.
|
|||
|
* So save it.
|
|||
|
*/
|
|||
|
if (vec_count >= vec_len)
|
|||
|
{
|
|||
|
return(-1); /* overflow */
|
|||
|
}
|
|||
|
vec[vec_count++] = (char *) str;
|
|||
|
}
|
|||
|
|
|||
|
while ((char_type = is_delim[(unsigned)(unsigned char)*str]) != 2)
|
|||
|
{
|
|||
|
if (char_type == 1)
|
|||
|
{
|
|||
|
/* the char is a separator */
|
|||
|
|
|||
|
/* null terminate the substring */
|
|||
|
*str++ = '\0';
|
|||
|
|
|||
|
/* Check if we want to save this field */
|
|||
|
if ( (!dont_save_empty_fields)
|
|||
|
|| (is_delim[(unsigned)(unsigned char)*str] == 0) )
|
|||
|
{
|
|||
|
/*
|
|||
|
* We want empty fields, or the first character in this
|
|||
|
* field is not a delimiter or the end of string.
|
|||
|
* So save it.
|
|||
|
*/
|
|||
|
if (vec_count >= vec_len)
|
|||
|
{
|
|||
|
return(-1); /* overflow */
|
|||
|
}
|
|||
|
vec[vec_count++] = (char *) str;
|
|||
|
}
|
|||
|
}
|
|||
|
else
|
|||
|
{
|
|||
|
str++;
|
|||
|
}
|
|||
|
}
|
|||
|
*str = '\0'; /* null terminate the substring */
|
|||
|
|
|||
|
#ifdef SSPLIT_VERBOSE
|
|||
|
{
|
|||
|
int i;
|
|||
|
printf("dump %d strings\n", vec_count);
|
|||
|
for (i = 0; i < vec_count; i++)
|
|||
|
{
|
|||
|
printf("%d '%s'\n", i, vec[i]);
|
|||
|
}
|
|||
|
}
|
|||
|
#endif /* def SSPLIT_VERBOSE */
|
|||
|
|
|||
|
return(vec_count);
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
/*
|
|||
|
Local Variables:
|
|||
|
tab-width: 3
|
|||
|
end:
|
|||
|
*/
|