added qse_mbsspltrn()/qse_wcsspltrn()/qse_mbsspl()/qse_wcsspl()

This commit is contained in:
2011-04-08 00:46:25 +00:00
parent f7ebae421f
commit c0afd55a3a
9 changed files with 839 additions and 425 deletions

View File

@ -10,8 +10,8 @@ libqsecmn_la_SOURCES = \
syscall.h mem.h \
mem.c xma.c fma.c chr.c chr_cnv.c rex.c \
str_bas.c str_cat.c str_chr.c str_cnv.c str_cmp.c str_cpy.c str_dup.c \
str_dyn.c str_fcpy.c str_len.c str_pbrk.c str_put.c str_spn.c str_str.c \
str_subst.c str_utl.c str_word.c \
str_dyn.c str_fcpy.c str_len.c str_pbrk.c str_put.c str_spl.c \
str_spn.c str_str.c str_subst.c str_utl.c str_word.c \
lda.c oht.c htb.c rbt.c sll.c gdl.c dll.c opt.c \
tio.c tio_get.c tio_put.c \
fio.c pio.c sio.c \

View File

@ -75,7 +75,7 @@ libqsecmn_la_DEPENDENCIES =
am_libqsecmn_la_OBJECTS = mem.lo xma.lo fma.lo chr.lo chr_cnv.lo \
rex.lo str_bas.lo str_cat.lo str_chr.lo str_cnv.lo str_cmp.lo \
str_cpy.lo str_dup.lo str_dyn.lo str_fcpy.lo str_len.lo \
str_pbrk.lo str_put.lo str_spn.lo str_str.lo str_subst.lo \
str_pbrk.lo str_put.lo str_spl.lo str_spn.lo str_str.lo str_subst.lo \
str_utl.lo str_word.lo lda.lo oht.lo htb.lo rbt.lo sll.lo \
gdl.lo dll.lo opt.lo tio.lo tio_get.lo tio_put.lo fio.lo \
pio.lo sio.lo alg_search.lo alg_sort.lo time.lo misc.lo \
@ -268,8 +268,8 @@ libqsecmn_la_SOURCES = \
syscall.h mem.h \
mem.c xma.c fma.c chr.c chr_cnv.c rex.c \
str_bas.c str_cat.c str_chr.c str_cnv.c str_cmp.c str_cpy.c str_dup.c \
str_dyn.c str_fcpy.c str_len.c str_pbrk.c str_put.c str_spn.c str_str.c \
str_subst.c str_utl.c str_word.c \
str_dyn.c str_fcpy.c str_len.c str_pbrk.c str_put.c str_spl.c \
str_spn.c str_str.c str_subst.c str_utl.c str_word.c \
lda.c oht.c htb.c rbt.c sll.c gdl.c dll.c opt.c \
tio.c tio_get.c tio_put.c \
fio.c pio.c sio.c \
@ -399,6 +399,7 @@ distclean-compile:
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_len.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_pbrk.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_put.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_spl.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_spn.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_str.Plo@am__quote@
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/str_subst.Plo@am__quote@

594
qse/lib/cmn/str_spl.c Normal file
View File

@ -0,0 +1,594 @@
/*
* $Id$
*
Copyright 2006-2009 Chung, Hyung-Hwan.
This file is part of QSE.
QSE is free software: you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as
published by the Free Software Foundation, either version 3 of
the License, or (at your option) any later version.
QSE is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with QSE. If not, see <http://www.gnu.org/licenses/>.
*/
#include <qse/cmn/str.h>
#include <qse/cmn/chr.h>
/*
 * Translates the character that follows an escape character.
 *
 * "trset" is read as a sequence of (from, to) character pairs. If *c equals
 * the "from" character of a pair, it is replaced with the "to" character of
 * that pair. The set is walked strictly pair by pair so that a "to" character
 * is never mistaken for a "from" character, and a dangling last character in
 * an odd-length set is ignored instead of storing a NUL into the string.
 */
static void mbs_translate_escaped (qse_mchar_t* c, const qse_mchar_t* trset)
{
	const qse_mchar_t* t;

	for (t = trset; t[0] != QSE_MT('\0') && t[1] != QSE_MT('\0'); t += 2)
	{
		if (*c == t[0])
		{
			*c = t[1];
			break;
		}
	}
}

/*
 * Splits the string "s" into fields in place.
 *
 * s      - the string to split; it is modified in place. Every field is
 *          terminated with a NUL character.
 * delim  - selects the splitting mode:
 *          QSE_NULL: no splitting; leading and trailing space characters
 *            are cut off "s" (a string starting with "lquote" is unquoted).
 *          only space characters (or empty): fields are separated by runs
 *            of space characters.
 *          at least one non-space character: fields are separated by any
 *            character in "delim"; space characters around unquoted fields
 *            are removed and a trailing delimiter yields a last empty field.
 * lquote - opening quote character, or NUL to disable quoting.
 * rquote - closing quote character.
 * escape - escape character honoured inside a quoted field, or NUL to
 *          disable it. The escape character itself is removed.
 * trset  - (from, to) character pairs used to translate the character
 *          following an escape character, or QSE_NULL for no translation.
 *
 * Returns the number of fields, or -1 if a quoted field is not closed or,
 * when delimiters are in use, a quoted field is followed by something other
 * than space characters, a delimiter or the end of the string.
 */
int qse_mbsspltrn (
	qse_mchar_t* s, const qse_mchar_t* delim,
	qse_mchar_t lquote, qse_mchar_t rquote,
	qse_mchar_t escape, const qse_mchar_t* trset)
{
	qse_mchar_t* p = s, *d;
	qse_mchar_t* sp = QSE_NULL, * ep = QSE_NULL;
	int delim_mode;
	int cnt = 0;

	if (delim == QSE_NULL) delim_mode = 0;
	else
	{
		/* mode 1 unless a non-space delimiter is present */
		delim_mode = 1;
		for (d = (qse_mchar_t*)delim; *d != QSE_MT('\0'); d++)
			if (!QSE_ISMSPACE(*d)) delim_mode = 2;
	}

	if (delim_mode == 0)
	{
		/* skip preceding space characters */
		while (QSE_ISMSPACE(*p)) p++;

		/* when 0 is given as "delim", it has an effect of cutting
		   preceding and trailing space characters off "s". */
		if (lquote != QSE_MT('\0') && *p == lquote)
		{
			/* drop the opening quote */
			qse_mbscpy (p, p + 1);

			for (;;)
			{
				/* end of string before the closing quote */
				if (*p == QSE_MT('\0')) return -1;

				if (escape != QSE_MT('\0') && *p == escape)
				{
					if (trset != QSE_NULL && p[1] != QSE_MT('\0'))
						mbs_translate_escaped (&p[1], trset);

					/* drop the escape character; the escaped
					   character now sits at p */
					qse_mbscpy (p, p + 1);
				}
				else
				{
					if (*p == rquote)
					{
						p++;
						break;
					}
				}

				/* remember the first and the last character
				   of the quoted text */
				if (sp == QSE_NULL) sp = p;
				ep = p;
				p++;
			}

			/* only space characters may follow the closing quote */
			while (QSE_ISMSPACE(*p)) p++;
			if (*p != QSE_MT('\0')) return -1;

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_MT('\0');
			else
			{
				ep[1] = QSE_MT('\0');
				if (s != (qse_mchar_t*)sp) qse_mbscpy (s, sp);
				cnt++;
			}
		}
		else
		{
			/* locate the first and the last non-space character */
			while (*p)
			{
				if (!QSE_ISMSPACE(*p))
				{
					if (sp == QSE_NULL) sp = p;
					ep = p;
				}
				p++;
			}

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_MT('\0');
			else
			{
				ep[1] = QSE_MT('\0');
				if (s != (qse_mchar_t*)sp) qse_mbscpy (s, sp);
				cnt++;
			}
		}
	}
	else if (delim_mode == 1)
	{
		qse_mchar_t* o;

		while (*p)
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISMSPACE(*p)) p++;
			if (o != p) { qse_mbscpy (o, p); p = o; }

			if (lquote != QSE_MT('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_mbscpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_MT('\0')) return -1;

					if (escape != QSE_MT('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_MT('\0'))
							mbs_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_mbscpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_MT('\0');
							cnt++;
							break;
						}
					}
					p++;
				}
			}
			else
			{
				o = p;
				for (;;)
				{
					if (*p == QSE_MT('\0'))
					{
						/* count the last field only
						   if it is not empty */
						if (o != p) cnt++;
						break;
					}
					if (QSE_ISMSPACE (*p))
					{
						*p++ = QSE_MT('\0');
						cnt++;
						break;
					}
					p++;
				}
			}
		}
	}
	else /* if (delim_mode == 2) */
	{
		qse_mchar_t* o;
		int ok;

		while (*p != QSE_MT('\0'))
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISMSPACE(*p)) p++;
			if (o != p) { qse_mbscpy (o, p); p = o; }

			if (lquote != QSE_MT('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_mbscpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_MT('\0')) return -1;

					if (escape != QSE_MT('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_MT('\0'))
							mbs_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_mbscpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_MT('\0');
							cnt++;
							break;
						}
					}
					p++;
				}

				/* a quoted field must be followed by the end of
				   the string or by a delimiter, optionally
				   preceded by space characters */
				ok = 0;
				while (QSE_ISMSPACE(*p)) p++;
				if (*p == QSE_MT('\0')) ok = 1;
				for (d = (qse_mchar_t*)delim; *d != QSE_MT('\0'); d++)
				{
					if (*p == *d)
					{
						ok = 1;
						/* drop the delimiter */
						qse_mbscpy (p, p + 1);
						break;
					}
				}
				if (ok == 0) return -1;
			}
			else
			{
				/* sp and ep track the first and the last
				   non-space character of the current field */
				o = p; sp = ep = QSE_NULL;

				for (;;)
				{
					if (*p == QSE_MT('\0'))
					{
						if (ep)
						{
							/* cut trailing space characters */
							ep[1] = QSE_MT('\0');
							p = &ep[1];
						}
						cnt++;
						break;
					}
					for (d = (qse_mchar_t*)delim; *d != QSE_MT('\0'); d++)
					{
						if (*p == *d)
						{
							if (sp == QSE_NULL)
							{
								/* empty field: pull the rest
								   of the string down to the
								   field start and overwrite
								   the delimiter */
								qse_mbscpy (o, p); p = o;
								*p++ = QSE_MT('\0');
							}
							else
							{
								/* squeeze out the space
								   characters around the field
								   and overwrite the delimiter
								   with the terminator */
								qse_mbscpy (&ep[1], p);
								qse_mbscpy (o, sp);
								o[ep - sp + 1] = QSE_MT('\0');
								p = &o[ep - sp + 2];
							}
							cnt++;
							/* last empty field after delim */
							if (*p == QSE_MT('\0')) cnt++;
							goto exit_point;
						}
					}

					if (!QSE_ISMSPACE (*p))
					{
						if (sp == QSE_NULL) sp = p;
						ep = p;
					}
					p++;
				}
			exit_point:
				;
			}
		}
	}

	return cnt;
}
/*
 * Splits the multi-byte string "s" in place like qse_mbsspltrn(), but
 * without a translation set: QSE_NULL is passed as "trset".
 * Returns whatever qse_mbsspltrn() returns.
 */
int qse_mbsspl (
	qse_mchar_t* s, const qse_mchar_t* delim,
	qse_mchar_t lquote, qse_mchar_t rquote, qse_mchar_t escape)
{
	int nfields;

	nfields = qse_mbsspltrn (s, delim, lquote, rquote, escape, QSE_NULL);
	return nfields;
}
/*
 * Translates the character that follows an escape character.
 *
 * "trset" is read as a sequence of (from, to) character pairs. If *c equals
 * the "from" character of a pair, it is replaced with the "to" character of
 * that pair. The set is walked strictly pair by pair so that a "to" character
 * is never mistaken for a "from" character, and a dangling last character in
 * an odd-length set is ignored instead of storing a NUL into the string.
 */
static void wcs_translate_escaped (qse_wchar_t* c, const qse_wchar_t* trset)
{
	const qse_wchar_t* t;

	for (t = trset; t[0] != QSE_WT('\0') && t[1] != QSE_WT('\0'); t += 2)
	{
		if (*c == t[0])
		{
			*c = t[1];
			break;
		}
	}
}

/*
 * Splits the wide-character string "s" into fields in place.
 *
 * s      - the string to split; it is modified in place. Every field is
 *          terminated with a NUL character.
 * delim  - selects the splitting mode:
 *          QSE_NULL: no splitting; leading and trailing space characters
 *            are cut off "s" (a string starting with "lquote" is unquoted).
 *          only space characters (or empty): fields are separated by runs
 *            of space characters.
 *          at least one non-space character: fields are separated by any
 *            character in "delim"; space characters around unquoted fields
 *            are removed and a trailing delimiter yields a last empty field.
 * lquote - opening quote character, or NUL to disable quoting.
 * rquote - closing quote character.
 * escape - escape character honoured inside a quoted field, or NUL to
 *          disable it. The escape character itself is removed.
 * trset  - (from, to) character pairs used to translate the character
 *          following an escape character, or QSE_NULL for no translation.
 *
 * Returns the number of fields, or -1 if a quoted field is not closed or,
 * when delimiters are in use, a quoted field is followed by something other
 * than space characters, a delimiter or the end of the string.
 */
int qse_wcsspltrn (
	qse_wchar_t* s, const qse_wchar_t* delim,
	qse_wchar_t lquote, qse_wchar_t rquote,
	qse_wchar_t escape, const qse_wchar_t* trset)
{
	qse_wchar_t* p = s, *d;
	qse_wchar_t* sp = QSE_NULL, * ep = QSE_NULL;
	int delim_mode;
	int cnt = 0;

	if (delim == QSE_NULL) delim_mode = 0;
	else
	{
		/* mode 1 unless a non-space delimiter is present */
		delim_mode = 1;
		for (d = (qse_wchar_t*)delim; *d != QSE_WT('\0'); d++)
			if (!QSE_ISWSPACE(*d)) delim_mode = 2;
	}

	if (delim_mode == 0)
	{
		/* skip preceding space characters */
		while (QSE_ISWSPACE(*p)) p++;

		/* when 0 is given as "delim", it has an effect of cutting
		   preceding and trailing space characters off "s". */
		if (lquote != QSE_WT('\0') && *p == lquote)
		{
			/* drop the opening quote */
			qse_wcscpy (p, p + 1);

			for (;;)
			{
				/* end of string before the closing quote */
				if (*p == QSE_WT('\0')) return -1;

				if (escape != QSE_WT('\0') && *p == escape)
				{
					if (trset != QSE_NULL && p[1] != QSE_WT('\0'))
						wcs_translate_escaped (&p[1], trset);

					/* drop the escape character; the escaped
					   character now sits at p */
					qse_wcscpy (p, p + 1);
				}
				else
				{
					if (*p == rquote)
					{
						p++;
						break;
					}
				}

				/* remember the first and the last character
				   of the quoted text */
				if (sp == QSE_NULL) sp = p;
				ep = p;
				p++;
			}

			/* only space characters may follow the closing quote */
			while (QSE_ISWSPACE(*p)) p++;
			if (*p != QSE_WT('\0')) return -1;

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_WT('\0');
			else
			{
				ep[1] = QSE_WT('\0');
				if (s != (qse_wchar_t*)sp) qse_wcscpy (s, sp);
				cnt++;
			}
		}
		else
		{
			/* locate the first and the last non-space character */
			while (*p)
			{
				if (!QSE_ISWSPACE(*p))
				{
					if (sp == QSE_NULL) sp = p;
					ep = p;
				}
				p++;
			}

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_WT('\0');
			else
			{
				ep[1] = QSE_WT('\0');
				if (s != (qse_wchar_t*)sp) qse_wcscpy (s, sp);
				cnt++;
			}
		}
	}
	else if (delim_mode == 1)
	{
		qse_wchar_t* o;

		while (*p)
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISWSPACE(*p)) p++;
			if (o != p) { qse_wcscpy (o, p); p = o; }

			if (lquote != QSE_WT('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_wcscpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_WT('\0')) return -1;

					if (escape != QSE_WT('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_WT('\0'))
							wcs_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_wcscpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_WT('\0');
							cnt++;
							break;
						}
					}
					p++;
				}
			}
			else
			{
				o = p;
				for (;;)
				{
					if (*p == QSE_WT('\0'))
					{
						/* count the last field only
						   if it is not empty */
						if (o != p) cnt++;
						break;
					}
					if (QSE_ISWSPACE (*p))
					{
						*p++ = QSE_WT('\0');
						cnt++;
						break;
					}
					p++;
				}
			}
		}
	}
	else /* if (delim_mode == 2) */
	{
		qse_wchar_t* o;
		int ok;

		while (*p != QSE_WT('\0'))
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISWSPACE(*p)) p++;
			if (o != p) { qse_wcscpy (o, p); p = o; }

			if (lquote != QSE_WT('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_wcscpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_WT('\0')) return -1;

					if (escape != QSE_WT('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_WT('\0'))
							wcs_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_wcscpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_WT('\0');
							cnt++;
							break;
						}
					}
					p++;
				}

				/* a quoted field must be followed by the end of
				   the string or by a delimiter, optionally
				   preceded by space characters */
				ok = 0;
				while (QSE_ISWSPACE(*p)) p++;
				if (*p == QSE_WT('\0')) ok = 1;
				for (d = (qse_wchar_t*)delim; *d != QSE_WT('\0'); d++)
				{
					if (*p == *d)
					{
						ok = 1;
						/* drop the delimiter */
						qse_wcscpy (p, p + 1);
						break;
					}
				}
				if (ok == 0) return -1;
			}
			else
			{
				/* sp and ep track the first and the last
				   non-space character of the current field */
				o = p; sp = ep = QSE_NULL;

				for (;;)
				{
					if (*p == QSE_WT('\0'))
					{
						if (ep)
						{
							/* cut trailing space characters */
							ep[1] = QSE_WT('\0');
							p = &ep[1];
						}
						cnt++;
						break;
					}
					for (d = (qse_wchar_t*)delim; *d != QSE_WT('\0'); d++)
					{
						if (*p == *d)
						{
							if (sp == QSE_NULL)
							{
								/* empty field: pull the rest
								   of the string down to the
								   field start and overwrite
								   the delimiter */
								qse_wcscpy (o, p); p = o;
								*p++ = QSE_WT('\0');
							}
							else
							{
								/* squeeze out the space
								   characters around the field
								   and overwrite the delimiter
								   with the terminator */
								qse_wcscpy (&ep[1], p);
								qse_wcscpy (o, sp);
								o[ep - sp + 1] = QSE_WT('\0');
								p = &o[ep - sp + 2];
							}
							cnt++;
							/* last empty field after delim */
							if (*p == QSE_WT('\0')) cnt++;
							goto exit_point;
						}
					}

					if (!QSE_ISWSPACE (*p))
					{
						if (sp == QSE_NULL) sp = p;
						ep = p;
					}
					p++;
				}
			exit_point:
				;
			}
		}
	}

	return cnt;
}
/*
 * Splits the wide-character string "s" in place like qse_wcsspltrn(), but
 * without a translation set: QSE_NULL is passed as "trset".
 * Returns whatever qse_wcsspltrn() returns.
 */
int qse_wcsspl (
	qse_wchar_t* s, const qse_wchar_t* delim,
	qse_wchar_t lquote, qse_wchar_t rquote, qse_wchar_t escape)
{
	int nfields;

	nfields = qse_wcsspltrn (s, delim, lquote, rquote, escape, QSE_NULL);
	return nfields;
}

View File

@ -1,5 +1,5 @@
/*
* $Id: str_utl.c 297 2009-10-08 13:09:19Z hyunghwan.chung $
* $Id: str_utl.c 427 2011-04-07 06:46:25Z hyunghwan.chung $
*
Copyright 2006-2009 Chung, Hyung-Hwan.
This file is part of QSE.
@ -22,296 +22,6 @@
#include <qse/cmn/chr.h>
#include "mem.h"
/*
 * ISSPACE(c) is non-zero if "c" is a space, horizontal tab, new line,
 * carriage return, vertical tab or form feed.
 * The vertical tab and form feed tests are OR'ed like the others; joining
 * them with && could never be true for a single character.
 * "c" is evaluated more than once, so it must not have side effects.
 */
#define ISSPACE(c) \
	((c) == QSE_T(' ') || (c) == QSE_T('\t') || (c) == QSE_T('\n') || \
	 (c) == QSE_T('\r') || (c) == QSE_T('\v') || (c) == QSE_T('\f'))
/*
 * Translates the character that follows an escape character.
 *
 * "trset" is read as a sequence of (from, to) character pairs. If *c equals
 * the "from" character of a pair, it is replaced with the "to" character of
 * that pair. The set is walked strictly pair by pair so that a "to" character
 * is never mistaken for a "from" character, and a dangling last character in
 * an odd-length set is ignored instead of storing a NUL into the string.
 */
static void str_translate_escaped (qse_char_t* c, const qse_char_t* trset)
{
	const qse_char_t* t;

	for (t = trset; t[0] != QSE_T('\0') && t[1] != QSE_T('\0'); t += 2)
	{
		if (*c == t[0])
		{
			*c = t[1];
			break;
		}
	}
}

/*
 * Splits the string "s" into fields in place.
 *
 * s      - the string to split; it is modified in place. Every field is
 *          terminated with a NUL character.
 * delim  - selects the splitting mode:
 *          QSE_NULL: no splitting; leading and trailing space characters
 *            are cut off "s" (a string starting with "lquote" is unquoted).
 *          only space characters (or empty): fields are separated by runs
 *            of space characters.
 *          at least one non-space character: fields are separated by any
 *            character in "delim"; space characters around unquoted fields
 *            are removed and a trailing delimiter yields a last empty field.
 * lquote - opening quote character, or NUL to disable quoting.
 * rquote - closing quote character.
 * escape - escape character honoured inside a quoted field, or NUL to
 *          disable it. The escape character itself is removed.
 * trset  - (from, to) character pairs used to translate the character
 *          following an escape character, or QSE_NULL for no translation.
 *
 * Returns the number of fields, or -1 if a quoted field is not closed or,
 * when delimiters are in use, a quoted field is followed by something other
 * than space characters, a delimiter or the end of the string.
 */
int qse_strspltrn (
	qse_char_t* s, const qse_char_t* delim,
	qse_char_t lquote, qse_char_t rquote,
	qse_char_t escape, const qse_char_t* trset)
{
	qse_char_t* p = s, *d;
	qse_char_t* sp = QSE_NULL, * ep = QSE_NULL;
	int delim_mode;
	int cnt = 0;

	if (delim == QSE_NULL) delim_mode = 0;
	else
	{
		/* mode 1 unless a non-space delimiter is present */
		delim_mode = 1;
		for (d = (qse_char_t*)delim; *d != QSE_T('\0'); d++)
			if (!QSE_ISSPACE(*d)) delim_mode = 2;
	}

	if (delim_mode == 0)
	{
		/* skip preceding space characters */
		while (QSE_ISSPACE(*p)) p++;

		/* when 0 is given as "delim", it has an effect of cutting
		   preceding and trailing space characters off "s". */
		if (lquote != QSE_T('\0') && *p == lquote)
		{
			/* drop the opening quote */
			qse_strcpy (p, p + 1);

			for (;;)
			{
				/* end of string before the closing quote */
				if (*p == QSE_T('\0')) return -1;

				if (escape != QSE_T('\0') && *p == escape)
				{
					if (trset != QSE_NULL && p[1] != QSE_T('\0'))
						str_translate_escaped (&p[1], trset);

					/* drop the escape character; the escaped
					   character now sits at p */
					qse_strcpy (p, p + 1);
				}
				else
				{
					if (*p == rquote)
					{
						p++;
						break;
					}
				}

				/* remember the first and the last character
				   of the quoted text */
				if (sp == QSE_NULL) sp = p;
				ep = p;
				p++;
			}

			/* only space characters may follow the closing quote */
			while (QSE_ISSPACE(*p)) p++;
			if (*p != QSE_T('\0')) return -1;

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_T('\0');
			else
			{
				ep[1] = QSE_T('\0');
				if (s != (qse_char_t*)sp) qse_strcpy (s, sp);
				cnt++;
			}
		}
		else
		{
			/* locate the first and the last non-space character */
			while (*p)
			{
				if (!QSE_ISSPACE(*p))
				{
					if (sp == QSE_NULL) sp = p;
					ep = p;
				}
				p++;
			}

			if (sp == QSE_NULL && ep == QSE_NULL) s[0] = QSE_T('\0');
			else
			{
				ep[1] = QSE_T('\0');
				if (s != (qse_char_t*)sp) qse_strcpy (s, sp);
				cnt++;
			}
		}
	}
	else if (delim_mode == 1)
	{
		qse_char_t* o;

		while (*p)
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISSPACE(*p)) p++;
			if (o != p) { qse_strcpy (o, p); p = o; }

			if (lquote != QSE_T('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_strcpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_T('\0')) return -1;

					if (escape != QSE_T('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_T('\0'))
							str_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_strcpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_T('\0');
							cnt++;
							break;
						}
					}
					p++;
				}
			}
			else
			{
				o = p;
				for (;;)
				{
					if (*p == QSE_T('\0'))
					{
						/* count the last field only
						   if it is not empty */
						if (o != p) cnt++;
						break;
					}
					if (QSE_ISSPACE (*p))
					{
						*p++ = QSE_T('\0');
						cnt++;
						break;
					}
					p++;
				}
			}
		}
	}
	else /* if (delim_mode == 2) */
	{
		qse_char_t* o;
		int ok;

		while (*p != QSE_T('\0'))
		{
			/* remove the space characters in front of the field */
			o = p;
			while (QSE_ISSPACE(*p)) p++;
			if (o != p) { qse_strcpy (o, p); p = o; }

			if (lquote != QSE_T('\0') && *p == lquote)
			{
				/* drop the opening quote */
				qse_strcpy (p, p + 1);

				for (;;)
				{
					/* end of string before the closing quote */
					if (*p == QSE_T('\0')) return -1;

					if (escape != QSE_T('\0') && *p == escape)
					{
						if (trset != QSE_NULL && p[1] != QSE_T('\0'))
							str_translate_escaped (&p[1], trset);

						/* drop the escape character */
						qse_strcpy (p, p + 1);
					}
					else
					{
						if (*p == rquote)
						{
							/* the closing quote becomes
							   the field terminator */
							*p++ = QSE_T('\0');
							cnt++;
							break;
						}
					}
					p++;
				}

				/* a quoted field must be followed by the end of
				   the string or by a delimiter, optionally
				   preceded by space characters */
				ok = 0;
				while (QSE_ISSPACE(*p)) p++;
				if (*p == QSE_T('\0')) ok = 1;
				for (d = (qse_char_t*)delim; *d != QSE_T('\0'); d++)
				{
					if (*p == *d)
					{
						ok = 1;
						/* drop the delimiter */
						qse_strcpy (p, p + 1);
						break;
					}
				}
				if (ok == 0) return -1;
			}
			else
			{
				/* sp and ep track the first and the last
				   non-space character of the current field */
				o = p; sp = ep = QSE_NULL;

				for (;;)
				{
					if (*p == QSE_T('\0'))
					{
						if (ep)
						{
							/* cut trailing space characters */
							ep[1] = QSE_T('\0');
							p = &ep[1];
						}
						cnt++;
						break;
					}
					for (d = (qse_char_t*)delim; *d != QSE_T('\0'); d++)
					{
						if (*p == *d)
						{
							if (sp == QSE_NULL)
							{
								/* empty field: pull the rest
								   of the string down to the
								   field start and overwrite
								   the delimiter */
								qse_strcpy (o, p); p = o;
								*p++ = QSE_T('\0');
							}
							else
							{
								/* squeeze out the space
								   characters around the field
								   and overwrite the delimiter
								   with the terminator */
								qse_strcpy (&ep[1], p);
								qse_strcpy (o, sp);
								o[ep - sp + 1] = QSE_T('\0');
								p = &o[ep - sp + 2];
							}
							cnt++;
							/* last empty field after delim */
							if (*p == QSE_T('\0')) cnt++;
							goto exit_point;
						}
					}

					if (!QSE_ISSPACE (*p))
					{
						if (sp == QSE_NULL) sp = p;
						ep = p;
					}
					p++;
				}
			exit_point:
				;
			}
		}
	}

	return cnt;
}
/*
 * Splits the string "s" in place like qse_strspltrn(), but without a
 * translation set: QSE_NULL is passed as "trset".
 * Returns whatever qse_strspltrn() returns.
 */
int qse_strspl (
	qse_char_t* s, const qse_char_t* delim,
	qse_char_t lquote, qse_char_t rquote, qse_char_t escape)
{
	int nfields;

	nfields = qse_strspltrn (s, delim, lquote, rquote, escape, QSE_NULL);
	return nfields;
}
qse_char_t* qse_strtrmx (qse_char_t* str, int opt)
{
qse_char_t* p = str;