qse/ase/lib/awk/func.c

1413 lines
31 KiB
C

/*
* $Id: func.c 499 2008-12-16 09:42:48Z baconevi $
*
* {License}
*/
#include "awk.h"
/* Forward declarations of the intrinsic function handlers referenced by
 * the sys_bfn table below. All handlers share one signature: the run-time
 * context followed by a character pointer and a length (named fnm/fnl in
 * the definitions; presumably the invoked function name - none of the
 * handlers in this file reads them). Each handler returns 0 on success
 * and -1 on failure. */
static int bfn_close (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_fflush (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_index (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_length (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_substr (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_split (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_tolower (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_toupper (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_gsub (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_sub (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_match (ase_awk_run_t*, const ase_char_t*, ase_size_t);
static int bfn_sprintf (ase_awk_run_t*, const ase_char_t*, ase_size_t);
/* MAX is used below as the upper argument-count bound of sprintf, i.e.
 * "no practical limit" (presumably the largest ase_size_t value). */
#undef MAX
#define MAX ASE_TYPE_UNSIGNED_MAX(ase_size_t)
/* Table of the built-in (system) intrinsic functions. Each entry holds,
 * in order:
 *   - the function name and its length,
 *   - the option mask that must be enabled for the function to be
 *     available (0 means always available),
 *   - the minimum and maximum argument counts plus an optional
 *     per-argument spec string,
 *   - the handler.
 * In the spec strings used here the argument marked 'r' is the one the
 * handlers expect to be a reference (ASE_AWK_VAL_REF) and the one marked
 * 'x' is the one that may be a regular expression value; 'v' presumably
 * denotes a plain value - NOTE(review): confirm against the parser.
 * The table is terminated by an entry whose name pointer is ASE_NULL. */
static ase_awk_bfn_t sys_bfn[] =
{
/* io functions */
{ {ASE_T("close"), 5}, ASE_AWK_EXTIO, {1, 1, ASE_NULL}, bfn_close},
{ {ASE_T("fflush"), 6}, ASE_AWK_EXTIO, {0, 1, ASE_NULL}, bfn_fflush},
/* string functions */
{ {ASE_T("index"), 5}, 0, {2, 2, ASE_NULL}, bfn_index},
{ {ASE_T("substr"), 6}, 0, {2, 3, ASE_NULL}, bfn_substr},
{ {ASE_T("length"), 6}, 0, {1, 1, ASE_NULL}, bfn_length},
{ {ASE_T("split"), 5}, 0, {2, 3, ASE_T("vrv")}, bfn_split},
{ {ASE_T("tolower"), 7}, 0, {1, 1, ASE_NULL}, bfn_tolower},
{ {ASE_T("toupper"), 7}, 0, {1, 1, ASE_NULL}, bfn_toupper},
{ {ASE_T("gsub"), 4}, 0, {2, 3, ASE_T("xvr")}, bfn_gsub},
{ {ASE_T("sub"), 3}, 0, {2, 3, ASE_T("xvr")}, bfn_sub},
{ {ASE_T("match"), 5}, 0, {2, 2, ASE_T("vx")}, bfn_match},
{ {ASE_T("sprintf"), 7}, 0, {1, MAX, ASE_NULL}, bfn_sprintf},
/* sentinel */
{ {ASE_NULL, 0}, 0, {0, 0, ASE_NULL}, ASE_NULL}
};
/*
 * Registers a user-defined intrinsic function.
 *
 * awk        the awk object that receives the function
 * name       function name (name_len characters)
 * when_valid option mask controlling when the function is available
 * min_args   minimum number of arguments
 * max_args   maximum number of arguments
 * arg_spec   optional argument spec string; may be ASE_NULL
 * handler    the function implementation
 *
 * The descriptor, a copy of the name and a copy of the spec string are
 * carved out of a single allocation, so releasing the descriptor releases
 * everything.
 *
 * Returns the new descriptor, or ASE_NULL with the error set on awk when
 * the name is empty (EINVAL), already known (EEXIST) or memory runs out
 * (ENOMEM).
 */
void* ase_awk_addfunc (
	ase_awk_t* awk, const ase_char_t* name, ase_size_t name_len,
	int when_valid, ase_size_t min_args, ase_size_t max_args,
	const ase_char_t* arg_spec,
	int (*handler)(ase_awk_run_t*,const ase_char_t*,ase_size_t))
{
	ase_awk_bfn_t* entry;
	ase_size_t spec_len;
	ase_size_t total;

	if (name_len <= 0)
	{
		ase_awk_seterror (awk, ASE_AWK_EINVAL, 0, ASE_NULL, 0);
		return ASE_NULL;
	}

	if (ase_awk_getbfn (awk, name, name_len) != ASE_NULL)
	{
		/* the name is already taken by another function */
		ase_cstr_t dup;

		dup.ptr = name;
		dup.len = name_len;

		ase_awk_seterror (awk, ASE_AWK_EEXIST, 0, &dup, 1);
		return ASE_NULL;
	}

	spec_len = 0;
	if (arg_spec != ASE_NULL) spec_len = ase_strlen(arg_spec);

	/* descriptor + name + terminator + spec + terminator */
	total = ASE_SIZEOF(ase_awk_bfn_t) +
	        (name_len+1) * ASE_SIZEOF(ase_char_t) +
	        (spec_len+1) * ASE_SIZEOF(ase_char_t);

	entry = (ase_awk_bfn_t*) ASE_AWK_ALLOC (awk, total);
	if (entry == ASE_NULL)
	{
		ase_awk_seterrnum (awk, ASE_AWK_ENOMEM);
		return ASE_NULL;
	}

	/* the name copy lives right behind the descriptor */
	entry->name.ptr = (ase_char_t*)(entry + 1);
	entry->name.len = name_len;
	ase_strxncpy (entry->name.ptr, name_len+1, name, name_len);

	entry->valid = when_valid;
	entry->arg.min = min_args;
	entry->arg.max = max_args;

	if (arg_spec != ASE_NULL)
	{
		/* the spec copy follows the name and its terminator */
		entry->arg.spec = entry->name.ptr + entry->name.len + 1;
		ase_strxcpy (entry->arg.spec, spec_len+1, arg_spec);
	}
	else
	{
		entry->arg.spec = ASE_NULL;
	}

	entry->handler = handler;

	if (ase_map_insert (awk->bfn.user,
		(ase_char_t*)name, name_len, entry, 0) == ASE_NULL)
	{
		ASE_AWK_FREE (awk, entry);
		ase_awk_seterrnum (awk, ASE_AWK_ENOMEM);
		return ASE_NULL;
	}

	return entry;
}
/*
 * Removes the user-defined intrinsic function called 'name'.
 *
 * Returns 0 on success. If the user function map reports a failure (-1),
 * ASE_AWK_ENOENT is set on awk with the name as the error argument and
 * -1 is returned.
 */
int ase_awk_delfunc (
	ase_awk_t* awk, const ase_char_t* name, ase_size_t name_len)
{
	ase_cstr_t missing;

	if (ase_map_delete (awk->bfn.user, name, name_len) != -1) return 0;

	missing.ptr = name;
	missing.len = name_len;

	ase_awk_seterror (awk, ASE_AWK_ENOENT, 0, &missing, 1);
	return -1;
}
/*
 * Drops every user-defined intrinsic function registered on awk by
 * clearing the user function map. The system table is not affected.
 */
void ase_awk_clrbfn (ase_awk_t* awk)
{
	ase_map_clear (
		awk->bfn.user);
}
/*
 * Looks up an intrinsic function by name.
 *
 * The system table (sys_bfn) is searched first, comparing against the
 * customized spelling from the word table (awk->wtab) when one exists.
 * If nothing matches, the name is translated through the reverse word
 * table (awk->rwtab) / word table and looked up in the user function map.
 *
 * Returns the function descriptor, or ASE_NULL if the name is unknown or
 * the function is disabled by the current options.
 */
ase_awk_bfn_t* ase_awk_getbfn (
ase_awk_t* awk, const ase_char_t* name, ase_size_t len)
{
ase_awk_bfn_t* bfn;
ase_map_pair_t* pair;
const ase_char_t* k;
ase_size_t l;
/* search the system function table */
for (bfn = sys_bfn; bfn->name.ptr != ASE_NULL; bfn++)
{
/* skip an entry unless every option bit it requires is enabled */
if (bfn->valid != 0 &&
(awk->option & bfn->valid) != bfn->valid) continue;
pair = ase_map_search (
awk->wtab, bfn->name.ptr, bfn->name.len);
if (pair != ASE_NULL)
{
/* found in the customized word table:
 * compare against the replacement spelling */
k = ASE_MAP_VPTR(pair);
l = ASE_MAP_VLEN(pair);
}
else
{
/* no customization: compare against the original name */
k = bfn->name.ptr;
l = bfn->name.len;
}
if (ase_strxncmp (k, l, name, len) == 0) return bfn;
}
/* NOTE: I suspect this block of code might be very fragile
 * because I'm trying to support ase_awk_setword in
 * a very flimsy way here. Would it be better to drop
 * ase_awk_setword totally? */
pair = ase_map_search (awk->rwtab, name, len);
if (pair != ASE_NULL)
{
/* the current name is a target name for
 * one of the original words; use the mapped value
 * as the key for the user function map. */
k = ASE_MAP_VPTR(pair);
l = ASE_MAP_VLEN(pair);
}
else
{
pair = ase_map_search (awk->wtab, name, len);
if (pair != ASE_NULL)
{
k = ASE_MAP_VPTR(pair);
l = ASE_MAP_VLEN(pair);
if (ase_strxncmp (name, len, k, l) != 0)
{
/* the name is not a target name but has
 * a target name different from itself, so
 * it cannot be an intrinsic function name.
 *
 * For instance, name is "sin" here after
 * ase_awk_setword ("sin", "cain") is called.
 * If name were "cain", it would be handled
 * in the outermost if block. */
return ASE_NULL;
}
}
else
{
/* the name is not involved in any word customization */
k = name;
l = len;
}
}
/* END NOTE */
/* search the user-defined functions with the resolved key */
pair = ase_map_search (awk->bfn.user, k, l);
if (pair == ASE_NULL) return ASE_NULL;
bfn = (ase_awk_bfn_t*)ASE_MAP_VPTR(pair);
/* NOTE(review): a user function is rejected only when none of its
 * option bits is enabled, whereas the system table loop above requires
 * all of them. The two tests agree for single-bit masks only - confirm
 * which behavior is intended. */
if (bfn->valid != 0 && (awk->option & bfn->valid) == 0) return ASE_NULL;
return bfn;
}
/*
 * close (name)
 *
 * Closes the extio identified by the string form of the argument and
 * makes the awk-level return value the result of ase_awk_closeextio().
 * The awk-level result is -1, without attempting to close anything, if
 * the name is empty or contains a null character.
 *
 * Returns 0 on success, -1 if the argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_close (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* arg, * ret;
	ase_char_t* name;
	ase_size_t len, i;
	int owned; /* non-zero if name was allocated by the conversion */
	int rc;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 1);
	/* TODO: support close (xxx, "to"/"from") like gawk */

	arg = ase_awk_getarg (run, 0);
	ASE_ASSERT (arg != ASE_NULL);

	owned = (arg->type != ASE_AWK_VAL_STR);
	if (owned)
	{
		name = ase_awk_valtostr (
			run, arg, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len);
		if (name == ASE_NULL) return -1;
	}
	else
	{
		name = ((ase_awk_val_str_t*)arg)->buf;
		len = ((ase_awk_val_str_t*)arg)->len;
	}

	/* getline or print doesn't allow an empty string for the
	 * input or output file name, so close should not allow
	 * it either.
	 * another reason for this is that if close is called explicitly
	 * with an empty string, it may close the console that uses
	 * an empty string for its identification because closeextio
	 * closes any extios that match the name given unlike
	 * closeextio_read or closeextio_write. */
	rc = -1;

	if (len > 0)
	{
		/* walk backwards looking for an embedded null character.
		 * i reaches 0 only when the name contains none. */
		for (i = len; i > 0; i--)
		{
			if (name[i-1] == ASE_T('\0')) break;
		}

		if (i == 0) rc = ase_awk_closeextio (run, name);
	}

	if (owned) ASE_AWK_FREE (run->awk, name);

	ret = ase_awk_makeintval (run, (ase_long_t)rc);
	if (ret == ASE_NULL) return -1;

	ase_awk_setretval (run, ret);
	return 0;
}
/*
 * Flushes the stream 'name' of the given extio type and folds the outcome
 * into the running status 'n' that bfn_fflush threads through successive
 * calls.
 *
 * Returns:
 *   n unchanged if no handler is installed for the extio type;
 *   0 if the flush succeeded, unless n is already -1, which is kept;
 *   -1 if the flush failed with an error other than ASE_AWK_EIONONE;
 *   on ASE_AWK_EIONONE, -2 if n is non-zero, or n (0) otherwise.
 */
static int flush_extio (
	ase_awk_run_t* run, int extio, const ase_char_t* name, int n)
{
	if (run->extio.handler[extio] == ASE_NULL) return n;

	if (ase_awk_flushextio (run, extio, name) != -1)
	{
		/* flushed. an earlier handler error (-1) stays sticky */
		return (n != -1)? 0: n;
	}

	/* a real error from the handler */
	if (run->errnum != ASE_AWK_EIONONE) return -1;

	/* no such stream for this type. don't override a success
	 * recorded for another type */
	return (n != 0)? -2: n;
}
/*
 * fflush ([name])
 *
 * Without an argument, flushes the console output. With an argument,
 * flushes the file, pipe and coprocess streams matching the name; an
 * empty name is handed to the flush routine as ASE_NULL.
 * The awk-level return value is 0 on success and -1 on failure.
 *
 * Returns 0 on success, -1 if the argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_fflush (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* arg, * ret;
	int n;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 0 || nargs == 1);

	if (nargs == 0)
	{
		/* flush the console output.
		 * fflush() should return -1 on errors */
		n = ase_awk_flushextio (run, ASE_AWK_OUT_CONSOLE, ASE_T(""));
	}
	else
	{
		ase_char_t* target;
		ase_size_t target_len, i;
		int owned;

		arg = ase_awk_getarg (run, 0);
		owned = (arg->type != ASE_AWK_VAL_STR);

		if (owned)
		{
			target = ase_awk_valtostr (
				run, arg, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &target_len);
			if (target == ASE_NULL) return -1;
		}
		else
		{
			target = ((ase_awk_val_str_t*)arg)->buf;
			target_len = ((ase_awk_val_str_t*)arg)->len;
		}

		/* stop at the first null character, if any */
		for (i = 0; i < target_len; i++)
		{
			if (target[i] == ASE_T('\0')) break;
		}

		if (i < target_len)
		{
			/* the target name contains a null character.
			 * make fflush return -1 */
			n = -1;
		}
		else
		{
			const ase_char_t* key;

			key = (target_len == 0)? ASE_NULL: target;

			/* flush the given extio across all stream types */
			n = flush_extio (run, ASE_AWK_EXTIO_FILE, key, 1);
			n = flush_extio (run, ASE_AWK_EXTIO_PIPE, key, n);
			n = flush_extio (run, ASE_AWK_EXTIO_COPROC, key, n);

			/* if n remains 1, no io handlers have been defined for
			 * file, pipe, and coproc. so make fflush return -1.
			 * if n is -2, no such named io has been found at all
			 * if n is -1, the io handler has returned an error */
			if (n != 0) n = -1;
		}

		if (owned) ASE_AWK_FREE (run->awk, target);
	}

	ret = ase_awk_makeintval (run, (ase_long_t)n);
	if (ret == ASE_NULL) return -1;

	ase_awk_setretval (run, ret);
	return 0;
}
/*
 * index (string, substring)
 *
 * The awk-level return value is the offset of the first occurrence of
 * the second argument in the first one, or -1 if there is none. With
 * ASE_AWK_BASEONE enabled, the value is shifted by one so that positions
 * start at 1 and 0 means "not found".
 *
 * Returns 0 on success, -1 if an argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_index (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* hay_val, * needle_val, * ret;
	ase_char_t* hay, * needle, * hit;
	ase_size_t hay_len, needle_len;
	int hay_owned, needle_owned;
	ase_long_t pos;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 2);

	hay_val = ase_awk_getarg (run, 0);
	needle_val = ase_awk_getarg (run, 1);

	hay_owned = (hay_val->type != ASE_AWK_VAL_STR);
	needle_owned = (needle_val->type != ASE_AWK_VAL_STR);

	if (hay_owned)
	{
		hay = ase_awk_valtostr (
			run, hay_val, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &hay_len);
		if (hay == ASE_NULL) return -1;
	}
	else
	{
		hay = ((ase_awk_val_str_t*)hay_val)->buf;
		hay_len = ((ase_awk_val_str_t*)hay_val)->len;
	}

	if (needle_owned)
	{
		needle = ase_awk_valtostr (
			run, needle_val, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &needle_len);
		if (needle == ASE_NULL)
		{
			if (hay_owned) ASE_AWK_FREE (run->awk, hay);
			return -1;
		}
	}
	else
	{
		needle = ((ase_awk_val_str_t*)needle_val)->buf;
		needle_len = ((ase_awk_val_str_t*)needle_val)->len;
	}

	hit = ase_strxnstr (hay, hay_len, needle, needle_len);
	if (hit != ASE_NULL) pos = (ase_long_t)(hit - hay);
	else pos = -1;

	if (ase_awk_getoption(run->awk) & ASE_AWK_BASEONE) pos = pos + 1;

	if (hay_owned) ASE_AWK_FREE (run->awk, hay);
	if (needle_owned) ASE_AWK_FREE (run->awk, needle);

	ret = ase_awk_makeintval (run, pos);
	if (ret == ASE_NULL) return -1;

	ase_awk_setretval (run, ret);
	return 0;
}
/*
 * length (value)
 *
 * The awk-level return value is the number of characters in the string
 * form of the argument.
 *
 * Returns 0 on success, -1 if the argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_length (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* arg, * ret;
	ase_size_t len;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 1);

	arg = ase_awk_getarg (run, 0);
	if (arg->type != ASE_AWK_VAL_STR)
	{
		/* only the length is needed. the converted text is
		 * discarded right away */
		ase_char_t* tmp;

		tmp = ase_awk_valtostr (
			run, arg, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len);
		if (tmp == ASE_NULL) return -1;
		ASE_AWK_FREE (run->awk, tmp);
	}
	else
	{
		len = ((ase_awk_val_str_t*)arg)->len;
	}

	ret = ase_awk_makeintval (run, len);
	if (ret == ASE_NULL) return -1;

	ase_awk_setretval (run, ret);
	return 0;
}
/*
 * substr (string, index [, count])
 *
 * The awk-level return value is the part of the string that starts at
 * 'index' and is at most 'count' characters long. A missing count means
 * "up to the end of the string". Real-number arguments are truncated to
 * integers. With ASE_AWK_BASEONE enabled the index is 1-based. An index
 * outside the string is clamped to the nearest end and a negative count
 * is treated as 0.
 *
 * Returns 0 on success, -1 if an argument cannot be converted or the
 * return value cannot be created.
 */
static int bfn_substr (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* src, * idx_val, * cnt_val, * ret;
	ase_char_t* text;
	ase_size_t text_len;
	ase_long_t start, count;
	ase_real_t rstart, rcount;
	int owned, kind;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs >= 2 && nargs <= 3);

	src = ase_awk_getarg (run, 0);
	idx_val = ase_awk_getarg (run, 1);
	cnt_val = (nargs >= 3)? ase_awk_getarg (run, 2): ASE_NULL;

	owned = (src->type != ASE_AWK_VAL_STR);
	if (owned)
	{
		text = ase_awk_valtostr (
			run, src, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &text_len);
		if (text == ASE_NULL) return -1;
	}
	else
	{
		text = ((ase_awk_val_str_t*)src)->buf;
		text_len = ((ase_awk_val_str_t*)src)->len;
	}

	kind = ase_awk_valtonum (run, idx_val, &start, &rstart);
	if (kind == -1)
	{
		if (owned) ASE_AWK_FREE (run->awk, text);
		return -1;
	}
	/* 1 indicates that the real number output was filled in */
	if (kind == 1) start = (ase_long_t)rstart;

	if (cnt_val != ASE_NULL)
	{
		kind = ase_awk_valtonum (run, cnt_val, &count, &rcount);
		if (kind == -1)
		{
			if (owned) ASE_AWK_FREE (run->awk, text);
			return -1;
		}
		if (kind == 1) count = (ase_long_t)rcount;
	}
	else
	{
		count = (ase_long_t)text_len;
	}

	if (ase_awk_getoption(run->awk) & ASE_AWK_BASEONE) start = start - 1;

	/* clamp the starting offset into [0, text_len] */
	if (start < 0) start = 0;
	else if (start >= (ase_long_t)text_len) start = (ase_long_t)text_len;

	/* clamp the count into [0, text_len - start] */
	if (count < 0) count = 0;
	else if (count > (ase_long_t)text_len - start)
	{
		count = (ase_long_t)text_len - start;
	}

	ret = ase_awk_makestrval (run, &text[start], (ase_size_t)count);

	/* the new value does not need the converted text any more */
	if (owned) ASE_AWK_FREE (run->awk, text);
	if (ret == ASE_NULL) return -1;

	ase_awk_setretval (run, ret);
	return 0;
}
/*
 * split (string, array [, fs])
 *
 * Splits the string form of the first argument into fields and stores
 * them into a fresh map that replaces the value referenced by the second
 * argument. The keys are consecutive integers starting at 1 when
 * ASE_AWK_BASEONE is enabled and at 0 otherwise. The separator is the
 * third argument if given, or else the FS global (a single space if FS
 * is nil). A separator longer than one character is treated as a regular
 * expression. The awk-level return value is the number of fields.
 *
 * An input yielding no token at all produces an empty map and a count of
 * 0 regardless of ASE_AWK_BASEONE: the "no field" test compares the
 * running index with the starting index rather than with 0.
 *
 * Returns 0 on success and -1 on failure. By then the target may already
 * have been replaced with a partially filled map.
 */
static int bfn_split (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* a0, * a1, * a2, * t1, * t2, ** a1_ref;
	ase_char_t* str, * str_free = ASE_NULL, * p, * tok;
	ase_size_t str_len, str_left, tok_len;
	ase_long_t sta, num;
	ase_char_t key[ASE_SIZEOF(ase_long_t)*8+2];
	ase_size_t key_len;
	ase_char_t* fs_ptr, * fs_free = ASE_NULL;
	ase_size_t fs_len;
	void* fs_rex = ASE_NULL;
	void* fs_rex_free = ASE_NULL;
	int errnum;
	int ret = -1;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs >= 2 && nargs <= 3);

	a0 = ase_awk_getarg (run, 0);
	a1 = ase_awk_getarg (run, 1);
	a2 = (nargs >= 3)? ase_awk_getarg (run, 2): ASE_NULL;

	ASE_ASSERT (a1->type == ASE_AWK_VAL_REF);

	if (((ase_awk_val_ref_t*)a1)->id >= ASE_AWK_VAL_REF_NAMEDIDX &&
	    ((ase_awk_val_ref_t*)a1)->id <= ASE_AWK_VAL_REF_ARGIDX)
	{
		/* an indexed value should not be assigned another map */
		ase_awk_setrunerrnum (run, ASE_AWK_EIDXVALASSMAP);
		return -1;
	}

	if (((ase_awk_val_ref_t*)a1)->id == ASE_AWK_VAL_REF_POS)
	{
		/* a positional should not be assigned a map */
		ase_awk_setrunerrnum (run, ASE_AWK_EPOSVALASSMAP);
		return -1;
	}

	a1_ref = (ase_awk_val_t**)((ase_awk_val_ref_t*)a1)->adr;
	if ((*a1_ref)->type != ASE_AWK_VAL_NIL &&
	    (*a1_ref)->type != ASE_AWK_VAL_MAP)
	{
		/* cannot change a scalar value to a map */
		ase_awk_setrunerrnum (run, ASE_AWK_ESCALARTOMAP);
		return -1;
	}

	/* from here on, every exit goes through 'done', which releases
	 * whatever str_free, fs_free and fs_rex_free hold */

	if (a0->type == ASE_AWK_VAL_STR)
	{
		str = ((ase_awk_val_str_t*)a0)->buf;
		str_len = ((ase_awk_val_str_t*)a0)->len;
	}
	else
	{
		str = ase_awk_valtostr (
			run, a0, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &str_len);
		if (str == ASE_NULL) goto done;
		str_free = str;
	}

	if (a2 == ASE_NULL)
	{
		/* get the value from FS */
		t1 = ase_awk_getglobal (run, ASE_AWK_GLOBAL_FS);
		if (t1->type == ASE_AWK_VAL_NIL)
		{
			fs_ptr = ASE_T(" ");
			fs_len = 1;
		}
		else if (t1->type == ASE_AWK_VAL_STR)
		{
			fs_ptr = ((ase_awk_val_str_t*)t1)->buf;
			fs_len = ((ase_awk_val_str_t*)t1)->len;
		}
		else
		{
			fs_ptr = ase_awk_valtostr (
				run, t1, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &fs_len);
			if (fs_ptr == ASE_NULL) goto done;
			fs_free = fs_ptr;
		}

		if (fs_len > 1)
		{
			/* use the regular expression kept in the run-time
			 * context for FS. it is not owned by this function,
			 * so fs_rex_free stays null */
			fs_rex = run->global.fs;
		}
	}
	else
	{
		if (a2->type == ASE_AWK_VAL_STR)
		{
			fs_ptr = ((ase_awk_val_str_t*)a2)->buf;
			fs_len = ((ase_awk_val_str_t*)a2)->len;
		}
		else
		{
			fs_ptr = ase_awk_valtostr (
				run, a2, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &fs_len);
			if (fs_ptr == ASE_NULL) goto done;
			fs_free = fs_ptr;
		}

		if (fs_len > 1)
		{
			fs_rex = ASE_AWK_BUILDREX (
				run->awk, fs_ptr, fs_len, &errnum);
			if (fs_rex == ASE_NULL)
			{
				ase_awk_setrunerrnum (run, errnum);
				goto done;
			}
			fs_rex_free = fs_rex;
		}
	}

	t1 = ase_awk_makemapval (run);
	if (t1 == ASE_NULL) goto done;

	/* replace the referenced value with the new map */
	ase_awk_refdownval (run, *a1_ref);
	*a1_ref = t1;
	ase_awk_refupval (run, *a1_ref);

	p = str; str_left = str_len;
	sta = (ase_awk_getoption(run->awk) & ASE_AWK_BASEONE)? 1: 0;
	num = sta;

	while (p != ASE_NULL)
	{
		if (fs_len <= 1)
		{
			p = ase_awk_strxntok (run,
				p, str_len, fs_ptr, fs_len, &tok, &tok_len);
		}
		else
		{
			p = ase_awk_strxntokbyrex (run, p, str_len,
				fs_rex, &tok, &tok_len, &errnum);
			if (p == ASE_NULL && errnum != ASE_AWK_ENOERR)
			{
				ase_awk_setrunerrnum (run, errnum);
				goto done;
			}
		}

		if (num == sta && p == ASE_NULL && tok_len == 0)
		{
			/* no field at all. num still equals the starting
			 * index, so nothing has been stored yet */
			break;
		}

		ASE_ASSERT (
			(tok != ASE_NULL && tok_len > 0) || tok_len == 0);

		/* create the field string */
		t2 = ase_awk_makestrval (run, tok, tok_len);
		if (t2 == ASE_NULL) goto done;

		/* put it into the map */
		key_len = ase_awk_longtostr (
			num, 10, ASE_NULL, key, ASE_COUNTOF(key));
		ASE_ASSERT (key_len != (ase_size_t)-1);

		/* don't forget to update the reference count when you
		 * handle the assignment-like situation. anyway, it is
		 * incremented in advance as if the assignment was successful.
		 * it is decremented if the assignment fails. */
		ase_awk_refupval (run, t2);

		if (ase_map_insert (
			((ase_awk_val_map_t*)t1)->map,
			key, key_len, t2, 0) == ASE_NULL)
		{
			/* assignment failed. restore the reference counter */
			ase_awk_refdownval (run, t2);

			/* ase_map_insert() fails if the key exists.
			 * that can't happen here. so set the error code
			 * to ENOMEM */
			ase_awk_setrunerrnum (run, ASE_AWK_ENOMEM);
			goto done;
		}

		num++;

		/* the remaining length is only meaningful while there is
		 * more input to scan */
		if (p != ASE_NULL) str_len = str_left - (p - str);
	}

	/* turn the next index into the number of fields */
	if (sta == 1) num--;

	t1 = ase_awk_makeintval (run, num);
	if (t1 == ASE_NULL) goto done;

	ase_awk_setretval (run, t1);
	ret = 0;

done:
	if (str_free != ASE_NULL) ASE_AWK_FREE (run->awk, str_free);
	if (fs_free != ASE_NULL) ASE_AWK_FREE (run->awk, fs_free);
	if (fs_rex_free != ASE_NULL) ASE_AWK_FREEREX (run->awk, fs_rex_free);
	return ret;
}
/*
 * tolower (string)
 *
 * The awk-level return value is a copy of the string form of the
 * argument with every character passed through ASE_AWK_TOLOWER.
 *
 * The conversion is applied to the buffer of the newly created value,
 * never to the argument itself: when the argument is already a string
 * value, its buffer belongs to the caller's variable and must be left
 * untouched.
 *
 * Returns 0 on success, -1 if the argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_tolower (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_char_t* str;
	ase_size_t len, i;
	ase_awk_val_t* a0, * r;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 1);

	a0 = ase_awk_getarg (run, 0);

	if (a0->type == ASE_AWK_VAL_STR)
	{
		str = ((ase_awk_val_str_t*)a0)->buf;
		len = ((ase_awk_val_str_t*)a0)->len;
	}
	else
	{
		str = ase_awk_valtostr (
			run, a0, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len);
		if (str == ASE_NULL) return -1;
	}

	/* duplicate first. the source text is not needed afterwards */
	r = ase_awk_makestrval (run, str, len);
	if (a0->type != ASE_AWK_VAL_STR) ASE_AWK_FREE (run->awk, str);
	if (r == ASE_NULL) return -1;

	/* convert the private copy held by the new value in place.
	 * nothing is written when len is 0 */
	str = ((ase_awk_val_str_t*)r)->buf;
	for (i = 0; i < len; i++) str[i] = ASE_AWK_TOLOWER (run->awk, str[i]);

	ase_awk_setretval (run, r);
	return 0;
}
/*
 * toupper (string)
 *
 * The awk-level return value is a copy of the string form of the
 * argument with every character passed through ASE_AWK_TOUPPER.
 *
 * The conversion is applied to the buffer of the newly created value,
 * never to the argument itself: when the argument is already a string
 * value, its buffer belongs to the caller's variable and must be left
 * untouched.
 *
 * Returns 0 on success, -1 if the argument cannot be converted to a
 * string or the return value cannot be created.
 */
static int bfn_toupper (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_char_t* str;
	ase_size_t len, i;
	ase_awk_val_t* a0, * r;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 1);

	a0 = ase_awk_getarg (run, 0);

	if (a0->type == ASE_AWK_VAL_STR)
	{
		str = ((ase_awk_val_str_t*)a0)->buf;
		len = ((ase_awk_val_str_t*)a0)->len;
	}
	else
	{
		str = ase_awk_valtostr (
			run, a0, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len);
		if (str == ASE_NULL) return -1;
	}

	/* duplicate first. the source text is not needed afterwards */
	r = ase_awk_makestrval (run, str, len);
	if (a0->type != ASE_AWK_VAL_STR) ASE_AWK_FREE (run->awk, str);
	if (r == ASE_NULL) return -1;

	/* convert the private copy held by the new value in place.
	 * nothing is written when len is 0 */
	str = ((ase_awk_val_str_t*)r)->buf;
	for (i = 0; i < len; i++) str[i] = ASE_AWK_TOUPPER (run->awk, str[i]);

	ase_awk_setretval (run, r);
	return 0;
}
/*
 * Common implementation of sub() and gsub().
 *
 * Arguments of the awk-level call:
 *   0: the pattern - a regular expression value, or any other value whose
 *      string form is compiled into a regular expression
 *   1: the replacement text. '&' stands for the matched text and the
 *      two-character sequence '\&' for a literal '&'
 *   2: optional reference to the target. If omitted, the current input
 *      record line is used. A map is not allowed.
 *
 * max_count limits the number of substitutions; 0 means no limit.
 *
 * If at least one substitution is made, the result is written back to
 * the target (through ase_awk_setrec for the record and positional
 * targets). The awk-level return value is the number of substitutions.
 *
 * Zero-length matches: after a zero-length match the scan steps over one
 * character, which is copied verbatim, so that the loop always makes
 * progress. A zero-length match located exactly where the previous match
 * ended is not substituted.
 *
 * Returns 0 on success, -1 on failure.
 */
static int __substitute (ase_awk_run_t* run, ase_long_t max_count)
{
	ase_size_t nargs;
	ase_awk_val_t* a0, * a1, * a2, ** a2_ref = ASE_NULL, * v;
	ase_char_t* a0_ptr = ASE_NULL, * a1_ptr, * a2_ptr;
	ase_size_t a0_len = 0, a1_len, a2_len;
	ase_char_t* a0_ptr_free = ASE_NULL;
	ase_char_t* a1_ptr_free = ASE_NULL;
	ase_char_t* a2_ptr_free = ASE_NULL;
	void* rex = ASE_NULL;
	int rex_built = 0;  /* non-zero while rex is owned by this function */
	int new_inited = 0; /* non-zero while 'new' needs ase_str_fini */
	int opt, n, ret = -1;
	const ase_char_t* cur_ptr, * mat_ptr;
	const ase_char_t* last_end = ASE_NULL; /* end of the previous match */
	ase_size_t cur_len, mat_len, i, m;
	ase_str_t new;
	ase_long_t sub_count;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs >= 2 && nargs <= 3);

	a0 = ase_awk_getarg (run, 0);
	a1 = ase_awk_getarg (run, 1);
	a2 = (nargs >= 3)? ase_awk_getarg (run, 2): ASE_NULL;

	ASE_ASSERT (a2 == ASE_NULL || a2->type == ASE_AWK_VAL_REF);

	/* pattern */
	if (a0->type == ASE_AWK_VAL_REX)
	{
		rex = ((ase_awk_val_rex_t*)a0)->code;
	}
	else if (a0->type == ASE_AWK_VAL_STR)
	{
		a0_ptr = ((ase_awk_val_str_t*)a0)->buf;
		a0_len = ((ase_awk_val_str_t*)a0)->len;
	}
	else
	{
		a0_ptr = ase_awk_valtostr (
			run, a0, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &a0_len);
		if (a0_ptr == ASE_NULL) goto done;
		a0_ptr_free = a0_ptr;
	}

	/* replacement */
	if (a1->type == ASE_AWK_VAL_STR)
	{
		a1_ptr = ((ase_awk_val_str_t*)a1)->buf;
		a1_len = ((ase_awk_val_str_t*)a1)->len;
	}
	else
	{
		a1_ptr = ase_awk_valtostr (
			run, a1, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &a1_len);
		if (a1_ptr == ASE_NULL) goto done;
		a1_ptr_free = a1_ptr;
	}

	/* target */
	if (a2 == ASE_NULL)
	{
		/* is this correct? any needs to use inrec.d0? */
		a2_ptr = ASE_STR_PTR(&run->inrec.line);
		a2_len = ASE_STR_LEN(&run->inrec.line);
	}
	else if (((ase_awk_val_ref_t*)a2)->id == ASE_AWK_VAL_REF_POS)
	{
		ase_size_t idx;

		/* for a positional reference, adr carries the index */
		idx = (ase_size_t)((ase_awk_val_ref_t*)a2)->adr;
		if (idx == 0)
		{
			a2_ptr = ASE_STR_PTR(&run->inrec.line);
			a2_len = ASE_STR_LEN(&run->inrec.line);
		}
		else if (idx <= run->inrec.nflds)
		{
			a2_ptr = run->inrec.flds[idx-1].ptr;
			a2_len = run->inrec.flds[idx-1].len;
		}
		else
		{
			a2_ptr = ASE_T("");
			a2_len = 0;
		}
	}
	else
	{
		a2_ref = (ase_awk_val_t**)((ase_awk_val_ref_t*)a2)->adr;

		if ((*a2_ref)->type == ASE_AWK_VAL_MAP)
		{
			/* a map is not allowed as the third parameter */
			ase_awk_setrunerrnum (run, ASE_AWK_EMAPNOTALLOWED);
			goto done;
		}

		if ((*a2_ref)->type == ASE_AWK_VAL_STR)
		{
			a2_ptr = ((ase_awk_val_str_t*)(*a2_ref))->buf;
			a2_len = ((ase_awk_val_str_t*)(*a2_ref))->len;
		}
		else
		{
			a2_ptr = ase_awk_valtostr (
				run, *a2_ref, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &a2_len);
			if (a2_ptr == ASE_NULL) goto done;
			a2_ptr_free = a2_ptr;
		}
	}

	if (ase_str_init (&new, run->awk->mmgr, a2_len) == ASE_NULL)
	{
		ase_awk_setrunerrnum (run, ASE_AWK_ENOMEM);
		goto done;
	}
	new_inited = 1;

	if (a0->type != ASE_AWK_VAL_REX)
	{
		rex = ASE_AWK_BUILDREX (run->awk, a0_ptr, a0_len, &run->errnum);
		if (rex == ASE_NULL) goto done;
		rex_built = 1;
	}

	opt = (run->global.ignorecase)? ASE_REX_IGNORECASE: 0;
	cur_ptr = a2_ptr;
	cur_len = a2_len;
	sub_count = 0;

	while (1)
	{
		if (max_count == 0 || sub_count < max_count)
		{
			n = ASE_AWK_MATCHREX (
				run->awk, rex, opt, cur_ptr, cur_len,
				&mat_ptr, &mat_len, &run->errnum);
		}
		else n = 0; /* the limit has been reached */

		if (n == -1) goto done;

		if (n == 0)
		{
			/* no more match found. copy the rest as it is */
			if (ase_str_ncat (
				&new, cur_ptr, cur_len) == (ase_size_t)-1) goto done;
			break;
		}

		/* copy the text preceding the match */
		if (ase_str_ncat (
			&new, cur_ptr, mat_ptr - cur_ptr) == (ase_size_t)-1) goto done;

		/* an empty match sitting right at the end of the previous
		 * match is not substituted */
		if (mat_len > 0 || mat_ptr != last_end)
		{
			for (i = 0; i < a1_len; i++)
			{
				if ((i+1) < a1_len &&
				    a1_ptr[i] == ASE_T('\\') &&
				    a1_ptr[i+1] == ASE_T('&'))
				{
					/* an escaped ampersand */
					m = ase_str_ccat (&new, ASE_T('&'));
					i++;
				}
				else if (a1_ptr[i] == ASE_T('&'))
				{
					/* the matched text */
					m = ase_str_ncat (&new, mat_ptr, mat_len);
				}
				else
				{
					m = ase_str_ccat (&new, a1_ptr[i]);
				}

				if (m == (ase_size_t)-1) goto done;
			}

			sub_count++;
		}

		cur_len = cur_len - ((mat_ptr - cur_ptr) + mat_len);
		cur_ptr = mat_ptr + mat_len;
		last_end = cur_ptr;

		if (mat_len == 0)
		{
			/* the scan position has not moved past the match.
			 * step over one character to guarantee progress */
			if (cur_len == 0) break;

			if (ase_str_ccat (&new, *cur_ptr) == (ase_size_t)-1) goto done;
			cur_ptr++;
			cur_len--;
		}
	}

	/* the regular expression is not needed any more */
	if (rex_built)
	{
		ASE_AWK_FREEREX (run->awk, rex);
		rex_built = 0;
	}

	if (sub_count > 0)
	{
		if (a2 == ASE_NULL)
		{
			if (ase_awk_setrec (run, 0,
				ASE_STR_PTR(&new), ASE_STR_LEN(&new)) == -1) goto done;
		}
		else if (((ase_awk_val_ref_t*)a2)->id == ASE_AWK_VAL_REF_POS)
		{
			n = ase_awk_setrec (
				run, (ase_size_t)((ase_awk_val_ref_t*)a2)->adr,
				ASE_STR_PTR(&new), ASE_STR_LEN(&new));
			if (n == -1) goto done;
		}
		else
		{
			v = ase_awk_makestrval (run,
				ASE_STR_PTR(&new), ASE_STR_LEN(&new));
			if (v == ASE_NULL) goto done;

			/* replace the referenced value with the result */
			ase_awk_refdownval (run, *a2_ref);
			*a2_ref = v;
			ase_awk_refupval (run, *a2_ref);
		}
	}

	v = ase_awk_makeintval (run, sub_count);
	if (v == ASE_NULL) goto done;

	ase_awk_setretval (run, v);
	ret = 0;

done:
	if (rex_built) ASE_AWK_FREEREX (run->awk, rex);
	if (new_inited) ase_str_fini (&new);
	if (a2_ptr_free != ASE_NULL) ASE_AWK_FREE (run->awk, a2_ptr_free);
	if (a1_ptr_free != ASE_NULL) ASE_AWK_FREE (run->awk, a1_ptr_free);
	if (a0_ptr_free != ASE_NULL) ASE_AWK_FREE (run->awk, a0_ptr_free);
	return ret;
}
/*
 * gsub (pattern, replacement [, target])
 *
 * Delegates to __substitute with a limit of 0, which it treats as
 * "no limit on the number of substitutions".
 */
static int bfn_gsub (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	const ase_long_t no_limit = 0;

	return __substitute (run, no_limit);
}
/*
 * sub (pattern, replacement [, target])
 *
 * Delegates to __substitute with a limit of one substitution.
 */
static int bfn_sub (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	const ase_long_t only_first = 1;

	return __substitute (run, only_first);
}
/*
 * match (string, pattern)
 *
 * Matches the string form of the first argument against the second one,
 * which is either a regular expression value or a value whose string
 * form is compiled into a regular expression.
 *
 * The awk-level return value and the RSTART global are set to the offset
 * of the match, or -1 if there is none; the value is shifted by one when
 * ASE_AWK_BASEONE is enabled. The RLENGTH global is set to the length of
 * the match, or -1 if there is none.
 *
 * Returns 0 on success, -1 on failure.
 */
static int bfn_match (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* a0, * a1;
	ase_char_t* str0, * str1;
	ase_size_t len0, len1;
	ase_long_t idx;
	void* rex;
	int opt, n;
	const ase_char_t* mat_ptr;
	ase_size_t mat_len;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 2);

	a0 = ase_awk_getarg (run, 0);
	a1 = ase_awk_getarg (run, 1);

	if (a0->type == ASE_AWK_VAL_STR)
	{
		str0 = ((ase_awk_val_str_t*)a0)->buf;
		len0 = ((ase_awk_val_str_t*)a0)->len;
	}
	else
	{
		str0 = ase_awk_valtostr (
			run, a0, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len0);
		if (str0 == ASE_NULL) return -1;
	}

	if (a1->type == ASE_AWK_VAL_REX)
	{
		rex = ((ase_awk_val_rex_t*)a1)->code;
	}
	else
	{
		if (a1->type == ASE_AWK_VAL_STR)
		{
			str1 = ((ase_awk_val_str_t*)a1)->buf;
			len1 = ((ase_awk_val_str_t*)a1)->len;
		}
		else
		{
			str1 = ase_awk_valtostr (
				run, a1, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &len1);
			if (str1 == ASE_NULL)
			{
				if (a0->type != ASE_AWK_VAL_STR)
					ASE_AWK_FREE (run->awk, str0);
				return -1;
			}
		}

		rex = ASE_AWK_BUILDREX (run->awk, str1, len1, &run->errnum);

		/* the pattern text is released whether or not the
		 * compilation has succeeded */
		if (a1->type != ASE_AWK_VAL_STR) ASE_AWK_FREE (run->awk, str1);

		if (rex == ASE_NULL)
		{
			if (a0->type != ASE_AWK_VAL_STR)
				ASE_AWK_FREE (run->awk, str0);
			return -1;
		}
	}

	opt = (run->global.ignorecase)? ASE_REX_IGNORECASE: 0;
	n = ASE_AWK_MATCHREX (
		run->awk, rex, opt, str0, len0,
		&mat_ptr, &mat_len, &run->errnum);

	/* work out the offset while str0 is still alive. mat_ptr is
	 * consulted only when a match has been reported */
	if (n == 0 || n == -1) idx = -1;
	else idx = (ase_long_t)(mat_ptr - str0);

	if (a0->type != ASE_AWK_VAL_STR) ASE_AWK_FREE (run->awk, str0);
	if (a1->type != ASE_AWK_VAL_REX) ASE_AWK_FREEREX (run->awk, rex);

	if (n == -1) return -1;

	if (ase_awk_getoption(run->awk) & ASE_AWK_BASEONE) idx = idx + 1;

	a0 = ase_awk_makeintval (run, idx);
	if (a0 == ASE_NULL) return -1;

	/* hold both values until the globals and the return value
	 * have been set */
	ase_awk_refupval (run, a0);

	a1 = ase_awk_makeintval (run,
		((n == 0)? (ase_long_t)-1: (ase_long_t)mat_len));
	if (a1 == ASE_NULL)
	{
		ase_awk_refdownval (run, a0);
		return -1;
	}

	ase_awk_refupval (run, a1);

	if (ase_awk_setglobal (run, ASE_AWK_GLOBAL_RSTART, a0) == -1)
	{
		ase_awk_refdownval (run, a1);
		ase_awk_refdownval (run, a0);
		return -1;
	}

	if (ase_awk_setglobal (run, ASE_AWK_GLOBAL_RLENGTH, a1) == -1)
	{
		ase_awk_refdownval (run, a1);
		ase_awk_refdownval (run, a0);
		return -1;
	}

	ase_awk_setretval (run, a0);

	ase_awk_refdownval (run, a1);
	ase_awk_refdownval (run, a0);
	return 0;
}
/*
 * sprintf (format, ...)
 *
 * Formats the arguments with ase_awk_format, using the string form of
 * the first argument as the format, and makes a copy of the result the
 * awk-level return value.
 *
 * Returns 0 on success, -1 on failure.
 */
static int bfn_sprintf (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* fmt_val, * ret_val;
	ase_str_t out, fbu;
	ase_xstr_t fmt;
	ase_xstr_t res;
	int fmt_owned;
	int ret = -1;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs > 0);

	/* two work buffers handed to the formatter */
	if (ase_str_init (&out, run->awk->mmgr, 256) == ASE_NULL)
	{
		ase_awk_setrunerrnum (run, ASE_AWK_ENOMEM);
		return -1;
	}
	if (ase_str_init (&fbu, run->awk->mmgr, 256) == ASE_NULL)
	{
		ase_str_fini (&out);
		ase_awk_setrunerrnum (run, ASE_AWK_ENOMEM);
		return -1;
	}

	fmt_val = ase_awk_getarg (run, 0);
	fmt_owned = (fmt_val->type != ASE_AWK_VAL_STR);

	if (fmt_owned)
	{
		fmt.ptr = ase_awk_valtostr (
			run, fmt_val, ASE_AWK_VALTOSTR_CLEAR, ASE_NULL, &fmt.len);
		if (fmt.ptr == ASE_NULL) goto done;
	}
	else
	{
		fmt.ptr = ((ase_awk_val_str_t*)fmt_val)->buf;
		fmt.len = ((ase_awk_val_str_t*)fmt_val)->len;
	}

	res.ptr = ase_awk_format (run,
		&out, &fbu, fmt.ptr, fmt.len, nargs, ASE_NULL, &res.len);

	/* the format text is not needed once formatting is over */
	if (fmt_owned) ASE_AWK_FREE (run->awk, fmt.ptr);
	if (res.ptr == ASE_NULL) goto done;

	/* the result is duplicated into the new value, so the work
	 * buffers can be finalized below */
	ret_val = ase_awk_makestrval (run, res.ptr, res.len);
	if (ret_val == ASE_NULL) goto done;

	ase_awk_setretval (run, ret_val);
	ret = 0;

done:
	ase_str_fini (&fbu);
	ase_str_fini (&out);
	return ret;
}