qse/ase/cmd/awk/awk.c

598 lines
13 KiB
C
Raw Normal View History

/*
 * $Id: awk.c 496 2008-12-15 09:56:48Z baconevi $
 */
#include <ase/awk/awk.h>
#include <ase/cmn/sll.h>
#include <ase/cmn/mem.h>
2008-08-21 04:58:19 +00:00
#include <ase/cmn/chr.h>
2008-08-23 02:13:47 +00:00
#include <ase/cmn/opt.h>
#include <ase/utl/stdio.h>
#include <ase/utl/main.h>
#include <string.h>
#include <signal.h>
#include <stdarg.h>
#include <math.h>
#include <stdlib.h>
2008-10-01 05:14:20 +00:00
#define ABORT(label) goto label
#if defined(_WIN32)
#include <windows.h>
#include <tchar.h>
#include <process.h>
#pragma warning (disable: 4996)
#pragma warning (disable: 4296)
2008-08-19 21:16:02 +00:00
#if defined(_MSC_VER) && defined(_DEBUG)
#define _CRTDBG_MAP_ALLOC
#include <crtdbg.h>
#endif
#else
#include <unistd.h>
#endif
2008-12-11 04:19:59 +00:00
/*
 * Emits a printf-style diagnostic message on the standard error stream.
 * The format string and the variadic arguments are forwarded unchanged to
 * ase_vfprintf().
 */
static void dprint (const ase_char_t* fmt, ...)
{
	va_list args;

	va_start (args, fmt);
	ase_vfprintf (stderr, fmt, args);
	va_end (args);
}
/* interpreter instance; assigned by awk_main() once open_awk() has succeeded */
ase_awk_t* app_awk = NULL;
/* run context of the script being executed: set by on_run_start(), reset to
 * NULL by on_run_end(), and read by stop_run() when an interrupt arrives */
ase_awk_run_t* app_run = NULL;
#ifdef _WIN32
static BOOL WINAPI stop_run (DWORD ctrl_type)
{
if (ctrl_type == CTRL_C_EVENT ||
ctrl_type == CTRL_CLOSE_EVENT)
{
ase_awk_stop (app_run);
return TRUE;
}
return FALSE;
}
#else
static void stop_run (int sig)
{
signal (SIGINT, SIG_IGN);
ase_awk_stop (app_run);
signal (SIGINT, stop_run);
}
#endif
/*
 * Run callback installed as runcbs.on_start by awk_main().
 * Publishes the run context in app_run so that stop_run() can reach it and
 * prints a start banner on stderr. The custom pointer is not used.
 */
static void on_run_start (ase_awk_run_t* run, void* custom)
{
	app_run = run;

	dprint (ASE_T("[AWK ABOUT TO START]\n"));
}
/*
 * Map walker used with ase_map_walk(): prints one "key = value" line on
 * stderr for the given pair. arg carries the ase_awk_run_t* needed to
 * convert the value to a string. Always asks the walk to continue, even
 * when the conversion fails.
 */
static ase_map_walk_t print_awk_value (
	ase_map_t* map, ase_map_pair_t* pair, void* arg)
{
	ase_awk_run_t* run = (ase_awk_run_t*)arg;
	ase_size_t vlen;
	ase_char_t* vstr;

	vstr = ase_awk_valtostr (run, ASE_MAP_VPTR(pair), 0, ASE_NULL, &vlen);
	if (vstr != ASE_NULL)
	{
		dprint (ASE_T("%.*s = %.*s\n"),
			(int)ASE_MAP_KLEN(pair), ASE_MAP_KPTR(pair),
			(int)vlen, vstr);

		/* the converted string is released through the owning awk object */
		ase_awk_free (ase_awk_getrunawk(run), vstr);
	}
	else
	{
		dprint (ASE_T("***OUT OF MEMORY***\n"));
	}

	return ASE_MAP_WALK_FORWARD;
}
/*
 * Run callback installed as runcbs.on_statement by awk_main().
 * Intentionally does nothing; the per-statement trace below is disabled.
 */
static void on_run_statement (
	ase_awk_run_t* run, ase_size_t line, void* custom)
{
	/*dprint (L"running %d\n", (int)line);*/
}
/*
 * Run callback installed as runcbs.on_return by awk_main().
 * Prints the value returned by the script on stderr (or a nil / out-of-memory
 * marker) followed by a dump of the run's named variables.
 */
static void on_run_return (
	ase_awk_run_t* run, ase_awk_val_t* ret, void* custom)
{
	if (ret == ase_awk_val_nil)
	{
		dprint (ASE_T("[RETURN] - ***nil***\n"));
	}
	else
	{
		ase_size_t rlen;
		ase_char_t* rstr;

		rstr = ase_awk_valtostr (run, ret, 0, ASE_NULL, &rlen);
		if (rstr != ASE_NULL)
		{
			dprint (ASE_T("[RETURN] - [%.*s]\n"), (int)rlen, rstr);
			ase_awk_free (ase_awk_getrunawk(run), rstr);
		}
		else
		{
			dprint (ASE_T("[RETURN] - ***OUT OF MEMORY***\n"));
		}
	}

	/* one line per named variable, printed by print_awk_value() */
	dprint (ASE_T("[NAMED VARIABLES]\n"));
	ase_map_walk (ase_awk_getrunnvmap(run), print_awk_value, run);
	dprint (ASE_T("[END NAMED VARIABLES]\n"));
}
2008-08-19 05:21:48 +00:00
/*
 * Run callback installed as runcbs.on_end by awk_main().
 * Reports how the run finished (with the error code, line and message when
 * errnum is not ASE_AWK_ENOERR) and clears app_run so that stop_run() no
 * longer sees a live run context.
 */
static void on_run_end (ase_awk_run_t* run, int errnum, void* data)
{
	if (errnum == ASE_AWK_ENOERR)
	{
		dprint (ASE_T("[AWK ENDED SUCCESSFULLY]\n"));
	}
	else
	{
		dprint (ASE_T("[AWK ENDED WITH AN ERROR]\n"));

		ase_printf (ASE_T("RUN ERROR: CODE [%d] LINE [%u] %s\n"),
			errnum,
			(unsigned int)ase_awk_getrunerrlin(run),
			ase_awk_getrunerrmsg(run));
	}

	app_run = NULL;
}
2008-08-19 21:16:02 +00:00
/* TODO: remove otab... */
static struct
{
const ase_char_t* name;
int opt;
} otab[] =
{
{ ASE_T("implicit"), ASE_AWK_IMPLICIT },
{ ASE_T("explicit"), ASE_AWK_EXPLICIT },
2008-07-23 07:12:56 +00:00
{ ASE_T("bxor"), ASE_AWK_BXOR },
{ ASE_T("shift"), ASE_AWK_SHIFT },
{ ASE_T("idiv"), ASE_AWK_IDIV },
{ ASE_T("extio"), ASE_AWK_EXTIO },
2008-07-15 23:56:32 +00:00
{ ASE_T("newline"), ASE_AWK_NEWLINE },
{ ASE_T("baseone"), ASE_AWK_BASEONE },
{ ASE_T("stripspaces"), ASE_AWK_STRIPSPACES },
{ ASE_T("nextofile"), ASE_AWK_NEXTOFILE },
{ ASE_T("crfl"), ASE_AWK_CRLF },
{ ASE_T("argstomain"), ASE_AWK_ARGSTOMAIN },
{ ASE_T("reset"), ASE_AWK_RESET },
{ ASE_T("maptovar"), ASE_AWK_MAPTOVAR },
2008-07-15 23:56:32 +00:00
{ ASE_T("pablock"), ASE_AWK_PABLOCK }
};
/*
 * Prints the command-line synopsis and the list of options on standard
 * output. argv0 is the program name to show in the synopsis lines.
 */
static void print_usage (const ase_char_t* argv0)
{
	/* unsigned index: ASE_COUNTOF() is an element count, so avoid a
	 * signed/unsigned comparison in the loop below */
	size_t j;

	ase_printf (ASE_T("Usage: %s [options] -f sourcefile [ -- ] [datafile]*\n"), argv0);
	ase_printf (ASE_T(" %s [options] [ -- ] sourcestring [datafile]*\n"), argv0);
	ase_printf (ASE_T("Where options are:\n"));
	ase_printf (ASE_T(" -f sourcefile --file=sourcefile\n"));
	ase_printf (ASE_T(" -d deparsedfile --deparsed-file=deparsedfile\n"));
	ase_printf (ASE_T(" -F string --field-separator=string\n"));
	/* -v and -h are accepted by handle_args() and were missing here */
	ase_printf (ASE_T(" -v var=value --assign=var=value\n"));
	ase_printf (ASE_T(" -h --help\n"));

	ase_printf (ASE_T("\nYou may specify the following options to change the behavior of the interpreter.\n"));
	for (j = 0; j < ASE_COUNTOF(otab); j++)
	{
		ase_printf (ASE_T(" -%-20s -no%-20s\n"), otab[j].name, otab[j].name);
	}
}
/*
 * Implementation of the awk-level function sleep(seconds), registered by
 * open_awk().
 *
 * The single argument is converted to a number; a real value is truncated
 * to an integer and a negative value is treated as 0. The script receives
 * the result of sleep() on POSIX systems (the number of unslept seconds)
 * and 0 on Windows.
 *
 * Returns 0 on success, or -1 if the argument cannot be converted or the
 * return value cannot be allocated.
 */
static int bfn_sleep (
	ase_awk_run_t* run, const ase_char_t* fnm, ase_size_t fnl)
{
	ase_size_t nargs;
	ase_awk_val_t* a0;
	ase_long_t lv;
	ase_real_t rv;
	ase_awk_val_t* r;
	int n;

	nargs = ase_awk_getnargs (run);
	ASE_ASSERT (nargs == 1);

	a0 = ase_awk_getarg (run, 0);

	n = ase_awk_valtonum (run, a0, &lv, &rv);
	if (n == -1) return -1;
	/* n == 1: the number was delivered through rv; use its integer part */
	if (n == 1) lv = (ase_long_t)rv;

	/* both sleep() and Sleep() take an unsigned amount; passing a negative
	 * count through would turn it into an extremely long delay */
	if (lv < 0) lv = 0;

#ifdef _WIN32
	{
		/* Sleep() takes milliseconds in a DWORD; cap the number of
		 * seconds so that lv * 1000 cannot wrap around */
		const ase_long_t max_secs = (ase_long_t)(((DWORD)-1) / 1000);
		if (lv > max_secs) lv = max_secs;
		Sleep ((DWORD)(lv * 1000));
	}
	n = 0;
#else
	n = sleep ((unsigned int)lv);
#endif

	r = ase_awk_makeintval (run, n);
	if (r == ASE_NULL)
	{
		ase_awk_setrunerrnum (run, ASE_AWK_ENOMEM);
		return -1;
	}

	ase_awk_setretval (run, r);
	return 0;
}
static void out_of_memory (void)
{
ase_fprintf (ASE_STDERR, ASE_T("Error: out of memory\n"));
}
2008-10-01 05:14:20 +00:00
struct argout_t
{
2008-12-16 03:56:48 +00:00
void* isp; /* input source files or string */
2008-12-13 03:42:32 +00:00
int ist; /* input source type */
ase_size_t isfl; /* the number of input source files */
ase_char_t* osf; /* output source file */
ase_char_t** icf; /* input console files */
ase_size_t icfl; /* the number of input console files */
ase_map_t* vm; /* global variable map */
2008-10-01 05:14:20 +00:00
};
/*
 * Parses the command line and stores the result in *ao.
 *
 * Returns:
 *    0  on success; *ao is completely filled in.
 *    1  when -h/--help was given; usage has been printed and *ao is left
 *       untouched.
 *   -1  on any error; *ao is left untouched and everything allocated here
 *       has been released.
 *
 * Ownership on success: ao->icf, ao->vm and (only when ao->ist is
 * ASE_AWK_PARSE_FILES) the array ao->isp are allocated here and must be
 * released by the caller. ao->osf and the strings referenced by the arrays
 * are not allocated by this function and must not be freed.
 *
 * NOTE: 'm' (--main) is listed in the option string but has no case below,
 * so it ends up in the default branch and is rejected.
 */
static int handle_args (int argc, ase_char_t* argv[], struct argout_t* ao)
{
	static ase_opt_lng_t lng[] =
	{
		{ ASE_T("implicit"),         0 },
		{ ASE_T("explicit"),         0 },
		{ ASE_T("bxor"),             0 },
		{ ASE_T("shift"),            0 },
		{ ASE_T("idiv"),             0 },
		{ ASE_T("extio"),            0 },
		{ ASE_T("newline"),          0 },
		{ ASE_T("baseone"),          0 },
		{ ASE_T("stripspaces"),      0 },
		{ ASE_T("nextofile"),        0 },
		{ ASE_T("crlf"),             0 },
		{ ASE_T("argstomain"),       0 },
		{ ASE_T("reset"),            0 },
		{ ASE_T("maptovar"),         0 },
		{ ASE_T("pablock"),          0 },

		{ ASE_T(":main"),            ASE_T('m') },
		{ ASE_T(":file"),            ASE_T('f') },
		{ ASE_T(":field-separator"), ASE_T('F') },
		{ ASE_T(":deparsed-file"),   ASE_T('d') },
		{ ASE_T(":assign"),          ASE_T('v') },

		{ ASE_T("help"),             ASE_T('h') }
	};

	static ase_opt_t opt =
	{
		ASE_T("hm:f:F:d:v:"),
		lng
	};

	ase_cint_t c;

	ase_size_t isfc = 16; /* the capacity of isf */
	ase_size_t isfl = 0;  /* number of input source files */

	ase_size_t icfc = 0;  /* the capacity of icf */
	ase_size_t icfl = 0;  /* the number of input console files */

	ase_char_t** isf = ASE_NULL; /* input source files */
	ase_char_t* osf = ASE_NULL;  /* output source file */
	ase_char_t** icf = ASE_NULL; /* input console files */

	ase_map_t* vm = ASE_NULL;    /* global variable map */

	/* collected locally and copied to *ao only once nothing can fail */
	void* isp = ASE_NULL;
	int ist = 0;

	isf = (ase_char_t**) malloc (ASE_SIZEOF(*isf) * isfc);
	if (isf == ASE_NULL)
	{
		out_of_memory ();
		ABORT (oops);
	}

	vm = ase_map_open (ASE_NULL, 0, 30, 70);
	if (vm == ASE_NULL)
	{
		out_of_memory ();
		ABORT (oops);
	}
	ase_map_setcopier (vm, ASE_MAP_KEY, ASE_MAP_COPIER_INLINE);
	ase_map_setcopier (vm, ASE_MAP_VAL, ASE_MAP_COPIER_INLINE);
	ase_map_setscale (vm, ASE_MAP_KEY, ASE_SIZEOF(ase_char_t));
	ase_map_setscale (vm, ASE_MAP_VAL, ASE_SIZEOF(ase_char_t));

	while ((c = ase_getopt (argc, argv, &opt)) != ASE_CHAR_EOF)
	{
		switch (c)
		{
			case 0:
				ase_printf (ASE_T(">>> [%s] [%s]\n"), opt.lngopt, opt.arg);
				break;

			case ASE_T('h'):
				print_usage (argv[0]);
				if (isf != ASE_NULL) free (isf);
				if (vm != ASE_NULL) ase_map_close (vm);
				return 1;

			case ASE_T('f'):
			{
				if (isfl >= isfc-1) /* -1 for last ASE_NULL */
				{
					ase_char_t** tmp;
					tmp = (ase_char_t**) realloc (isf, ASE_SIZEOF(*isf)*(isfc+16));
					if (tmp == ASE_NULL)
					{
						out_of_memory ();
						ABORT (oops);
					}

					isf = tmp;
					isfc = isfc + 16;
				}

				isf[isfl++] = opt.arg;
				break;
			}

			case ASE_T('F'):
			{
				ase_printf (ASE_T("[field separator] = %s\n"), opt.arg);
				break;
			}

			case ASE_T('d'):
			{
				osf = opt.arg;
				break;
			}

			case ASE_T('v'):
			{
				ase_char_t* eq = ase_strchr(opt.arg, ASE_T('='));
				if (eq == ASE_NULL)
				{
					/* not in name=value form */
					ase_printf (ASE_T("Error: bad variable assignment - %s\n"), opt.arg);
					ABORT (oops);
				}

				/* split "name=value" in place: terminate the name at '='
				 * and step past it so that eq addresses the value (it
				 * previously kept pointing at the terminator, which
				 * stored an empty value for every variable) */
				*eq = ASE_T('\0');
				eq++;

				if (ase_map_upsert (vm, opt.arg, ase_strlen(opt.arg)+1, eq, ase_strlen(eq)+1) == ASE_NULL)
				{
					out_of_memory ();
					ABORT (oops);
				}
				break;
			}

			case ASE_T('?'):
			{
				if (opt.lngopt)
				{
					ase_printf (ASE_T("Error: illegal option - %s\n"), opt.lngopt);
				}
				else
				{
					ase_printf (ASE_T("Error: illegal option - %c\n"), opt.opt);
				}

				ABORT (oops);
			}

			case ASE_T(':'):
			{
				if (opt.lngopt)
				{
					ase_printf (ASE_T("Error: bad argument for %s\n"), opt.lngopt);
				}
				else
				{
					ase_printf (ASE_T("Error: bad argument for %c\n"), opt.opt);
				}

				ABORT (oops);
			}

			default:
				ABORT (oops);
		}
	}

	if (isfl <= 0)
	{
		if (opt.ind >= argc)
		{
			/* no source code specified */
			ABORT (oops);
		}

		/* the source code is the string, not from the file */
		ist = ASE_AWK_PARSE_STRING;
		isp = argv[opt.ind++];

		/* the file-name array is not handed to the caller in this mode,
		 * so release it here instead of leaking it */
		free (isf);
		isf = ASE_NULL;
	}
	else
	{
		isf[isfl] = ASE_NULL;

		ist = ASE_AWK_PARSE_FILES;
		isp = isf;
	}

	/* the remaining arguments are input console file names */
	icfc = (opt.ind >= argc)? 2: (argc - opt.ind + 1);
	icf = (ase_char_t**) malloc (ASE_SIZEOF(*icf)*icfc);
	if (icf == ASE_NULL)
	{
		out_of_memory ();
		ABORT (oops);
	}

	if (opt.ind >= argc)
	{
		/* no input(console) file names are specified.
		 * the standard input becomes the input console */
		icf[icfl++] = ASE_T("");
	}
	else
	{
		while (opt.ind < argc) icf[icfl++] = argv[opt.ind++];
	}
	icf[icfl] = ASE_NULL;

	/* nothing can fail from here on: publish the result */
	ao->ist = ist;
	ao->isp = isp;
	ao->isfl = isfl;
	ao->osf = osf;
	ao->icf = icf;
	ao->icfl = icfl;
	ao->vm = vm;

	return 0;

oops:
	if (vm != ASE_NULL) ase_map_close (vm);
	if (icf != ASE_NULL) free (icf);
	if (isf != ASE_NULL) free (isf);
	return -1;
}
2008-08-04 08:06:43 +00:00
static ase_awk_t* open_awk (void)
{
ase_awk_t* awk;
2008-12-16 03:56:48 +00:00
awk = ase_awk_opensimple (0);
2008-08-04 08:06:43 +00:00
if (awk == ASE_NULL)
{
ase_printf (ASE_T("ERROR: cannot open awk\n"));
return ASE_NULL;
2008-08-04 08:06:43 +00:00
}
2008-08-19 05:21:48 +00:00
/* TODO: get depth from command line */
ase_awk_setmaxdepth (
awk, ASE_AWK_DEPTH_BLOCK_PARSE | ASE_AWK_DEPTH_EXPR_PARSE, 50);
ase_awk_setmaxdepth (
awk, ASE_AWK_DEPTH_BLOCK_RUN | ASE_AWK_DEPTH_EXPR_RUN, 500);
2008-08-04 08:06:43 +00:00
2008-08-19 05:21:48 +00:00
/*
ase_awk_seterrstr (awk, ASE_AWK_EGBLRED,
ASE_T("\uC804\uC5ED\uBCC0\uC218 \'%.*s\'\uAC00 \uC7AC\uC815\uC758 \uB418\uC5C8\uC2B5\uB2C8\uB2E4"));
ase_awk_seterrstr (awk, ASE_AWK_EAFNRED,
ASE_T("\uD568\uC218 \'%.*s\'\uAC00 \uC7AC\uC815\uC758 \uB418\uC5C8\uC2B5\uB2C8\uB2E4"));
*/
/*ase_awk_setkeyword (awk, ASE_T("func"), 4, ASE_T("FX"), 2);*/
2008-08-04 08:06:43 +00:00
2008-08-19 05:21:48 +00:00
if (ase_awk_addfunc (awk,
ASE_T("sleep"), 5, 0,
1, 1, ASE_NULL, bfn_sleep) == ASE_NULL)
{
ase_awk_close (awk);
ase_printf (ASE_T("ERROR: cannot add function 'sleep'\n"));
return ASE_NULL;
}
2008-08-04 08:06:43 +00:00
return awk;
}
2008-07-21 06:42:39 +00:00
/*
 * Program body: parses the command line, opens the interpreter, parses the
 * awk source, runs it over the input console files, and releases every
 * resource on all exit paths.
 *
 * Returns 0 on success (including the case where only usage was requested)
 * and -1 on any failure.
 */
static int awk_main (int argc, ase_char_t* argv[])
{
	ase_awk_t* awk = ASE_NULL;
	ase_awk_runcbs_t runcbs;
	struct argout_t ao;
	int n;
	int ret = -1;

	ase_memset (&ao, 0, ASE_SIZEOF(ao));

	n = handle_args (argc, argv, &ao);
	if (n == -1)
	{
		/* handle_args() has already released what it allocated */
		print_usage (argv[0]);
		return -1;
	}
	if (n == 1) return 0;

	awk = open_awk ();
	if (awk == ASE_NULL) goto done;

	app_awk = awk;

	if (ase_awk_parsesimple (awk, ao.isp, ao.ist, ao.osf) == -1)
	{
		ase_printf (
			ASE_T("PARSE ERROR: CODE [%d] LINE [%u] %s\n"),
			ase_awk_geterrnum(awk),
			(unsigned int)ase_awk_geterrlin(awk),
			ase_awk_geterrmsg(awk)
		);
		goto done;
	}

#ifdef _WIN32
	SetConsoleCtrlHandler (stop_run, TRUE);
#else
	signal (SIGINT, stop_run);
#endif

	runcbs.on_start = on_run_start;
	runcbs.on_statement = on_run_statement;
	runcbs.on_return = on_run_return;
	runcbs.on_end = on_run_end;
	runcbs.data = ASE_NULL;

	if (ase_awk_runsimple (awk, ao.icf, &runcbs) == -1)
	{
		ase_printf (
			ASE_T("RUN ERROR: CODE [%d] LINE [%u] %s\n"),
			ase_awk_geterrnum(awk),
			(unsigned int)ase_awk_geterrlin(awk),
			ase_awk_geterrmsg(awk)
		);
		goto done;
	}

	ret = 0;

done:
	if (awk != ASE_NULL)
	{
		/* do not leave a pointer to a closed interpreter behind */
		app_awk = NULL;
		ase_awk_close (awk);
	}

	/* the source-file array is heap-allocated only in file mode */
	if (ao.ist == ASE_AWK_PARSE_FILES && ao.isp != ASE_NULL) free (ao.isp);
	/* ao.osf is deliberately not freed: handle_args() stores the option
	 * argument pointer there, which was not obtained from malloc() */
	if (ao.icf != ASE_NULL) free (ao.icf);
	if (ao.vm != ASE_NULL) ase_map_close (ao.vm);

	return ret;
}
/*
 * Program entry point. Enables the MSVC debug-heap leak check in Windows
 * debug builds, then hands the arguments to ase_runmain(), which invokes
 * awk_main(). Returns whatever ase_runmain() returns.
 */
int ase_main (int argc, ase_achar_t* argv[])
{
	int rc;

#if defined(_WIN32) && defined(_DEBUG) && defined(_MSC_VER)
	_CrtSetDbgFlag (_CRTDBG_LEAK_CHECK_DF | _CRTDBG_ALLOC_MEM_DF);
#endif

	rc = ase_runmain (argc, argv, awk_main);

#if defined(_WIN32) && defined(_DEBUG)
	/*#if defined(_MSC_VER)
	_CrtDumpMemoryLeaks ();
	#endif*/
#endif

	return rc;
}