2009-05-19 22:32:12 +00:00
|
|
|
/*
|
2011-09-21 23:10:09 +00:00
|
|
|
* $Id: sed.h 572 2011-09-21 05:10:09Z hyunghwan.chung $
|
2009-05-19 22:32:12 +00:00
|
|
|
*
|
2011-04-23 08:28:43 +00:00
|
|
|
Copyright 2006-2011 Chung, Hyung-Hwan.
|
2009-09-16 04:01:02 +00:00
|
|
|
This file is part of QSE.
|
2009-05-19 22:32:12 +00:00
|
|
|
|
2009-09-16 04:01:02 +00:00
|
|
|
QSE is free software: you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU Lesser General Public License as
|
|
|
|
published by the Free Software Foundation, either version 3 of
|
|
|
|
the License, or (at your option) any later version.
|
2009-05-19 22:32:12 +00:00
|
|
|
|
2009-09-16 04:01:02 +00:00
|
|
|
QSE is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU Lesser General Public License for more details.
|
2009-05-19 22:32:12 +00:00
|
|
|
|
2009-09-16 04:01:02 +00:00
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
|
|
License along with QSE. If not, see <http://www.gnu.org/licenses/>.
|
2009-05-19 22:32:12 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _QSE_LIB_SED_SED_H_
|
|
|
|
#define _QSE_LIB_SED_SED_H_
|
|
|
|
|
|
|
|
#include <qse/sed/sed.h>
|
|
|
|
#include <qse/cmn/str.h>
|
|
|
|
|
2010-07-15 06:54:48 +00:00
|
|
|
#define QSE_MAP_AS_RBT
|
|
|
|
#include <qse/cmn/map.h>
|
|
|
|
|
2011-09-03 09:27:44 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Define USE_REX to use rex.h on behalf of tre.h
|
|
|
|
* rex.h currently does not support backreference.
|
|
|
|
*/
|
|
|
|
#ifdef USE_REX
|
|
|
|
enum qse_sed_depth_t
|
|
|
|
{
|
|
|
|
QSE_SED_DEPTH_REX_BUILD = (1 << 0),
|
|
|
|
QSE_SED_DEPTH_REX_MATCH = (1 << 1)
|
|
|
|
};
|
2011-09-07 08:18:36 +00:00
|
|
|
typedef enum qse_sed_depth_t qse_sed_depth_t;
|
2011-09-03 09:27:44 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#define QSE_SED_CMD_NOOP QSE_T('\0')
|
|
|
|
#define QSE_SED_CMD_QUIT QSE_T('q')
|
|
|
|
|
2009-05-19 22:32:12 +00:00
|
|
|
typedef struct qse_sed_adr_t qse_sed_adr_t;
|
|
|
|
typedef struct qse_sed_cmd_t qse_sed_cmd_t;
|
2009-05-30 19:19:46 +00:00
|
|
|
typedef struct qse_sed_cmd_blk_t qse_sed_cmd_blk_t;
|
|
|
|
|
|
|
|
struct qse_sed_adr_t
|
|
|
|
{
|
|
|
|
enum
|
|
|
|
{
|
|
|
|
QSE_SED_ADR_NONE, /* no address */
|
|
|
|
QSE_SED_ADR_DOL, /* $ - last line */
|
|
|
|
QSE_SED_ADR_LINE, /* specified line */
|
|
|
|
QSE_SED_ADR_REX, /* lines matching regular expression */
|
|
|
|
QSE_SED_ADR_STEP /* line steps - only in the second address */
|
|
|
|
} type;
|
|
|
|
|
|
|
|
union
|
|
|
|
{
|
|
|
|
qse_size_t lno;
|
|
|
|
void* rex;
|
|
|
|
} u;
|
|
|
|
};
|
|
|
|
|
|
|
|
#define QSE_SED_CMD_QUIT_QUIET QSE_T('Q')
|
|
|
|
#define QSE_SED_CMD_APPEND QSE_T('a')
|
|
|
|
#define QSE_SED_CMD_INSERT QSE_T('i')
|
|
|
|
#define QSE_SED_CMD_CHANGE QSE_T('c')
|
|
|
|
#define QSE_SED_CMD_DELETE QSE_T('d')
|
|
|
|
#define QSE_SED_CMD_DELETE_FIRSTLN QSE_T('D')
|
|
|
|
#define QSE_SED_CMD_PRINT_LNNUM QSE_T('=')
|
|
|
|
#define QSE_SED_CMD_PRINT QSE_T('p')
|
|
|
|
#define QSE_SED_CMD_PRINT_FIRSTLN QSE_T('P')
|
|
|
|
#define QSE_SED_CMD_PRINT_CLEARLY QSE_T('l')
|
|
|
|
#define QSE_SED_CMD_HOLD QSE_T('h')
|
|
|
|
#define QSE_SED_CMD_HOLD_APPEND QSE_T('H')
|
|
|
|
#define QSE_SED_CMD_RELEASE QSE_T('g')
|
|
|
|
#define QSE_SED_CMD_RELEASE_APPEND QSE_T('G')
|
|
|
|
#define QSE_SED_CMD_EXCHANGE QSE_T('x')
|
|
|
|
#define QSE_SED_CMD_NEXT QSE_T('n')
|
|
|
|
#define QSE_SED_CMD_NEXT_APPEND QSE_T('N')
|
|
|
|
#define QSE_SED_CMD_READ_FILE QSE_T('r')
|
|
|
|
#define QSE_SED_CMD_READ_FILELN QSE_T('R')
|
|
|
|
#define QSE_SED_CMD_WRITE_FILE QSE_T('w')
|
|
|
|
#define QSE_SED_CMD_WRITE_FILELN QSE_T('W')
|
|
|
|
#define QSE_SED_CMD_BRANCH QSE_T('b')
|
|
|
|
#define QSE_SED_CMD_BRANCH_COND QSE_T('t')
|
|
|
|
#define QSE_SED_CMD_SUBSTITUTE QSE_T('s')
|
|
|
|
#define QSE_SED_CMD_TRANSLATE QSE_T('y')
|
2011-09-21 23:10:09 +00:00
|
|
|
#define QSE_SED_CMD_CLEAR_PATTERN QSE_T('z')
|
2009-05-30 19:19:46 +00:00
|
|
|
|
|
|
|
struct qse_sed_cmd_t
|
|
|
|
{
|
|
|
|
qse_char_t type;
|
2009-08-26 07:07:54 +00:00
|
|
|
qse_sed_loc_t loc;
|
2009-05-30 19:19:46 +00:00
|
|
|
|
|
|
|
int negated;
|
|
|
|
|
|
|
|
qse_sed_adr_t a1; /* optional start address */
|
|
|
|
qse_sed_adr_t a2; /* optional end address */
|
|
|
|
|
|
|
|
union
|
|
|
|
{
|
|
|
|
/* text for the a, i, c commands */
|
|
|
|
qse_xstr_t text;
|
|
|
|
|
|
|
|
/* file name for r, w, R, W */
|
|
|
|
qse_xstr_t file;
|
|
|
|
|
|
|
|
/* data for the s command */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
void* rex; /* regular expression */
|
|
|
|
qse_xstr_t rpl; /* replacement */
|
|
|
|
|
|
|
|
/* flags */
|
|
|
|
qse_xstr_t file; /* file name for w */
|
|
|
|
unsigned short occ;
|
|
|
|
unsigned short g: 1; /* global */
|
|
|
|
unsigned short p: 1; /* print */
|
|
|
|
unsigned short i: 1; /* case insensitive */
|
|
|
|
} subst;
|
|
|
|
|
|
|
|
/* translation set for the y command */
|
|
|
|
qse_xstr_t transet;
|
|
|
|
|
|
|
|
/* branch target for b and t */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_xstr_t label;
|
|
|
|
qse_sed_cmd_t* target;
|
|
|
|
} branch;
|
|
|
|
} u;
|
|
|
|
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
int a1_matched;
|
|
|
|
int c_ready;
|
2009-05-30 23:29:06 +00:00
|
|
|
|
|
|
|
/* points to the next command for fast traversal and
|
|
|
|
* fast random jumps */
|
|
|
|
qse_sed_cmd_t* next;
|
2009-05-30 19:19:46 +00:00
|
|
|
} state;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct qse_sed_cmd_blk_t
|
|
|
|
{
|
|
|
|
qse_size_t len;
|
2009-05-30 23:29:06 +00:00
|
|
|
qse_sed_cmd_t buf[256];
|
2009-05-30 19:19:46 +00:00
|
|
|
qse_sed_cmd_blk_t* next;
|
|
|
|
};
|
2009-05-19 22:32:12 +00:00
|
|
|
|
|
|
|
/**
|
|
|
|
* The qse_sed_t type defines a stream editor
|
|
|
|
*/
|
|
|
|
struct qse_sed_t
|
|
|
|
{
|
|
|
|
QSE_DEFINE_COMMON_FIELDS (sed)
|
|
|
|
|
2009-05-28 07:55:17 +00:00
|
|
|
qse_sed_errstr_t errstr; /**< error string getter */
|
2009-05-19 22:32:12 +00:00
|
|
|
qse_sed_errnum_t errnum; /**< stores an error number */
|
2009-05-22 00:17:17 +00:00
|
|
|
qse_char_t errmsg[128]; /**< error message holder */
|
2009-08-26 21:03:51 +00:00
|
|
|
qse_sed_loc_t errloc; /**< location of the last error */
|
2009-05-22 00:17:17 +00:00
|
|
|
|
2009-05-19 22:32:12 +00:00
|
|
|
int option; /**< stores options */
|
|
|
|
|
2009-09-03 06:55:55 +00:00
|
|
|
qse_sed_lformatter_t lformatter;
|
|
|
|
|
2009-05-30 23:29:06 +00:00
|
|
|
struct
|
|
|
|
{
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_size_t build;
|
|
|
|
qse_size_t match;
|
|
|
|
} rex;
|
|
|
|
} depth;
|
|
|
|
|
2009-05-19 22:32:12 +00:00
|
|
|
/** source text pointers */
|
|
|
|
struct
|
|
|
|
{
|
2009-08-26 07:07:54 +00:00
|
|
|
qse_sed_loc_t loc; /**< location */
|
2009-05-23 19:21:10 +00:00
|
|
|
qse_cint_t cc; /**< last character read */
|
2009-05-19 22:32:12 +00:00
|
|
|
const qse_char_t* ptr; /**< beginning of the source text */
|
|
|
|
const qse_char_t* end; /**< end of the source text */
|
|
|
|
const qse_char_t* cur; /**< current source text pointer */
|
|
|
|
} src;
|
|
|
|
|
2009-05-25 07:29:12 +00:00
|
|
|
/** temporary data for compiling */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_str_t rex; /**< regular expression buffer */
|
|
|
|
qse_str_t lab; /**< label name buffer */
|
|
|
|
|
|
|
|
/** data structure to compile command groups */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
/** current level of command group nesting */
|
|
|
|
int level;
|
|
|
|
/** keeps track of the begining of nested groups */
|
|
|
|
qse_sed_cmd_t* cmd[128];
|
|
|
|
} grp;
|
|
|
|
|
|
|
|
/** a table storing labels seen */
|
2010-07-15 06:54:48 +00:00
|
|
|
qse_map_t labs;
|
2009-05-25 07:29:12 +00:00
|
|
|
} tmp;
|
2009-05-19 22:32:12 +00:00
|
|
|
|
|
|
|
/** compiled commands */
|
2009-05-30 19:19:46 +00:00
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_sed_cmd_blk_t fb; /**< the first block is static */
|
|
|
|
qse_sed_cmd_blk_t* lb; /**< points to the last block */
|
2009-05-30 23:29:06 +00:00
|
|
|
|
|
|
|
qse_sed_cmd_t quit;
|
2011-09-09 01:49:53 +00:00
|
|
|
qse_sed_cmd_t quit_quiet;
|
2009-05-30 23:29:06 +00:00
|
|
|
qse_sed_cmd_t again;
|
|
|
|
qse_sed_cmd_t over;
|
2009-05-30 19:19:46 +00:00
|
|
|
} cmd;
|
|
|
|
|
2009-05-19 22:32:12 +00:00
|
|
|
/** data for execution */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
/** data needed for output streams and files */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_sed_io_fun_t fun; /**< an output handler */
|
|
|
|
qse_sed_io_arg_t arg; /**< output handling data */
|
|
|
|
|
|
|
|
qse_char_t buf[2048];
|
|
|
|
qse_size_t len;
|
|
|
|
int eof;
|
|
|
|
|
|
|
|
/*****************************************************/
|
|
|
|
/* the following two fields are very tightly-coupled.
|
|
|
|
* don't make any partial changes */
|
2010-07-15 06:54:48 +00:00
|
|
|
qse_map_t files;
|
2009-05-19 22:32:12 +00:00
|
|
|
qse_sed_t* files_ext;
|
|
|
|
/*****************************************************/
|
|
|
|
} out;
|
|
|
|
|
|
|
|
/** data needed for input streams */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
qse_sed_io_fun_t fun; /**< an input handler */
|
|
|
|
qse_sed_io_arg_t arg; /**< input handling data */
|
|
|
|
|
|
|
|
qse_char_t xbuf[1]; /**< a read-ahead buffer */
|
|
|
|
int xbuf_len; /**< data length in the buffer */
|
|
|
|
|
|
|
|
qse_char_t buf[2048]; /**< input buffer */
|
|
|
|
qse_size_t len; /**< data length in the buffer */
|
|
|
|
qse_size_t pos; /**< current position in the buffer */
|
|
|
|
int eof; /**< EOF indicator */
|
|
|
|
|
|
|
|
qse_str_t line; /**< pattern space */
|
|
|
|
qse_size_t num; /**< current line number */
|
|
|
|
} in;
|
|
|
|
|
|
|
|
/** text buffers */
|
|
|
|
struct
|
|
|
|
{
|
2011-09-20 22:40:45 +00:00
|
|
|
qse_str_t append;
|
2011-09-18 09:41:26 +00:00
|
|
|
qse_str_t hold; /* hold space */
|
2009-05-19 22:32:12 +00:00
|
|
|
qse_str_t subst;
|
|
|
|
} txt;
|
|
|
|
|
|
|
|
/** indicates if a successful substitution has been made
|
|
|
|
* since the last read on the input stream. */
|
|
|
|
int subst_done;
|
2011-09-07 08:18:36 +00:00
|
|
|
void* last_rex;
|
2011-09-20 22:40:45 +00:00
|
|
|
|
|
|
|
/** stop requested */
|
|
|
|
int stopreq;
|
2009-05-19 22:32:12 +00:00
|
|
|
} e;
|
|
|
|
};
|
|
|
|
|
2009-06-23 07:01:28 +00:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
2011-09-03 09:27:44 +00:00
|
|
|
int qse_sed_init (
|
|
|
|
qse_sed_t* sed,
|
|
|
|
qse_mmgr_t* mmgr
|
|
|
|
);
|
|
|
|
|
|
|
|
void qse_sed_fini (
|
|
|
|
qse_sed_t* sed
|
|
|
|
);
|
|
|
|
|
|
|
|
const qse_char_t* qse_sed_dflerrstr (
|
|
|
|
qse_sed_t* sed,
|
|
|
|
qse_sed_errnum_t errnum
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef USE_REX
|
|
|
|
/**
|
|
|
|
* The qse_sed_getmaxdepth() gets the maximum processing depth.
|
|
|
|
*/
|
|
|
|
qse_size_t qse_sed_getmaxdepth (
|
|
|
|
qse_sed_t* sed, /**< stream editor */
|
|
|
|
qse_sed_depth_t id /**< one of qse_sed_depth_t values */
|
|
|
|
);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The qse_sed_setmaxdepth() sets the maximum processing depth.
|
|
|
|
*/
|
|
|
|
void qse_sed_setmaxdepth (
|
|
|
|
qse_sed_t* sed, /**< stream editor */
|
|
|
|
int ids, /**< 0 or a number OR'ed of #qse_sed_depth_t values */
|
|
|
|
qse_size_t depth /**< maximum depth level */
|
|
|
|
);
|
|
|
|
#endif
|
2009-06-23 07:01:28 +00:00
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
|
|
|
#endif
|
2009-10-05 08:08:27 +00:00
|
|
|
|
2009-05-19 22:32:12 +00:00
|
|
|
#endif
|