520 lines
14 KiB
C
520 lines
14 KiB
C
/*
|
|
* $Id$
|
|
*
|
|
Copyright (c) 2014-2015 Chung, Hyung-Hwan. All rights reserved.
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
modification, are permitted provided that the following conditions
|
|
are met:
|
|
1. Redistributions of source code must retain the above copyright
|
|
notice, this list of conditions and the following disclaimer.
|
|
2. Redistributions in binary form must reproduce the above copyright
|
|
notice, this list of conditions and the following disclaimer in the
|
|
documentation and/or other materials provided with the distribution.
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE AUTHOR "AS IS" AND ANY EXPRESS OR
|
|
IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
|
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
|
NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
|
THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#ifndef _STIX_PRV_H_
|
|
#define _STIX_PRV_H_
|
|
|
|
#include "stix.h"
|
|
|
|
/* Debugging aid: when STIX_SUPPORT_GC_DURING_IGNITION is defined,
 * stix_gc() can be called while stix has not been fully initialized. */
#define STIX_SUPPORT_GC_DURING_IGNITION

/* NOTE(review): presumably enables extra GC debugging code; no use of this
 * macro is visible in this header - confirm against the GC implementation. */
#define STIX_DEBUG_GC_1
|
|
|
|
|
|
#include <stdio.h> /* TODO: delete these header inclusion lines */
|
|
#include <string.h>
|
|
#include <assert.h>
|
|
|
|
/* Thin wrappers over the C library. They exist so that the library calls
 * are made through a single, replaceable name. */

/* Fills the first 'size' bytes at 'dst' with the byte value 'val'. */
#define STIX_MEMSET(dst,val,size) memset((dst),(val),(size))

/* Copies 'size' bytes from 'src' to 'dst'. As with memcpy(), the two
 * regions must not overlap. */
#define STIX_MEMCPY(dst,src,size) memcpy((dst),(src),(size))

/* Aborts via assert() when 'x' is false; compiled out when NDEBUG is defined. */
#define STIX_ASSERT(x) assert(x)
|
|
|
|
/* Rounds the non-negative integer x up to the nearest multiple of y.
 * y is evaluated more than once, so it must be free of side effects. */
#define STIX_ALIGN(x,y) \
	(((x) + (y) - 1) / (y) * (y))
|
|
|
|
|
|
/* ========================================================================= */
|
|
/* CLASS SPEC ENCODING */
|
|
/* ========================================================================= */
|
|
|
|
/*
|
|
* The spec field of a class object encodes the number of the fixed part
|
|
* and the type of the indexed part. The fixed part is the number of
|
|
* named instance variables. If the spec of a class is indexed, the object
|
|
* of the class can be instantiated with the size of the indexed part.
|
|
*
|
|
* For example, on a platform where sizeof(stix_oow_t) is 4,
|
|
* the layout of the spec field of a class as an OOP value looks like this:
|
|
*
|
|
* 31 10 9 8 7 6 5 4 3 2 1 0
|
|
* |number of named instance variables|indexed-type|indexability|oop-tag|
|
|
*
|
|
* the number of named instance variables is stored in high 23 bits.
|
|
* the indexed type takes up bit 3 to bit 8. And the indexability is
|
|
* stored in bit 2.
|
|
*
|
|
* The maximum number of named(fixed) instance variables for a class is:
|
|
* 2 ^ ((BITS-IN-OOW - STIX_OOP_TAG_BITS) - STIX_OBJ_FLAGS_TYPE_BITS - 1) - 1
|
|
*
|
|
* STIX_OOP_TAG_BITS are decremented from the number of bits in OOW because
|
|
* the spec field is always encoded as a small integer.
|
|
*
|
|
* The number of named instance variables can be greater than 0 if the
|
|
* class spec is not indexed or if it's a pointer indexed class
|
|
* (indexed_type == STIX_OBJ_TYPE_OOP)
|
|
*
|
|
* indexed_type is one of the #stix_obj_type_t enumerators.
|
|
*/
|
|
|
|
/*
 * The STIX_CLASS_SPEC_MAKE() macro creates a class spec value.
 *  _class->spec = STIX_OOP_FROM_SMINT(STIX_CLASS_SPEC_MAKE(0, 1, STIX_OBJ_TYPE_CHAR));
 *
 * Layout of the result, starting from the least significant bit:
 *  - bit 0: is_indexed (only its lowest bit is kept)
 *  - the next STIX_OBJ_FLAGS_TYPE_BITS bits: indexed_type
 *  - the remaining high bits: named_instvar
 *
 * indexed_type is not masked here, so the caller must pass a value that
 * fits in STIX_OBJ_FLAGS_TYPE_BITS bits.
 */
#define STIX_CLASS_SPEC_MAKE(named_instvar,is_indexed,indexed_type) ( \
	(((stix_oow_t)(named_instvar)) << (STIX_OBJ_FLAGS_TYPE_BITS + 1)) | \
	(((stix_oow_t)(indexed_type)) << 1) | \
	(((stix_oow_t)(is_indexed)) & 1) )
|
|
|
|
/* Extracts the number of named instance variables from a class spec value.
 * It is the part above the indexability bit and the indexed-type bits.
 *  STIX_CLASS_SPEC_NAMED_INSTVAR(STIX_OOP_TO_SMINT(_class->spec))
 */
#define STIX_CLASS_SPEC_NAMED_INSTVAR(spec) \
	(((stix_oow_t)(spec)) >> (STIX_OBJ_FLAGS_TYPE_BITS + 1))
|
|
|
|
/* Is it a user-indexable class?
 * All objects can be indexed with basicAt:.
 * This indicates if an object can be instantiated with a dynamic size
 * (new: size) and can be indexed with at:.
 * The flag is the lowest bit of the spec value.
 */
#define STIX_CLASS_SPEC_IS_INDEXED(spec) (((stix_oow_t)(spec)) & 1)
|
|
|
|
/* If the class is indexed, what is the indexing type? character? pointer? etc?
 * The value occupies STIX_OBJ_FLAGS_TYPE_BITS bits right above the
 * indexability bit of the spec value. */
#define STIX_CLASS_SPEC_INDEXED_TYPE(spec) \
	((((stix_oow_t)(spec)) >> 1) & STIX_LBMASK(stix_oow_t, STIX_OBJ_FLAGS_TYPE_BITS))
|
|
|
|
/* What is the maximum number of named instance variables?
 *   2 ^ ((BITS-IN-OOW - STIX_OOP_TAG_BITS) - STIX_OBJ_FLAGS_TYPE_BITS - 1) - 1
 * This limit is set because the number must be encoded into the spec field
 * of the class, where only a limited number of bits is assigned to the
 * number of named instance variables.
 */
#define STIX_MAX_NAMED_INSTVARS \
	STIX_BITS_MAX(stix_oow_t, STIX_OOW_BITS - STIX_OOP_TAG_BITS - (STIX_OBJ_FLAGS_TYPE_BITS + 1))
|
|
|
|
/* Given the number of named instance variables, what is the maximum number
 * of indexed instance variables? The number of indexed instance variables
 * is not stored in the spec field of the class. It only affects the actual
 * size of an object(obj->_size) selectively combined with the number of
 * named instance variables. So it's the maximum value of obj->_size minus
 * the number of named instance variables.
 *
 * The argument is parenthesized so that an expression such as a + b is
 * subtracted as a whole.
 */
#define STIX_MAX_INDEXED_INSTVARS(named_instvar) ((~(stix_oow_t)0) - (named_instvar))
|
|
|
|
|
|
#if defined(STIX_INCLUDE_COMPILER)
|
|
|
|
/* ========================================================================= */
|
|
/* SOURCE CODE I/O FOR COMPILER */
|
|
/* ========================================================================= */
|
|
|
|
/**
 * The stix_iocmd_t type enumerates the commands passed to a source stream
 * handler of the #stix_ioimpl_t type.
 */
enum stix_iocmd_t
{
	STIX_IO_OPEN,  /**< open a stream */
	STIX_IO_CLOSE, /**< close a stream */
	STIX_IO_READ   /**< read from a stream */
};
typedef enum stix_iocmd_t stix_iocmd_t;
|
|
|
|
struct stix_ioloc_t
|
|
{
|
|
unsigned long line; /**< line */
|
|
unsigned long colm; /**< column */
|
|
const stix_uch_t* file; /**< file specified in #include */
|
|
};
|
|
typedef struct stix_ioloc_t stix_ioloc_t;
|
|
|
|
struct stix_iolxc_t
|
|
{
|
|
stix_uci_t c; /**< character */
|
|
stix_ioloc_t l; /**< location */
|
|
};
|
|
typedef struct stix_iolxc_t stix_iolxc_t;
|
|
|
|
/**
 * The stix_ioarg_flag_t type defines bit flags for an I/O argument.
 * NOTE(review): no field of stix_ioarg_t visible here stores these flags;
 * confirm where STIX_IO_INCLUDED is used.
 */
enum stix_ioarg_flag_t
{
	STIX_IO_INCLUDED = (1 << 0)
};
typedef enum stix_ioarg_flag_t stix_ioarg_flag_t;
|
|
|
|
typedef struct stix_ioarg_t stix_ioarg_t;
|
|
struct stix_ioarg_t
|
|
{
|
|
/**
|
|
* [IN] I/O object name.
|
|
* It is #STIX_NULL for the main stream and points to a non-NULL string
|
|
* for an included stream.
|
|
*/
|
|
const stix_uch_t* name;
|
|
|
|
/**
|
|
* [OUT] I/O handle set by a handler.
|
|
* The source stream handler can set this field when it opens a stream.
|
|
* All subsequent operations on the stream see this field as set
|
|
* during opening.
|
|
*/
|
|
void* handle;
|
|
|
|
/**
|
|
* [OUT] place data here
|
|
*/
|
|
stix_uch_t buf[1024];
|
|
|
|
/**
|
|
* [IN] points to the data of the includer. It is #STIX_NULL for the
|
|
* main stream.
|
|
*/
|
|
stix_ioarg_t* includer;
|
|
|
|
/*-----------------------------------------------------------------*/
|
|
/*----------- from here down, internal use only -------------------*/
|
|
struct
|
|
{
|
|
int pos, len;
|
|
} b;
|
|
|
|
unsigned long line;
|
|
unsigned long colm;
|
|
|
|
stix_iolxc_t lxc;
|
|
/*-----------------------------------------------------------------*/
|
|
};
|
|
|
|
/**
 * The stix_ioimpl_t type defines a source stream handler. It is given the
 * command \a cmd to perform on the stream described by \a arg.
 * NOTE(review): the meaning of the #stix_ssize_t return value is not
 * visible in this header - confirm against the caller in comp.c.
 */
typedef stix_ssize_t (*stix_ioimpl_t) (
	stix_t*       stix,
	stix_iocmd_t  cmd,
	stix_ioarg_t* arg
);
|
|
|
|
|
|
|
|
|
|
struct stix_iotok_t
|
|
{
|
|
enum
|
|
{
|
|
STIX_IOTOK_EOF,
|
|
STIX_IOTOK_CHRLIT,
|
|
STIX_IOTOK_STRLIT,
|
|
STIX_IOTOK_SYMLIT,
|
|
STIX_IOTOK_NUMLIT,
|
|
STIX_IOTOK_IDENT,
|
|
STIX_IOTOK_BINSEL,
|
|
STIX_IOTOK_KEYWORD,
|
|
STIX_IOTOK_PRIMITIVE,
|
|
STIX_IOTOK_ASSIGN,
|
|
STIX_IOTOK_COLON,
|
|
STIX_IOTOK_RETURN,
|
|
STIX_IOTOK_LBRACE,
|
|
STIX_IOTOK_RBRACE,
|
|
STIX_IOTOK_LBRACK,
|
|
STIX_IOTOK_RBRACK,
|
|
STIX_IOTOK_LPAREN,
|
|
STIX_IOTOK_RPAREN,
|
|
STIX_IOTOK_APAREN, /* #( */
|
|
STIX_IOTOK_BPAREN, /* #[ */
|
|
STIX_IOTOK_PERIOD,
|
|
STIX_IOTOK_SEMICOLON
|
|
} type;
|
|
|
|
stix_ucs_t name;
|
|
stix_size_t name_capa;
|
|
|
|
stix_ioloc_t loc;
|
|
};
|
|
typedef struct stix_iotok_t stix_iotok_t;
|
|
|
|
/**
 * The stix_synerrnum_t type enumerates syntax error numbers.
 */
enum stix_synerrnum_t
{
	STIX_SYNERR_NOERR,
	STIX_SYNERR_ILCHR, /* illegal character */
	STIX_SYNERR_CMTNC, /* comment not closed */
	STIX_SYNERR_STRNC, /* string not closed */
	STIX_SYNERR_CLTNT, /* character literal not terminated */
	STIX_SYNERR_HLTNT, /* hashed literal not terminated */
	STIX_SYNERR_CLNMS  /* colon missing */
};
typedef enum stix_synerrnum_t stix_synerrnum_t;
|
|
|
|
typedef struct stix_iolink_t stix_iolink_t;

/**
 * The stix_iolink_t type is a node of a singly linked list. It holds
 * nothing but the pointer to another node.
 */
struct stix_iolink_t
{
	stix_iolink_t* link;
};
|
|
|
|
struct stix_synerr_t
|
|
{
|
|
stix_synerrnum_t num;
|
|
stix_ioloc_t loc;
|
|
stix_ucs_t tgt;
|
|
};
|
|
typedef struct stix_synerr_t stix_synerr_t;
|
|
|
|
struct stix_compiler_t
|
|
{
|
|
/* input handler */
|
|
stix_ioimpl_t impl;
|
|
|
|
/* information about the last meaningful character read.
|
|
* this is a copy of curinp->lxc if no ungetting is performed.
|
|
* if there is something in the unget buffer, this is overwritten
|
|
* by a value from the buffer when the request to read a character
|
|
* is served */
|
|
stix_iolxc_t lxc;
|
|
|
|
/* unget buffer */
|
|
stix_iolxc_t ungot[10];
|
|
int nungots;
|
|
|
|
/* static input data buffer */
|
|
stix_ioarg_t arg;
|
|
|
|
/* pointer to the current input data. initially, it points to &arg */
|
|
stix_ioarg_t* curinp;
|
|
|
|
/* the last token read */
|
|
stix_iotok_t tok;
|
|
|
|
stix_iolink_t* io_names;
|
|
|
|
stix_synerr_t synerr;
|
|
|
|
/* temporary space to handle an illegal character */
|
|
stix_uch_t ilchr;
|
|
stix_ucs_t ilchr_ucs;
|
|
};
|
|
|
|
#endif
|
|
|
|
|
|
#if defined(__cplusplus)
|
|
extern "C" {
|
|
#endif
|
|
|
|
/* ========================================================================= */
|
|
/* heap.c */
|
|
/* ========================================================================= */
|
|
|
|
/**
|
|
* The stix_makeheap() function creates a new heap of the \a size bytes.
|
|
*
|
|
* \return heap pointer on success and #STIX_NULL on failure.
|
|
*/
|
|
stix_heap_t* stix_makeheap (
|
|
stix_t* stix,
|
|
stix_size_t size
|
|
);
|
|
|
|
/**
|
|
* The stix_killheap() function destroys the heap pointed to by \a heap.
|
|
*/
|
|
void stix_killheap (
|
|
stix_t* stix,
|
|
stix_heap_t* heap
|
|
);
|
|
|
|
/**
|
|
* The stix_allocheapmem() function allocates \a size bytes in the heap pointed
|
|
* to by \a heap.
|
|
*
|
|
* \return memory pointer on success and #STIX_NULL on failure.
|
|
*/
|
|
void* stix_allocheapmem (
|
|
stix_t* stix,
|
|
stix_heap_t* heap,
|
|
stix_size_t size
|
|
);
|
|
|
|
|
|
/* ========================================================================= */
|
|
/* stix.c */
|
|
/* ========================================================================= */
|
|
stix_oow_t stix_hashbytes (
|
|
const stix_uint8_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
stix_oow_t stix_hashchars (
|
|
const stix_uch_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
int stix_equalchars (
|
|
const stix_uch_t* str1,
|
|
const stix_uch_t* str2,
|
|
stix_oow_t len
|
|
);
|
|
|
|
/* ========================================================================= */
|
|
/* obj.c */
|
|
/* ========================================================================= */
|
|
void* stix_allocbytes (
|
|
stix_t* stix,
|
|
stix_size_t size
|
|
);
|
|
|
|
/**
|
|
* The stix_allocoopobj() function allocates a raw object composed of \a size
|
|
* pointer fields excluding the header.
|
|
*/
|
|
stix_oop_t stix_allocoopobj (
|
|
stix_t* stix,
|
|
stix_oow_t size
|
|
);
|
|
|
|
stix_oop_t stix_alloccharobj (
|
|
stix_t* stix,
|
|
const stix_uch_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
stix_oop_t stix_allocuint8obj (
|
|
stix_t* stix,
|
|
const stix_uint8_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
stix_oop_t stix_allocuint16obj (
|
|
stix_t* stix,
|
|
const stix_uint16_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
/* ========================================================================= */
|
|
/* sym.c */
|
|
/* ========================================================================= */
|
|
stix_oop_t stix_makesymbol (
|
|
stix_t* stix,
|
|
const stix_uch_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
stix_oop_t stix_findsymbol (
|
|
stix_t* stix,
|
|
const stix_uch_t* ptr,
|
|
stix_oow_t len
|
|
);
|
|
|
|
/* ========================================================================= */
|
|
/* dic.c */
|
|
/* ========================================================================= */
|
|
stix_oop_t stix_putatsysdic (
|
|
stix_t* stix,
|
|
stix_oop_t key,
|
|
stix_oop_t value
|
|
);
|
|
|
|
stix_oop_t stix_getatsysdic (
|
|
stix_t* stix,
|
|
stix_oop_t key
|
|
);
|
|
|
|
/* ========================================================================= */
|
|
/* utf8.c */
|
|
/* ========================================================================= */
|
|
stix_size_t stix_uctoutf8 (
|
|
stix_uch_t uc,
|
|
stix_bch_t* utf8,
|
|
stix_size_t size
|
|
);
|
|
|
|
stix_size_t stix_utf8touc (
|
|
const stix_bch_t* utf8,
|
|
stix_size_t size,
|
|
stix_uch_t* uc
|
|
);
|
|
|
|
int stix_ucstoutf8 (
|
|
const stix_uch_t* ucs,
|
|
stix_size_t* ucslen,
|
|
stix_bch_t* bcs,
|
|
stix_size_t* bcslen
|
|
);
|
|
|
|
/**
|
|
* The stix_utf8toucs() function converts a UTF8 string to a uncide string.
|
|
*
|
|
* It never returns -2 if \a ucs is #STIX_NULL.
|
|
*
|
|
* \code
|
|
* const stix_bch_t* bcs = "test string";
|
|
* stix_uch_t ucs[100];
|
|
* qse_size_t ucslen = STIX_COUNTOF(buf), n;
|
|
* qse_size_t bcslen = 11;
|
|
* int n;
|
|
* n = qse_bcstoucs (bcs, &bcslen, ucs, &ucslen);
|
|
* if (n <= -1) { invalid/incomplenete sequence or buffer to small }
|
|
* \endcode
|
|
*
|
|
* For a null-terminated string, you can specify ~(stix_size_t)0 in
|
|
* \a bcslen. The destination buffer \a ucs also must be large enough to
|
|
* store a terminating null. Otherwise, -2 is returned.
|
|
*
|
|
* The resulting \a ucslen can still be greater than 0 even if the return
|
|
* value is negative. The value indiates the number of characters converted
|
|
* before the error has occurred.
|
|
*
|
|
* \return 0 on success.
|
|
* -1 if \a bcs contains an illegal character.
|
|
* -2 if the wide-character string buffer is too small.
|
|
* -3 if \a bcs is not a complete sequence.
|
|
*/
|
|
int stix_utf8toucs (
|
|
const stix_bch_t* bcs,
|
|
stix_size_t* bcslen,
|
|
stix_uch_t* ucs,
|
|
stix_size_t* ucslen
|
|
);
|
|
|
|
|
|
/**
|
|
* The stix_ucslen() function returns the number of characters before
|
|
* a terminating null.
|
|
*/
|
|
/*
|
|
stix_size_t stix_ucslen (
|
|
const stix_uch_t* ucs
|
|
);
|
|
*/
|
|
|
|
/* ========================================================================= */
|
|
/* comp.c */
|
|
/* ========================================================================= */
|
|
/* stix_ioimpl_t and stix_synerr_t are declared in this header only when
 * STIX_INCLUDE_COMPILER is defined. The prototypes that use them are placed
 * under the same condition so that the header stays usable without it. */
#if defined(STIX_INCLUDE_COMPILER)

/**
 * The stix_compile() function takes the source stream handler \a io.
 * NOTE(review): presumably compiles the source read through \a io; the
 * return value convention is not visible here - confirm against comp.c.
 */
int stix_compile (
	stix_t*       stix,
	stix_ioimpl_t io
);

/**
 * The stix_getsynerr() function takes a pointer \a synerr to a
 * caller-supplied #stix_synerr_t object.
 * NOTE(review): presumably stores the last syntax error there - confirm
 * against comp.c.
 */
void stix_getsynerr (
	stix_t*        stix,
	stix_synerr_t* synerr
);

#endif
|
|
|
|
#if defined(__cplusplus)
|
|
}
|
|
#endif
|
|
|
|
|
|
#endif
|