hio/mio/lib/mio-utl.h

436 lines
12 KiB
C

/*
* $Id$
*
Copyright (c) 2014-2018 Chung, Hyung-Hwan. All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
1. Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
2. Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
THIS SOFTWARE IS PROVIDED BY THE AUTHOR "AS IS" AND ANY EXPRESS OR
IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef _MIO_UTL_H_
#define _MIO_UTL_H_
#include "mio-cmn.h"
/*
 * MIO_CONST_SWAP16(x) converts x to mio_uint16_t and exchanges its two
 * bytes. The result has type mio_uint16_t. Only casts, shifts and a
 * bitwise OR are used, so the expansion is a constant expression whenever
 * x is one. x is expanded twice - do not pass expressions with side effects.
 */
#define MIO_CONST_SWAP16(x) \
	((mio_uint16_t)( \
		((mio_uint16_t)(x) << 8) | \
		((mio_uint16_t)(x) >> 8) \
	))
/*
 * MIO_CONST_SWAP32(x) converts x to mio_uint32_t and reverses the order of
 * its four bytes. The result has type mio_uint32_t. The expansion is a
 * constant expression whenever x is one. x is expanded four times - do not
 * pass expressions with side effects.
 */
#define MIO_CONST_SWAP32(x) \
	((mio_uint32_t)( \
		 ((mio_uint32_t)(x) << 24) | \
		(((mio_uint32_t)(x) <<  8) & (mio_uint32_t)0x00ff0000UL) | \
		(((mio_uint32_t)(x) >>  8) & (mio_uint32_t)0x0000ff00UL) | \
		 ((mio_uint32_t)(x) >> 24) \
	))
/*
 * Compile-time byte-order conversion for 16-bit and 32-bit values.
 *
 * On a little-endian host (MIO_ENDIAN_LITTLE) the macros swap bytes with
 * MIO_CONST_SWAP16()/MIO_CONST_SWAP32(). On a big-endian host
 * (MIO_ENDIAN_BIG) no swapping is required, but the argument is still
 * converted to mio_uint16_t/mio_uint32_t so that the result type and the
 * truncation of out-of-range arguments are the same on both kinds of
 * hosts. Without the cast the big-endian expansion would keep the type of
 * the argument (e.g. int for a plain literal) while the little-endian
 * expansion would always yield the fixed-width unsigned type.
 *
 * The build must define exactly one of MIO_ENDIAN_LITTLE and
 * MIO_ENDIAN_BIG; otherwise compilation stops with an error.
 */
#if defined(MIO_ENDIAN_LITTLE)
#	define MIO_CONST_NTOH16(x) MIO_CONST_SWAP16(x)
#	define MIO_CONST_HTON16(x) MIO_CONST_SWAP16(x)
#	define MIO_CONST_NTOH32(x) MIO_CONST_SWAP32(x)
#	define MIO_CONST_HTON32(x) MIO_CONST_SWAP32(x)
#elif defined(MIO_ENDIAN_BIG)
#	define MIO_CONST_NTOH16(x) ((mio_uint16_t)(x))
#	define MIO_CONST_HTON16(x) ((mio_uint16_t)(x))
#	define MIO_CONST_NTOH32(x) ((mio_uint32_t)(x))
#	define MIO_CONST_HTON32(x) ((mio_uint32_t)(x))
#else
#	error UNKNOWN ENDIAN
#endif
#ifdef __cplusplus
extern "C" {
#endif
/**
 * The mio_equal_uchars() function determines equality of two strings
 * of the same length \a len.
 *
 * \a str1 and \a str2 are read-only #mio_uch_t sequences and \a len is the
 * number of characters to examine in each of them.
 *
 * NOTE(review): this header does not show which int value denotes
 * "equal" - confirm against the implementation before relying on it.
 */
MIO_EXPORT int mio_equal_uchars (
const mio_uch_t* str1,
const mio_uch_t* str2,
mio_oow_t len
);
/**
 * The mio_equal_bchars() function is declared with the same parameter
 * layout as mio_equal_uchars() but operates on #mio_bch_t sequences:
 * two read-only strings \a str1 and \a str2 and a single length \a len.
 *
 * NOTE(review): presumably it follows the same contract as
 * mio_equal_uchars(); the meaning of the int result is not visible in
 * this header - confirm against the implementation.
 */
MIO_EXPORT int mio_equal_bchars (
const mio_bch_t* str1,
const mio_bch_t* str2,
mio_oow_t len
);
/**
 * The mio_comp_uchars() function compares the #mio_uch_t sequence \a str1
 * of the length \a len1 with the #mio_uch_t sequence \a str2 of the
 * length \a len2. Neither sequence is modified.
 *
 * NOTE(review): the sign convention of the int result is not visible in
 * this header - presumably negative/zero/positive like strcmp(); confirm
 * against the implementation.
 */
MIO_EXPORT int mio_comp_uchars (
const mio_uch_t* str1,
mio_oow_t len1,
const mio_uch_t* str2,
mio_oow_t len2
);
/**
 * The mio_comp_bchars() function is the #mio_bch_t counterpart of
 * mio_comp_uchars(): it takes two read-only sequences, each with its own
 * length.
 *
 * NOTE(review): result convention not visible here - confirm against the
 * implementation.
 */
MIO_EXPORT int mio_comp_bchars (
const mio_bch_t* str1,
mio_oow_t len1,
const mio_bch_t* str2,
mio_oow_t len2
);
/**
 * The mio_comp_ucstr() function compares two read-only #mio_uch_t strings.
 * No length is passed.
 *
 * NOTE(review): presumably both strings must be null-terminated and the
 * result is negative/zero/positive like strcmp() - confirm against the
 * implementation.
 */
MIO_EXPORT int mio_comp_ucstr (
const mio_uch_t* str1,
const mio_uch_t* str2
);
/**
 * The mio_comp_bcstr() function compares two read-only #mio_bch_t strings.
 * No length is passed.
 *
 * NOTE(review): presumably both strings must be null-terminated - confirm
 * against the implementation.
 */
MIO_EXPORT int mio_comp_bcstr (
const mio_bch_t* str1,
const mio_bch_t* str2
);
/**
 * The mio_comp_ucstr_bcstr() function compares a read-only #mio_uch_t
 * string \a str1 with a read-only #mio_bch_t string \a str2. No length is
 * passed.
 *
 * NOTE(review): how characters of the two different types are matched
 * against each other is not visible in this header - confirm against the
 * implementation.
 */
MIO_EXPORT int mio_comp_ucstr_bcstr (
const mio_uch_t* str1,
const mio_bch_t* str2
);
/**
 * The four functions below compare a sequence \a str1 whose length is
 * given explicitly by \a len with a second string \a str2 that is passed
 * without a length. They differ only in the character types of the two
 * operands:
 *
 * - mio_comp_uchars_ucstr(): #mio_uch_t sequence vs #mio_uch_t string
 * - mio_comp_uchars_bcstr(): #mio_uch_t sequence vs #mio_bch_t string
 * - mio_comp_bchars_bcstr(): #mio_bch_t sequence vs #mio_bch_t string
 * - mio_comp_bchars_ucstr(): #mio_bch_t sequence vs #mio_uch_t string
 *
 * NOTE(review): presumably \a str2 must be null-terminated and the result
 * is negative/zero/positive like strcmp() - neither is visible in this
 * header; confirm against the implementation.
 */
MIO_EXPORT int mio_comp_uchars_ucstr (
const mio_uch_t* str1,
mio_oow_t len,
const mio_uch_t* str2
);
MIO_EXPORT int mio_comp_uchars_bcstr (
const mio_uch_t* str1,
mio_oow_t len,
const mio_bch_t* str2
);
MIO_EXPORT int mio_comp_bchars_bcstr (
const mio_bch_t* str1,
mio_oow_t len,
const mio_bch_t* str2
);
MIO_EXPORT int mio_comp_bchars_ucstr (
const mio_bch_t* str1,
mio_oow_t len,
const mio_uch_t* str2
);
/**
 * The mio_copy_uchars() function takes a writable #mio_uch_t buffer
 * \a dst, a read-only #mio_uch_t source \a src and a count \a len.
 * It returns nothing.
 *
 * NOTE(review): presumably exactly \a len characters are copied and no
 * terminating null is appended; behavior for overlapping buffers is not
 * visible in this header - confirm against the implementation.
 */
MIO_EXPORT void mio_copy_uchars (
mio_uch_t* dst,
const mio_uch_t* src,
mio_oow_t len
);
/**
 * The mio_copy_bchars() function is the #mio_bch_t counterpart of
 * mio_copy_uchars(), with the same parameter layout.
 */
MIO_EXPORT void mio_copy_bchars (
mio_bch_t* dst,
const mio_bch_t* src,
mio_oow_t len
);
/**
 * The mio_copy_bchars_to_uchars() function takes a writable #mio_uch_t
 * buffer \a dst, a read-only #mio_bch_t source \a src and a count \a len.
 *
 * NOTE(review): presumably each source character is widened individually
 * without any encoding conversion - confirm against the implementation.
 */
MIO_EXPORT void mio_copy_bchars_to_uchars (
mio_uch_t* dst,
const mio_bch_t* src,
mio_oow_t len
);
/**
 * The mio_copy_ucstr() function takes a writable #mio_uch_t buffer \a dst,
 * a size \a len and a read-only #mio_uch_t string \a src, and returns a
 * #mio_oow_t value.
 *
 * NOTE(review): presumably \a len is the capacity of \a dst, \a src is
 * null-terminated and the return value is the number of characters
 * copied - none of this is visible in this header; confirm against the
 * implementation.
 */
MIO_EXPORT mio_oow_t mio_copy_ucstr (
mio_uch_t* dst,
mio_oow_t len,
const mio_uch_t* src
);
/**
 * The mio_copy_bcstr() function is the #mio_bch_t counterpart of
 * mio_copy_ucstr(), with the same parameter layout and return type.
 */
MIO_EXPORT mio_oow_t mio_copy_bcstr (
mio_bch_t* dst,
mio_oow_t len,
const mio_bch_t* src
);
/**
 * Character search functions.
 *
 * mio_find_uchar()/mio_find_bchar() and mio_rfind_uchar()/mio_rfind_bchar()
 * take a read-only sequence \a ptr of the length \a len and a character
 * \a c to look for. mio_find_uchar_in_ucstr()/mio_find_bchar_in_bcstr()
 * take a string \a ptr without a length.
 *
 * Every function returns a pointer to a non-const character although the
 * input is const-qualified, so the const qualifier is dropped on the way
 * out; callers must not write through the result if the input was really
 * read-only.
 *
 * NOTE(review): presumably the "find" variants return the first match,
 * the "rfind" variants the last match, the "_in_?cstr" variants require a
 * null-terminated string, and #MIO_NULL is returned when \a c is absent -
 * none of this is visible in this header; confirm against the
 * implementation.
 */
MIO_EXPORT mio_uch_t* mio_find_uchar (
const mio_uch_t* ptr,
mio_oow_t len,
mio_uch_t c
);
MIO_EXPORT mio_bch_t* mio_find_bchar (
const mio_bch_t* ptr,
mio_oow_t len,
mio_bch_t c
);
MIO_EXPORT mio_uch_t* mio_rfind_uchar (
const mio_uch_t* ptr,
mio_oow_t len,
mio_uch_t c
);
MIO_EXPORT mio_bch_t* mio_rfind_bchar (
const mio_bch_t* ptr,
mio_oow_t len,
mio_bch_t c
);
MIO_EXPORT mio_uch_t* mio_find_uchar_in_ucstr (
const mio_uch_t* ptr,
mio_uch_t c
);
MIO_EXPORT mio_bch_t* mio_find_bchar_in_bcstr (
const mio_bch_t* ptr,
mio_bch_t c
);
/**
 * The mio_count_ucstr() function takes a read-only #mio_uch_t string and
 * returns a #mio_oow_t value.
 *
 * NOTE(review): presumably the number of characters preceding the
 * terminating null - confirm against the implementation.
 */
MIO_EXPORT mio_oow_t mio_count_ucstr (
const mio_uch_t* str
);
/**
 * The mio_count_bcstr() function is the #mio_bch_t counterpart of
 * mio_count_ucstr().
 */
MIO_EXPORT mio_oow_t mio_count_bcstr (
const mio_bch_t* str
);
/*
 * "oochar" aliases.
 *
 * Each mio_xxx_ooc...() macro forwards its arguments unchanged to the
 * mio_uch_t flavour of the function when MIO_OOCH_IS_UCH is defined and
 * to the mio_bch_t flavour otherwise. In the mio_bch_t configuration the
 * mixed-type aliases collapse onto the plain mio_bch_t functions
 * (e.g. mio_copy_bchars_to_oochars() becomes mio_copy_bchars()).
 */
#if defined(MIO_OOCH_IS_UCH)
#	define mio_equal_oochars(s1,s2,n)           mio_equal_uchars(s1,s2,n)
#	define mio_comp_oochars(s1,n1,s2,n2)        mio_comp_uchars(s1,n1,s2,n2)
#	define mio_comp_oocstr_bcstr(s1,s2)         mio_comp_ucstr_bcstr(s1,s2)
#	define mio_comp_oochars_bcstr(s1,n1,s2)     mio_comp_uchars_bcstr(s1,n1,s2)
#	define mio_comp_oochars_ucstr(s1,n1,s2)     mio_comp_uchars_ucstr(s1,n1,s2)
#	define mio_comp_oochars_oocstr(s1,n1,s2)    mio_comp_uchars_ucstr(s1,n1,s2)
#	define mio_comp_oocstr(s1,s2)               mio_comp_ucstr(s1,s2)

#	define mio_copy_oochars(to,from,n)           mio_copy_uchars(to,from,n)
#	define mio_copy_bchars_to_oochars(to,from,n) mio_copy_bchars_to_uchars(to,from,n)
#	define mio_copy_oocstr(to,n,from)            mio_copy_ucstr(to,n,from)

#	define mio_find_oochar(p,n,ch)              mio_find_uchar(p,n,ch)
#	define mio_rfind_oochar(p,n,ch)             mio_rfind_uchar(p,n,ch)
#	define mio_find_oochar_in_oocstr(p,ch)      mio_find_uchar_in_ucstr(p,ch)

#	define mio_count_oocstr(s)                  mio_count_ucstr(s)
#else
#	define mio_equal_oochars(s1,s2,n)           mio_equal_bchars(s1,s2,n)
#	define mio_comp_oochars(s1,n1,s2,n2)        mio_comp_bchars(s1,n1,s2,n2)
#	define mio_comp_oocstr_bcstr(s1,s2)         mio_comp_bcstr(s1,s2)
#	define mio_comp_oochars_bcstr(s1,n1,s2)     mio_comp_bchars_bcstr(s1,n1,s2)
#	define mio_comp_oochars_ucstr(s1,n1,s2)     mio_comp_bchars_ucstr(s1,n1,s2)
#	define mio_comp_oochars_oocstr(s1,n1,s2)    mio_comp_bchars_bcstr(s1,n1,s2)
#	define mio_comp_oocstr(s1,s2)               mio_comp_bcstr(s1,s2)

#	define mio_copy_oochars(to,from,n)           mio_copy_bchars(to,from,n)
#	define mio_copy_bchars_to_oochars(to,from,n) mio_copy_bchars(to,from,n)
#	define mio_copy_oocstr(to,n,from)            mio_copy_bcstr(to,n,from)

#	define mio_find_oochar(p,n,ch)              mio_find_bchar(p,n,ch)
#	define mio_rfind_oochar(p,n,ch)             mio_rfind_bchar(p,n,ch)
#	define mio_find_oochar_in_oocstr(p,ch)      mio_find_bchar_in_bcstr(p,ch)

#	define mio_count_oocstr(s)                  mio_count_bcstr(s)
#endif
/* ------------------------------------------------------------------------- */
/**
 * The mio_ucwidth() function takes a single #mio_uch_t character \a uc and
 * returns an int.
 *
 * NOTE(review): presumably the display width (column count) of the
 * character, similar to wcwidth() - not visible in this header; confirm
 * against the implementation, including the value returned for
 * non-printable characters.
 */
MIO_EXPORT int mio_ucwidth (
mio_uch_t uc
);
/* ------------------------------------------------------------------------- */
/*
 * "oocs" conversion aliases.
 *
 * When MIO_OOCH_IS_UCH is defined, conversion from the "ooc" string type
 * to mio_bch_t maps onto the ucs-to-bcs functions. Otherwise conversion
 * from the "ooc" string type to mio_uch_t maps onto the bcs-to-ucs
 * functions, passing 0 for their trailing 'all' argument.
 * Only one direction is defined per configuration.
 */
#if defined(MIO_OOCH_IS_UCH)
#	define mio_conv_oocs_to_bcs_with_cmgr(src,srclen,dst,dstlen,cm) \
		mio_conv_ucs_to_bcs_with_cmgr(src,srclen,dst,dstlen,cm)
#	define mio_conv_oochars_to_bchars_with_cmgr(src,srclen,dst,dstlen,cm) \
		mio_conv_uchars_to_bchars_with_cmgr(src,srclen,dst,dstlen,cm)
#else
#	define mio_conv_oocs_to_ucs_with_cmgr(src,srclen,dst,dstlen,cm) \
		mio_conv_bcs_to_ucs_with_cmgr(src,srclen,dst,dstlen,cm,0)
#	define mio_conv_oochars_to_uchars_with_cmgr(src,srclen,dst,dstlen,cm) \
		mio_conv_bchars_to_uchars_with_cmgr(src,srclen,dst,dstlen,cm,0)
#endif
/**
 * Conversion between #mio_bch_t and #mio_uch_t strings through a
 * caller-supplied character manager \a cmgr.
 *
 * All four functions take a read-only source string, a pointer to the
 * source length, a writable destination buffer, a pointer to the
 * destination length and the #mio_cmgr_t to use. Both lengths are passed
 * by pointer. The two bcs/bchars-to-ucs/uchars functions take an
 * additional int argument \a all.
 *
 * NOTE(review): presumably both length arguments are in/out values
 * (input: available length/capacity, output: amount consumed/produced),
 * the "bcs"/"ucs" variants work on null-terminated strings while the
 * "bchars"/"uchars" variants work on length-bounded sequences, and the
 * result is 0 on success and negative on failure - none of this, nor the
 * meaning of \a all, is visible in this header; confirm against the
 * implementation.
 */
MIO_EXPORT int mio_conv_bcs_to_ucs_with_cmgr (
const mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_cmgr_t* cmgr,
int all
);
MIO_EXPORT int mio_conv_bchars_to_uchars_with_cmgr (
const mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_cmgr_t* cmgr,
int all
);
MIO_EXPORT int mio_conv_ucs_to_bcs_with_cmgr (
const mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_cmgr_t* cmgr
);
MIO_EXPORT int mio_conv_uchars_to_bchars_with_cmgr (
const mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_cmgr_t* cmgr
);
/* ------------------------------------------------------------------------- */
/**
 * The mio_get_utf8_cmgr() function takes no argument and returns a pointer
 * to a #mio_cmgr_t.
 *
 * NOTE(review): presumably the returned character manager implements
 * UTF-8 conversion and is owned by the library (not to be freed by the
 * caller) - not visible in this header; confirm against the
 * implementation.
 */
MIO_EXPORT mio_cmgr_t* mio_get_utf8_cmgr (
void
);
/**
 * The mio_conv_uchars_to_utf8() function converts a unicode character string \a ucs
 * to a UTF8 string and writes it into the buffer pointed to by \a bcs, but
 * not more than \a bcslen bytes including the terminating null.
 *
 * Upon return, \a bcslen is modified to the actual number of bytes written to
 * \a bcs excluding the terminating null; \a ucslen is modified to the number of
 * wide characters converted.
 *
 * You may pass #MIO_NULL for \a bcs to dry-run conversion or to get the
 * required buffer size for conversion. -2 is never returned in this case.
 *
 * NOTE(review): this is the length-bounded ("uchars") variant; whether a
 * terminating null is really written and accounted for, as the text above
 * states, should be confirmed against the implementation.
 *
 * \return
 * - 0 on full conversion,
 * - -1 on no or partial conversion for an illegal character encountered,
 * - -2 on no or partial conversion for a small buffer.
 *
 * \code
 * const mio_uch_t ucs[] = { 'H', 'e', 'l', 'l', 'o' };
 * mio_bch_t bcs[10];
 * mio_oow_t ucslen = 5;
 * mio_oow_t bcslen = MIO_COUNTOF(bcs);
 * int n;
 * n = mio_conv_uchars_to_utf8 (ucs, &ucslen, bcs, &bcslen);
 * if (n <= -1)
 * {
 *     // conversion error
 * }
 * \endcode
 */
MIO_EXPORT int mio_conv_uchars_to_utf8 (
const mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_bch_t* bcs,
mio_oow_t* bcslen
);
/**
 * The mio_conv_utf8_to_uchars() function converts a UTF8 string to a unicode string.
 *
 * It never returns -2 if \a ucs is #MIO_NULL.
 *
 * \code
 * const mio_bch_t* bcs = "test string";
 * mio_uch_t ucs[100];
 * mio_oow_t ucslen = MIO_COUNTOF(ucs);
 * mio_oow_t bcslen = 11;
 * int n;
 * n = mio_conv_utf8_to_uchars (bcs, &bcslen, ucs, &ucslen);
 * if (n <= -1)
 * {
 *     // invalid/incomplete sequence or buffer too small
 * }
 * \endcode
 *
 * The resulting \a ucslen can still be greater than 0 even if the return
 * value is negative. The value indicates the number of characters converted
 * before the error has occurred.
 *
 * \return
 * - 0 on success,
 * - -1 if \a bcs contains an illegal character,
 * - -2 if the wide-character string buffer is too small,
 * - -3 if \a bcs is not a complete sequence.
 */
MIO_EXPORT int mio_conv_utf8_to_uchars (
const mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_uch_t* ucs,
mio_oow_t* ucslen
);
/**
 * The mio_conv_ucstr_to_utf8() function is declared with the same
 * parameter list as mio_conv_uchars_to_utf8(): a read-only #mio_uch_t
 * source \a ucs, a pointer to its length \a ucslen, a writable #mio_bch_t
 * destination \a bcs and a pointer to its length \a bcslen.
 *
 * NOTE(review): presumably \a ucs is a null-terminated string here and
 * the return codes match those of mio_conv_uchars_to_utf8() - not visible
 * in this header; confirm against the implementation.
 */
MIO_EXPORT int mio_conv_ucstr_to_utf8 (
const mio_uch_t* ucs,
mio_oow_t* ucslen,
mio_bch_t* bcs,
mio_oow_t* bcslen
);
/**
 * The mio_conv_utf8_to_ucstr() function is declared with the same
 * parameter list as mio_conv_utf8_to_uchars(): a read-only #mio_bch_t
 * source \a bcs, a pointer to its length \a bcslen, a writable #mio_uch_t
 * destination \a ucs and a pointer to its length \a ucslen.
 *
 * NOTE(review): presumably \a bcs is a null-terminated string here and
 * the return codes match those of mio_conv_utf8_to_uchars() - not visible
 * in this header; confirm against the implementation.
 */
MIO_EXPORT int mio_conv_utf8_to_ucstr (
const mio_bch_t* bcs,
mio_oow_t* bcslen,
mio_uch_t* ucs,
mio_oow_t* ucslen
);
/**
 * The mio_uc_to_utf8() function takes a single #mio_uch_t character \a uc,
 * a writable #mio_bch_t buffer \a utf8 and a #mio_oow_t \a size, and
 * returns a #mio_oow_t value.
 *
 * NOTE(review): presumably \a size is the capacity of \a utf8 and the
 * return value is the number of bytes the encoded character occupies,
 * with special values for an unencodable character or a too-small buffer -
 * not visible in this header; confirm against the implementation.
 */
MIO_EXPORT mio_oow_t mio_uc_to_utf8 (
mio_uch_t uc,
mio_bch_t* utf8,
mio_oow_t size
);
/**
 * The mio_utf8_to_uc() function takes a read-only #mio_bch_t sequence
 * \a utf8, its #mio_oow_t \a size and a writable #mio_uch_t location
 * \a uc, and returns a #mio_oow_t value.
 *
 * NOTE(review): presumably one character is decoded into \a uc and the
 * return value is the number of bytes consumed, with special values for
 * an illegal or incomplete sequence - not visible in this header; confirm
 * against the implementation.
 */
MIO_EXPORT mio_oow_t mio_utf8_to_uc (
const mio_bch_t* utf8,
mio_oow_t size,
mio_uch_t* uc
);
/* ------------------------------------------------------------------------- */
/**
 * Function counterparts of the MIO_CONST_NTOHxx()/MIO_CONST_HTONxx()
 * macros for 16-, 32-, 64- and 128-bit unsigned integers. Each function
 * takes a value of the given width and returns a value of the same type.
 *
 * Each pair is declared only when the matching MIO_HAVE_UINT16_T,
 * MIO_HAVE_UINT32_T, MIO_HAVE_UINT64_T or MIO_HAVE_UINT128_T macro is
 * defined, so the 64- and 128-bit variants in particular may be
 * unavailable in a given build.
 *
 * NOTE(review): presumably mio_ntohNN() converts from network byte order
 * to host byte order and mio_htonNN() the other way around - the
 * conversion itself is not visible in this header; confirm against the
 * implementation.
 */
#if defined(MIO_HAVE_UINT16_T)
MIO_EXPORT mio_uint16_t mio_ntoh16 (
mio_uint16_t x
);
MIO_EXPORT mio_uint16_t mio_hton16 (
mio_uint16_t x
);
#endif
#if defined(MIO_HAVE_UINT32_T)
MIO_EXPORT mio_uint32_t mio_ntoh32 (
mio_uint32_t x
);
MIO_EXPORT mio_uint32_t mio_hton32 (
mio_uint32_t x
);
#endif
#if defined(MIO_HAVE_UINT64_T)
MIO_EXPORT mio_uint64_t mio_ntoh64 (
mio_uint64_t x
);
MIO_EXPORT mio_uint64_t mio_hton64 (
mio_uint64_t x
);
#endif
#if defined(MIO_HAVE_UINT128_T)
MIO_EXPORT mio_uint128_t mio_ntoh128 (
mio_uint128_t x
);
MIO_EXPORT mio_uint128_t mio_hton128 (
mio_uint128_t x
);
#endif
#ifdef __cplusplus
}
#endif
#endif