2020-03-03 13:47:51 +00:00
/*
Copyright ( c ) 2016 - 2020 Chung , Hyung - Hwan . All rights reserved .
Redistribution and use in source and binary forms , with or without
modification , are permitted provided that the following conditions
are met :
1. Redistributions of source code must retain the above copyright
notice , this list of conditions and the following disclaimer .
2. Redistributions in binary form must reproduce the above copyright
notice , this list of conditions and the following disclaimer in the
documentation and / or other materials provided with the distribution .
THIS SOFTWARE IS PROVIDED BY THE AUTHOR " AS IS " AND ANY EXPRESS OR
IMPLIED WARRANTIES , INCLUDING , BUT NOT LIMITED TO , THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED .
IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT , INDIRECT ,
INCIDENTAL , SPECIAL , EXEMPLARY , OR CONSEQUENTIAL DAMAGES ( INCLUDING , BUT
NOT LIMITED TO , PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES ; LOSS OF USE ,
DATA , OR PROFITS ; OR BUSINESS INTERRUPTION ) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY , WHETHER IN CONTRACT , STRICT LIABILITY , OR TORT
( INCLUDING NEGLIGENCE OR OTHERWISE ) ARISING IN ANY WAY OUT OF THE USE OF
THIS SOFTWARE , EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE .
*/
2020-05-01 18:01:29 +00:00
# include "mio-htrd.h"
# include "mio-chr.h"
2020-05-04 08:40:05 +00:00
# include "mio-path.h"
2020-05-01 18:01:29 +00:00
# include "mio-prv.h"
2020-03-03 13:47:51 +00:00
static const mio_bch_t NUL = ' \0 ' ;
/* for htrd->fed.s.flags */
# define CONSUME_UNTIL_CLOSE (1 << 0)
/* for htrd->flags */
# define FEEDING_SUSPENDED (1 << 0)
# define FEEDING_DUMMIFIED (1 << 1)
static MIO_INLINE int is_whspace_octet ( mio_bch_t c )
{
return c = = ' ' | | c = = ' \t ' | | c = = ' \r ' | | c = = ' \n ' ;
}
static MIO_INLINE int is_space_octet ( mio_bch_t c )
{
return c = = ' ' | | c = = ' \t ' | | c = = ' \r ' ;
}
static MIO_INLINE int is_purespace_octet ( mio_bch_t c )
{
return c = = ' ' | | c = = ' \t ' ;
}
static MIO_INLINE int is_upalpha_octet ( mio_bch_t c )
{
return c > = ' A ' & & c < = ' Z ' ;
}
static MIO_INLINE int is_loalpha_octet ( mio_bch_t c )
{
return c > = ' a ' & & c < = ' z ' ;
}
static MIO_INLINE int is_alpha_octet ( mio_bch_t c )
{
return ( c > = ' A ' & & c < = ' Z ' ) | | ( c > = ' a ' & & c < = ' z ' ) ;
}
static MIO_INLINE int is_digit_octet ( mio_bch_t c )
{
return c > = ' 0 ' & & c < = ' 9 ' ;
}
static MIO_INLINE int is_xdigit_octet ( mio_bch_t c )
{
return ( c > = ' 0 ' & & c < = ' 9 ' ) | | ( c > = ' A ' & & c < = ' F ' ) | | ( c > = ' a ' & & c < = ' f ' ) ;
}
static MIO_INLINE int digit_to_num ( mio_bch_t c )
{
2020-05-01 18:01:29 +00:00
return MIO_DIGIT_TO_NUM ( c ) ;
2020-03-03 13:47:51 +00:00
}
static MIO_INLINE int xdigit_to_num ( mio_bch_t c )
{
2020-05-01 18:01:29 +00:00
return MIO_XDIGIT_TO_NUM ( c ) ;
2020-03-03 13:47:51 +00:00
}
2020-05-01 18:56:33 +00:00
static MIO_INLINE int push_to_buffer ( mio_htrd_t * htrd , mio_becs_t * octb , const mio_bch_t * ptr , mio_oow_t len )
2020-03-03 13:47:51 +00:00
{
2020-05-01 18:56:33 +00:00
if ( mio_becs_ncat ( octb , ptr , len ) = = ( mio_oow_t ) - 1 )
2020-03-03 13:47:51 +00:00
{
htrd - > errnum = MIO_HTRD_ENOMEM ;
return - 1 ;
}
return 0 ;
}
2020-04-30 16:20:31 +00:00
static MIO_INLINE int push_content ( mio_htrd_t * htrd , const mio_bch_t * ptr , mio_oow_t len )
2020-03-03 13:47:51 +00:00
{
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , len > 0 ) ;
2020-03-03 13:47:51 +00:00
if ( mio_htre_addcontent ( & htrd - > re , ptr , len ) < = - 1 )
{
htrd - > errnum = MIO_HTRD_ENOMEM ;
return - 1 ;
}
/* mio_htre_addcontent() returns 1 on full success and 0 if adding is
* skipped . i treat both as success */
return 0 ;
}
static MIO_INLINE void clear_feed ( mio_htrd_t * htrd )
{
/* clear necessary part of the request/response before
* reading the next request / response */
htrd - > clean = 1 ;
mio_htre_clear ( & htrd - > re ) ;
2020-05-01 18:01:29 +00:00
mio_becs_clear ( & htrd - > fed . b . tra ) ;
mio_becs_clear ( & htrd - > fed . b . raw ) ;
2020-03-03 13:47:51 +00:00
MIO_MEMSET ( & htrd - > fed . s , 0 , MIO_SIZEOF ( htrd - > fed . s ) ) ;
}
2020-05-01 14:00:27 +00:00
mio_htrd_t * mio_htrd_open ( mio_t * mio , mio_oow_t xtnsize )
2020-03-03 13:47:51 +00:00
{
mio_htrd_t * htrd ;
2020-05-01 14:00:27 +00:00
htrd = ( mio_htrd_t * ) mio_allocmem ( mio , MIO_SIZEOF ( mio_htrd_t ) + xtnsize ) ;
2020-05-01 18:56:33 +00:00
if ( MIO_LIKELY ( htrd ) )
2020-03-03 13:47:51 +00:00
{
2020-05-01 18:56:33 +00:00
if ( MIO_UNLIKELY ( mio_htrd_init ( htrd , mio ) < = - 1 ) )
2020-03-03 13:47:51 +00:00
{
2020-05-01 14:00:27 +00:00
mio_freemem ( mio , htrd ) ;
2020-03-03 13:47:51 +00:00
return MIO_NULL ;
}
2020-05-01 18:01:29 +00:00
else MIO_MEMSET ( htrd + 1 , 0 , xtnsize ) ;
2020-03-03 13:47:51 +00:00
}
return htrd ;
}
void mio_htrd_close ( mio_htrd_t * htrd )
{
mio_htrd_fini ( htrd ) ;
2020-05-01 14:00:27 +00:00
mio_freemem ( htrd - > mio , htrd ) ;
2020-03-03 13:47:51 +00:00
}
2020-05-01 14:00:27 +00:00
int mio_htrd_init ( mio_htrd_t * htrd , mio_t * mio )
2020-03-03 13:47:51 +00:00
{
MIO_MEMSET ( htrd , 0 , MIO_SIZEOF ( * htrd ) ) ;
2020-05-01 14:00:27 +00:00
htrd - > mio = mio ;
2020-03-03 13:47:51 +00:00
htrd - > option = MIO_HTRD_REQUEST | MIO_HTRD_RESPONSE ;
#if 0
2020-05-01 14:00:27 +00:00
mio_becs_init ( & htrd - > tmp . qparam , htrd - > mio , 0 ) ;
2020-03-03 13:47:51 +00:00
# endif
2020-05-01 14:00:27 +00:00
mio_becs_init ( & htrd - > fed . b . raw , htrd - > mio , 0 ) ;
mio_becs_init ( & htrd - > fed . b . tra , htrd - > mio , 0 ) ;
2020-03-03 13:47:51 +00:00
2020-05-01 14:00:27 +00:00
if ( mio_htre_init ( & htrd - > re , mio ) < = - 1 )
2020-03-03 13:47:51 +00:00
{
2020-05-01 14:00:27 +00:00
mio_becs_fini ( & htrd - > fed . b . tra ) ;
mio_becs_fini ( & htrd - > fed . b . raw ) ;
2020-03-03 13:47:51 +00:00
#if 0
2020-05-01 14:00:27 +00:00
mio_becs_fini ( & htrd - > tmp . qparam ) ;
2020-03-03 13:47:51 +00:00
# endif
return - 1 ;
}
htrd - > clean = 1 ;
return 0 ;
}
void mio_htrd_fini ( mio_htrd_t * htrd )
{
mio_htre_fini ( & htrd - > re ) ;
2020-05-01 18:01:29 +00:00
mio_becs_fini ( & htrd - > fed . b . tra ) ;
mio_becs_fini ( & htrd - > fed . b . raw ) ;
2020-03-03 13:47:51 +00:00
#if 0
2020-05-01 18:01:29 +00:00
mio_becs_fini ( & htrd - > tmp . qparam ) ;
2020-03-03 13:47:51 +00:00
# endif
}
static mio_bch_t * parse_initial_line ( mio_htrd_t * htrd , mio_bch_t * line )
{
mio_bch_t * p = line ;
2020-05-01 18:01:29 +00:00
mio_bcs_t tmp ;
2020-03-03 13:47:51 +00:00
#if 0
/* ignore leading spaces excluding crlf */
while ( is_space_octet ( * p ) ) p + + ;
# endif
/* the method should start with an alphabet */
if ( ! is_alpha_octet ( * p ) ) goto badre ;
/* get the method name */
tmp . ptr = p ;
do { p + + ; } while ( is_alpha_octet ( * p ) ) ;
tmp . len = p - tmp . ptr ;
htrd - > re . type = MIO_HTRE_Q ;
if ( htrd - > option & MIO_HTRD_REQUEST )
{
/* method name must be followed by space */
if ( ! is_space_octet ( * p ) ) goto badre ;
* p = ' \0 ' ; /* null-terminate the method name */
2020-05-01 18:01:29 +00:00
htrd - > re . u . q . method . type = mio_bchars_to_http_method ( tmp . ptr , tmp . len ) ;
2020-03-03 13:47:51 +00:00
htrd - > re . u . q . method . name = tmp . ptr ;
}
2020-05-01 18:01:29 +00:00
else if ( ( htrd - > option & MIO_HTRD_RESPONSE ) & & mio_comp_bchars_bcstr ( tmp . ptr , tmp . len , " HTTP " , 1 ) = = 0 )
2020-03-03 13:47:51 +00:00
{
/* it begins with HTTP. it may be a response */
htrd - > re . type = MIO_HTRE_S ;
}
else goto badre ;
if ( htrd - > re . type = = MIO_HTRE_S )
{
/* response */
int n , status ;
if ( * p = = ' / ' & & p [ 1 ] ! = ' \0 ' & & p [ 2 ] = = ' . ' )
{
int q = digit_to_num ( p [ 1 ] ) ;
int w = digit_to_num ( p [ 3 ] ) ;
if ( q > = 0 & & w > = 0 )
{
htrd - > re . version . major = q ;
htrd - > re . version . minor = w ;
p + = 4 ;
}
else goto badre ;
}
else goto badre ;
/* version must be followed by space */
if ( ! is_space_octet ( * p ) ) goto badre ;
* p = ' \0 ' ; /* null-terminate version string */
htrd - > re . verstr = tmp . ptr ;
/* skip spaces */
do p + + ; while ( is_space_octet ( * p ) ) ;
n = digit_to_num ( * p ) ;
if ( n < = - 1 ) goto badre ;
tmp . ptr = p ;
status = 0 ;
do
{
status = status * 10 + n ;
p + + ;
}
while ( ( n = digit_to_num ( * p ) ) > = 0 ) ;
if ( ! is_space_octet ( * p ) ) goto badre ;
* p = ' \0 ' ; /* null-terminate the status code */
htrd - > re . u . s . code . val = status ;
htrd - > re . u . s . code . str = tmp . ptr ;
/* i don't treat the following weird messages as bad message:
* no status message follows the status code
*/
/* skip spaces */
do p + + ; while ( is_space_octet ( * p ) ) ;
tmp . ptr = p ;
tmp . len = 0 ;
while ( * p ! = ' \0 ' & & * p ! = ' \n ' )
{
if ( ! is_space_octet ( * p ) ) tmp . len = p - tmp . ptr + 1 ;
p + + ;
}
/* if the line does not end with a new line, it is a bad request */
if ( * p ! = ' \n ' ) goto badre ;
/* null-terminate the message */
( ( mio_bch_t * ) tmp . ptr ) [ tmp . len ] = ' \0 ' ;
htrd - > re . u . s . mesg = tmp . ptr ;
}
else
{
#if 0
mio_bch_t * out ;
# endif
2020-05-01 18:01:29 +00:00
mio_bcs_t param ;
2020-03-03 13:47:51 +00:00
/* skip spaces */
do p + + ; while ( is_space_octet ( * p ) ) ;
/* process the url part */
tmp . ptr = p ; /* remember the beginning of path*/
param . ptr = MIO_NULL ;
#if 0
out = p ;
while ( * p ! = ' \0 ' & & ! is_space_octet ( * p ) )
{
if ( * p = = ' % ' & & param . ptr = = MIO_NULL )
{
/* decode percent-encoded charaters in the
* path part . if we ' re in the parameter string
* part , we don ' t decode them . */
int q = xdigit_to_num ( * ( p + 1 ) ) ;
int w = xdigit_to_num ( * ( p + 2 ) ) ;
if ( q > = 0 & & w > = 0 )
{
int t = ( q < < 4 ) + w ;
if ( t = = 0 )
{
/* percent enconding contains a null character */
goto badre ;
}
* out + + = t ;
p + = 3 ;
htrd - > re . flags | = MIO_HTRE_QPATH_PERDEC ;
}
else * out + + = * p + + ;
}
else if ( * p = = ' ? ' )
{
if ( param . ptr = = MIO_NULL )
{
/* ? must be explicit to be an argument instroducer.
* % 3f is just a literal . */
tmp . len = out - tmp . ptr ;
* out + + = ' \0 ' ; /* null-terminate the path part */
param . ptr = out ;
p + + ;
}
else * out + + = * p + + ;
}
else * out + + = * p + + ;
}
/* the url must be followed by a space */
if ( ! is_space_octet ( * p ) ) goto badre ;
/* null-terminate the url part though we know the length */
* out = ' \0 ' ;
if ( htrd - > re . flags & MIO_HTRE_QPATH_PERDEC )
{
/* TODO: build the original qpath */
htrd - > re . orgpqath . ptr = XXX ;
htrd - > re . orgpath . len = XXXX ;
}
if ( param . ptr )
{
param . len = out - param . ptr ;
htrd - > re . u . q . path = tmp ;
htrd - > re . u . q . param = param ;
}
else
{
tmp . len = out - tmp . ptr ;
htrd - > re . u . q . path = tmp ;
htrd - > re . u . q . param . ptr = MIO_NULL ;
htrd - > re . u . q . param . len = 0 ;
}
# else
while ( * p ! = ' \0 ' & & ! is_space_octet ( * p ) )
{
if ( * p = = ' ? ' & & param . ptr = = MIO_NULL )
{
tmp . len = p - tmp . ptr ; /* length of the path part */
* p + + = ' \0 ' ; /* null-terminate the path part */
param . ptr = p ;
}
else p + + ;
}
/* the url must be followed by a space */
if ( ! is_space_octet ( * p ) ) goto badre ;
param . len = p - param . ptr ; /* length of the param part */
* p = ' \0 ' ; /* null-terminate the path or param part */
if ( param . ptr )
{
htrd - > re . u . q . path = tmp ;
htrd - > re . u . q . param = param ;
}
else
{
htrd - > re . u . q . path = tmp ;
htrd - > re . u . q . param . ptr = MIO_NULL ;
htrd - > re . u . q . param . len = 0 ;
}
# endif
if ( htrd - > option & MIO_HTRD_CANONQPATH )
{
mio_bch_t * qpath = htrd - > re . u . q . path . ptr ;
/* if the url begins with xxx://,
* skip xxx : / and canonicalize from the second slash */
while ( is_alpha_octet ( * qpath ) ) qpath + + ;
2020-05-01 18:01:29 +00:00
if ( mio_comp_bcstr_limited ( qpath , " :// " , 3 , 1 ) = = 0 )
2020-03-03 13:47:51 +00:00
{
qpath = qpath + 2 ; /* set the position to the second / in :// */
2020-05-01 18:01:29 +00:00
htrd - > re . u . q . path . len = mio_canon_bcstr_path ( qpath , qpath , 0 ) ;
2020-03-03 13:47:51 +00:00
htrd - > re . u . q . path . len + = qpath - htrd - > re . u . q . path . ptr ;
}
else
{
qpath = htrd - > re . u . q . path . ptr ;
2020-05-01 18:01:29 +00:00
htrd - > re . u . q . path . len = mio_canon_bcstr_path ( qpath , qpath , 0 ) ;
2020-03-03 13:47:51 +00:00
}
}
/* skip spaces after the url part */
do { p + + ; } while ( is_space_octet ( * p ) ) ;
tmp . ptr = p ;
/* check protocol version */
if ( ( p [ 0 ] = = ' H ' | | p [ 0 ] = = ' h ' ) & &
( p [ 1 ] = = ' T ' | | p [ 1 ] = = ' t ' ) & &
( p [ 2 ] = = ' T ' | | p [ 2 ] = = ' t ' ) & &
( p [ 3 ] = = ' P ' | | p [ 3 ] = = ' p ' ) & &
p [ 4 ] = = ' / ' & & p [ 6 ] = = ' . ' )
{
int q = digit_to_num ( p [ 5 ] ) ;
int w = digit_to_num ( p [ 7 ] ) ;
if ( q > = 0 & & w > = 0 )
{
htrd - > re . version . major = q ;
htrd - > re . version . minor = w ;
p + = 8 ;
}
else goto badre ;
}
else goto badre ;
tmp . len = p - tmp . ptr ;
/* skip trailing spaces on the line */
while ( is_space_octet ( * p ) ) p + + ;
/* if the line does not end with a new line, it is a bad request */
if ( * p ! = ' \n ' ) goto badre ;
( ( mio_bch_t * ) tmp . ptr ) [ tmp . len ] = ' \0 ' ;
htrd - > re . verstr = tmp . ptr ;
}
/* adjust Connection: Keep-Alive for HTTP 1.1 or later.
* this is initial . it can be adjusted further in capture_connection ( ) . */
if ( htrd - > re . version . major > 1 | |
( htrd - > re . version . major = = 1 & & htrd - > re . version . minor > = 1 ) )
{
htrd - > re . flags | = MIO_HTRE_ATTR_KEEPALIVE ;
}
return + + p ;
badre :
htrd - > errnum = MIO_HTRD_EBADRE ;
return MIO_NULL ;
}
void mio_htrd_clear ( mio_htrd_t * htrd )
{
clear_feed ( htrd ) ;
htrd - > flags = 0 ;
}
mio_htrd_errnum_t mio_htrd_geterrnum ( mio_htrd_t * htrd )
{
return htrd - > errnum ;
}
int mio_htrd_getopt ( mio_htrd_t * htrd )
{
return htrd - > option ;
}
void mio_htrd_setopt ( mio_htrd_t * htrd , int opts )
{
htrd - > option = opts ;
}
const mio_htrd_recbs_t * mio_htrd_getrecbs ( mio_htrd_t * htrd )
{
return htrd - > recbs ;
}
void mio_htrd_setrecbs ( mio_htrd_t * htrd , const mio_htrd_recbs_t * recbs )
{
htrd - > recbs = recbs ;
}
static int capture_connection ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
mio_htre_hdrval_t * val ;
val = MIO_HTB_VPTR ( pair ) ;
while ( val - > next ) val = val - > next ;
/* The value for Connection: may get comma-separated.
2020-05-01 18:01:29 +00:00
* so use mio_find_bcstr_word_in_bcstr ( ) instead of mio_comp_bcstr ( ) . */
2020-03-03 13:47:51 +00:00
2020-05-01 18:01:29 +00:00
if ( mio_find_bcstr_word_in_bcstr ( val - > ptr , " close " , ' , ' , 1 ) )
2020-03-03 13:47:51 +00:00
{
htrd - > re . flags & = ~ MIO_HTRE_ATTR_KEEPALIVE ;
return 0 ;
}
2020-05-01 18:01:29 +00:00
if ( mio_find_bcstr_word_in_bcstr ( val - > ptr , " keep-alive " , ' , ' , 1 ) )
2020-03-03 13:47:51 +00:00
{
htrd - > re . flags | = MIO_HTRE_ATTR_KEEPALIVE ;
return 0 ;
}
/* Basically i don't care about other values.
* but for HTTP 1.0 , other values will set connection to ' close ' .
*
* Other values include even Keep - Alive specified multiple times .
* Connection : Keep - Alive
* Connection : Keep - Alive
* For the second Keep - Alive , this function sees ' Keep - Alive , Keep - Alive '
* That ' s because values of the same keys are concatenated .
*/
2020-05-01 18:01:29 +00:00
if ( htrd - > re . version . major < 1 | | ( htrd - > re . version . major = = 1 & & htrd - > re . version . minor < = 0 ) )
2020-03-03 13:47:51 +00:00
{
htrd - > re . flags & = ~ MIO_HTRE_ATTR_KEEPALIVE ;
}
return 0 ;
}
static int capture_content_length ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
2020-04-30 16:20:31 +00:00
mio_oow_t len = 0 , off = 0 , tmp ;
2020-03-03 13:47:51 +00:00
const mio_bch_t * ptr ;
mio_htre_hdrval_t * val ;
/* get the last content_length */
val = MIO_HTB_VPTR ( pair ) ;
while ( val - > next ) val = val - > next ;
ptr = val - > ptr ;
while ( off < val - > len )
{
int num = digit_to_num ( ptr [ off ] ) ;
if ( num < = - 1 )
{
/* the length contains a non-digit */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
tmp = len * 10 + num ;
if ( tmp < len )
{
/* the length has overflown */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
len = tmp ;
off + + ;
}
if ( off = = 0 )
{
/* no length was provided */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
if ( ( htrd - > re . flags & MIO_HTRE_ATTR_CHUNKED ) & & len > 0 )
{
/* content-length is greater than 0
* while transfer - encoding : chunked is specified . */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
htrd - > re . flags | = MIO_HTRE_ATTR_LENGTH ;
htrd - > re . attr . content_length = len ;
return 0 ;
}
static int capture_expect ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
mio_htre_hdrval_t * val ;
/* Expect is included */
htrd - > re . flags | = MIO_HTRE_ATTR_EXPECT ;
val = MIO_HTB_VPTR ( pair ) ;
while ( val )
{
/* Expect: 100-continue is included */
2020-05-01 18:01:29 +00:00
if ( mio_comp_bcstr ( val - > ptr , " 100-continue " , 1 ) = = 0 ) htrd - > re . flags | = MIO_HTRE_ATTR_EXPECT100 ;
2020-03-03 13:47:51 +00:00
val = val - > next ;
}
return 0 ;
}
static int capture_status ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
mio_htre_hdrval_t * val ;
val = MIO_HTB_VPTR ( pair ) ;
while ( val - > next ) val = val - > next ;
htrd - > re . attr . status = val - > ptr ;
return 0 ;
}
static int capture_transfer_encoding ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
int n ;
mio_htre_hdrval_t * val ;
val = MIO_HTB_VPTR ( pair ) ;
while ( val - > next ) val = val - > next ;
2020-05-01 18:01:29 +00:00
n = mio_comp_bcstr ( val - > ptr , " chunked " , 1 ) ;
2020-03-03 13:47:51 +00:00
if ( n = = 0 )
{
/* if (htrd->re.attr.content_length > 0) */
if ( htrd - > re . flags & MIO_HTRE_ATTR_LENGTH )
{
/* both content-length and 'transfer-encoding: chunked' are specified. */
goto badre ;
}
htrd - > re . flags | = MIO_HTRE_ATTR_CHUNKED ;
return 0 ;
}
/* other encoding type not supported yet */
badre :
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
static MIO_INLINE int capture_key_header ( mio_htrd_t * htrd , mio_htb_pair_t * pair )
{
static struct
{
const mio_bch_t * ptr ;
2020-04-30 16:20:31 +00:00
mio_oow_t len ;
2020-03-03 13:47:51 +00:00
int ( * handler ) ( mio_htrd_t * , mio_htb_pair_t * ) ;
} hdrtab [ ] =
{
{ " Connection " , 10 , capture_connection } ,
{ " Content-Length " , 14 , capture_content_length } ,
{ " Expect " , 6 , capture_expect } ,
{ " Status " , 6 , capture_status } ,
{ " Transfer-Encoding " , 17 , capture_transfer_encoding }
} ;
int n ;
2020-04-30 16:20:31 +00:00
mio_oow_t mid , count , base = 0 ;
2020-03-03 13:47:51 +00:00
/* perform binary search */
for ( count = MIO_COUNTOF ( hdrtab ) ; count > 0 ; count / = 2 )
{
mid = base + count / 2 ;
2020-05-01 18:01:29 +00:00
n = mio_comp_bchars ( MIO_HTB_KPTR ( pair ) , MIO_HTB_KLEN ( pair ) , hdrtab [ mid ] . ptr , hdrtab [ mid ] . len , 1 ) ;
2020-03-03 13:47:51 +00:00
if ( n = = 0 )
{
/* bingo! */
2020-05-01 18:01:29 +00:00
return hdrtab [ mid ] . handler ( htrd , pair ) ;
2020-03-03 13:47:51 +00:00
}
if ( n > 0 ) { base = mid + 1 ; count - - ; }
}
/* No callback functions were interested in this header field. */
return 0 ;
}
struct hdr_cbserter_ctx_t
{
mio_htrd_t * htrd ;
void * vptr ;
2020-04-30 16:20:31 +00:00
mio_oow_t vlen ;
2020-03-03 13:47:51 +00:00
} ;
static mio_htb_pair_t * hdr_cbserter (
mio_htb_t * htb , mio_htb_pair_t * pair ,
2020-04-30 16:20:31 +00:00
void * kptr , mio_oow_t klen , void * ctx )
2020-03-03 13:47:51 +00:00
{
struct hdr_cbserter_ctx_t * tx = ( struct hdr_cbserter_ctx_t * ) ctx ;
if ( pair = = MIO_NULL )
{
/* the key is new. let's create a new pair. */
mio_htb_pair_t * p ;
mio_htre_hdrval_t * val ;
2020-05-01 14:00:27 +00:00
val = mio_allocmem ( htb - > mio , MIO_SIZEOF ( * val ) ) ;
2020-05-01 18:01:29 +00:00
if ( MIO_UNLIKELY ( ! val ) )
2020-03-03 13:47:51 +00:00
{
tx - > htrd - > errnum = MIO_HTRD_ENOMEM ;
return MIO_NULL ;
}
MIO_MEMSET ( val , 0 , MIO_SIZEOF ( * val ) ) ;
val - > ptr = tx - > vptr ;
val - > len = tx - > vlen ;
val - > next = MIO_NULL ;
2020-05-01 18:56:33 +00:00
p = mio_htb_allocpair ( htb , kptr , klen , val , 0 ) ;
if ( MIO_UNLIKELY ( ! p ) )
2020-03-03 13:47:51 +00:00
{
2020-05-01 14:00:27 +00:00
mio_freemem ( htb - > mio , val ) ;
2020-03-03 13:47:51 +00:00
tx - > htrd - > errnum = MIO_HTRD_ENOMEM ;
}
else
{
2020-05-15 06:18:49 +00:00
if ( capture_key_header ( tx - > htrd , p ) < = - 1 )
2020-03-03 13:47:51 +00:00
{
/* Destroy the pair created here
* as it is not added to the hash table yet */
mio_htb_freepair ( htb , p ) ;
p = MIO_NULL ;
}
}
return p ;
}
else
{
/* RFC2616
* Multiple message - header fields with the same field - name
* MAY be present in a message if and only if the entire
* field - value for that header field is defined as a
* comma - separated list [ i . e . , # ( values ) ] . It MUST be possible
* to combine the multiple header fields into one
* " field-name: field-value " pair , without changing the semantics
* of the message , by appending each subsequent field - value
* to the first , each separated by a comma . The order in which
* header fields with the same field - name are received is therefore
* significant to the interpretation of the combined field value ,
* and thus a proxy MUST NOT change the order of these field values
* when a message is forwarded .
* RFC6265 defines the syntax for Set - Cookie and Cookie .
* this seems to be conflicting with RFC2616 .
*
* Origin servers SHOULD NOT fold multiple Set - Cookie header fields
* into a single header field . The usual mechanism for folding HTTP
* headers fields ( i . e . , as defined in [ RFC2616 ] ) might change the
* semantics of the Set - Cookie header field because the % x2C ( " , " )
* character is used by Set - Cookie in a way that conflicts with
* such folding .
*
* So i just maintain the list of values for a key instead of
* folding them .
*/
mio_htre_hdrval_t * val ;
mio_htre_hdrval_t * tmp ;
2020-05-01 14:00:27 +00:00
val = ( mio_htre_hdrval_t * ) mio_allocmem ( tx - > htrd - > mio , MIO_SIZEOF ( * val ) ) ;
2020-05-01 18:01:29 +00:00
if ( MIO_UNLIKELY ( ! val ) )
2020-03-03 13:47:51 +00:00
{
tx - > htrd - > errnum = MIO_HTRD_ENOMEM ;
return MIO_NULL ;
}
MIO_MEMSET ( val , 0 , MIO_SIZEOF ( * val ) ) ;
val - > ptr = tx - > vptr ;
val - > len = tx - > vlen ;
val - > next = MIO_NULL ;
/* TODO: doubly linked list for speed-up??? */
tmp = MIO_HTB_VPTR ( pair ) ;
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( tx - > htrd - > mio , tmp ! = MIO_NULL ) ;
2020-03-03 13:47:51 +00:00
/* find the tail */
while ( tmp - > next ) tmp = tmp - > next ;
/* append it to the list*/
tmp - > next = val ;
2020-05-15 06:18:49 +00:00
if ( capture_key_header ( tx - > htrd , pair ) < = - 1 ) return MIO_NULL ;
2020-03-03 13:47:51 +00:00
return pair ;
}
}
mio_bch_t * parse_header_field ( mio_htrd_t * htrd , mio_bch_t * line , mio_htb_t * tab )
{
mio_bch_t * p = line , * last ;
struct
{
mio_bch_t * ptr ;
2020-04-30 16:20:31 +00:00
mio_oow_t len ;
2020-03-03 13:47:51 +00:00
} name , value ;
#if 0
/* ignore leading spaces excluding crlf */
while ( is_space_octet ( * p ) ) p + + ;
# endif
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , ! is_whspace_octet ( * p ) ) ;
2020-03-03 13:47:51 +00:00
/* check the field name */
name . ptr = last = p ;
while ( * p ! = ' \0 ' & & * p ! = ' \n ' & & * p ! = ' : ' )
{
if ( ! is_space_octet ( * p + + ) ) last = p ;
}
name . len = last - name . ptr ;
if ( * p ! = ' : ' )
{
if ( ! ( htrd - > option & MIO_HTRD_STRICT ) )
{
while ( is_space_octet ( * p ) ) p + + ;
if ( * p = = ' \n ' )
{
/* ignore a line without a colon */
p + + ;
return p ;
}
}
goto badhdr ;
}
* last = ' \0 ' ;
/* skip the colon and spaces after it */
do { p + + ; } while ( is_space_octet ( * p ) ) ;
value . ptr = last = p ;
while ( * p ! = ' \0 ' & & * p ! = ' \n ' )
{
if ( ! is_space_octet ( * p + + ) ) last = p ;
}
value . len = last - value . ptr ;
if ( * p ! = ' \n ' ) goto badhdr ; /* not ending with a new line */
/* peep at the beginning of the next line to check if it is
* the continuation */
if ( is_purespace_octet ( * + + p ) )
{
/* RFC: HTTP/1.0 headers may be folded onto multiple lines if
* each continuation line begins with a space or horizontal tab .
* All linear whitespace , including folding , has the same semantics
* as SP . */
mio_bch_t * cpydst ;
cpydst = p - 1 ;
if ( * ( cpydst - 1 ) = = ' \r ' ) cpydst - - ;
/* process all continued lines */
do
{
while ( * p ! = ' \0 ' & & * p ! = ' \n ' )
{
* cpydst = * p + + ;
if ( ! is_space_octet ( * cpydst + + ) ) last = cpydst ;
}
value . len = last - value . ptr ;
if ( * p ! = ' \n ' ) goto badhdr ;
if ( * ( cpydst - 1 ) = = ' \r ' ) cpydst - - ;
}
while ( is_purespace_octet ( * + + p ) ) ;
}
* last = ' \0 ' ;
/* insert the new field to the header table */
{
struct hdr_cbserter_ctx_t ctx ;
ctx . htrd = htrd ;
ctx . vptr = value . ptr ;
ctx . vlen = value . len ;
htrd - > errnum = MIO_HTRD_ENOERR ;
if ( mio_htb_cbsert (
tab , name . ptr , name . len ,
hdr_cbserter , & ctx ) = = MIO_NULL )
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
htrd - > errnum = MIO_HTRD_ENOMEM ;
return MIO_NULL ;
}
}
return p ;
badhdr :
htrd - > errnum = MIO_HTRD_EBADHDR ;
return MIO_NULL ;
}
static MIO_INLINE int parse_initial_line_and_headers (
2020-04-30 16:20:31 +00:00
mio_htrd_t * htrd , const mio_bch_t * req , mio_oow_t rlen )
2020-03-03 13:47:51 +00:00
{
mio_bch_t * p ;
/* add the actual request */
if ( push_to_buffer ( htrd , & htrd - > fed . b . raw , req , rlen ) < = - 1 ) return - 1 ;
/* add the terminating null for easier parsing */
if ( push_to_buffer ( htrd , & htrd - > fed . b . raw , & NUL , 1 ) < = - 1 ) return - 1 ;
2020-05-01 18:01:29 +00:00
p = MIO_BECS_PTR ( & htrd - > fed . b . raw ) ;
2020-03-03 13:47:51 +00:00
#if 0
if ( htrd - > option & MIO_HTRD_SKIPEMPTYLINES )
while ( is_whspace_octet ( * p ) ) p + + ;
else
# endif
while ( is_space_octet ( * p ) ) p + + ;
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , * p ! = ' \0 ' ) ;
2020-03-03 13:47:51 +00:00
/* parse the initial line */
if ( ! ( htrd - > option & MIO_HTRD_SKIPINITIALLINE ) )
{
p = parse_initial_line ( htrd , p ) ;
if ( p = = MIO_NULL ) return - 1 ;
}
/* parse header fields */
do
{
while ( is_whspace_octet ( * p ) ) p + + ;
if ( * p = = ' \0 ' ) break ;
/* TODO: return error if protocol is 0.9.
* HTTP / 0.9 must not get headers . . . */
p = parse_header_field ( htrd , p , & htrd - > re . hdrtab ) ;
if ( p = = MIO_NULL ) return - 1 ;
}
while ( 1 ) ;
return 0 ;
}
/* chunk parsing phases */
# define GET_CHUNK_DONE 0
# define GET_CHUNK_LEN 1
# define GET_CHUNK_DATA 2
# define GET_CHUNK_CRLF 3
# define GET_CHUNK_TRAILERS 4
2020-04-30 16:20:31 +00:00
static const mio_bch_t * getchunklen ( mio_htrd_t * htrd , const mio_bch_t * ptr , mio_oow_t len )
2020-03-03 13:47:51 +00:00
{
const mio_bch_t * end = ptr + len ;
/* this function must be called in the GET_CHUNK_LEN context */
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , htrd - > fed . s . chunk . phase = = GET_CHUNK_LEN ) ;
2020-03-03 13:47:51 +00:00
if ( htrd - > fed . s . chunk . count < = 0 )
{
/* skip leading spaces if the first character of
* the chunk length has not been read yet */
while ( ptr < end & & is_space_octet ( * ptr ) ) ptr + + ;
}
while ( ptr < end )
{
int n = xdigit_to_num ( * ptr ) ;
if ( n < = - 1 ) break ;
htrd - > fed . s . chunk . len = htrd - > fed . s . chunk . len * 16 + n ;
htrd - > fed . s . chunk . count + + ;
ptr + + ;
}
/* skip trailing spaces if the length has been read */
while ( ptr < end & & is_space_octet ( * ptr ) ) ptr + + ;
if ( ptr < end )
{
if ( * ptr = = ' \n ' )
{
/* the chunk length line ended properly */
if ( htrd - > fed . s . chunk . count < = 0 )
{
/* empty line - no more chunk */
htrd - > fed . s . chunk . phase = GET_CHUNK_DONE ;
}
else if ( htrd - > fed . s . chunk . len < = 0 )
{
/* length explicity specified to 0
get trailing headers . . . . */
htrd - > fed . s . chunk . phase = GET_CHUNK_TRAILERS ;
}
else
{
/* ready to read the chunk data... */
htrd - > fed . s . chunk . phase = GET_CHUNK_DATA ;
}
htrd - > fed . s . need = htrd - > fed . s . chunk . len ;
ptr + + ;
}
else
{
htrd - > errnum = MIO_HTRD_EBADRE ;
return MIO_NULL ;
}
}
return ptr ;
}
static const mio_bch_t * get_trailing_headers (
mio_htrd_t * htrd , const mio_bch_t * req , const mio_bch_t * end )
{
const mio_bch_t * ptr = req ;
while ( ptr < end )
{
register mio_bch_t b = * ptr + + ;
switch ( b )
{
case ' \0 ' :
/* guarantee that the request does not contain a null
* character */
htrd - > errnum = MIO_HTRD_EBADRE ;
return MIO_NULL ;
case ' \n ' :
if ( htrd - > fed . s . crlf < = 1 )
{
htrd - > fed . s . crlf = 2 ;
break ;
}
else
{
mio_bch_t * p ;
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , htrd - > fed . s . crlf < = 3 ) ;
2020-03-03 13:47:51 +00:00
htrd - > fed . s . crlf = 0 ;
if ( push_to_buffer (
htrd , & htrd - > fed . b . tra , req , ptr - req ) < = - 1 )
return MIO_NULL ;
if ( push_to_buffer (
htrd , & htrd - > fed . b . tra , & NUL , 1 ) < = - 1 )
return MIO_NULL ;
2020-05-01 18:01:29 +00:00
p = MIO_BECS_PTR ( & htrd - > fed . b . tra ) ;
2020-03-03 13:47:51 +00:00
do
{
while ( is_whspace_octet ( * p ) ) p + + ;
if ( * p = = ' \0 ' ) break ;
/* TODO: return error if protocol is 0.9.
* HTTP / 0.9 must not get headers . . . */
p = parse_header_field (
htrd , p ,
( ( htrd - > option & MIO_HTRD_TRAILERS ) ? & htrd - > re . trailers : & htrd - > re . hdrtab )
) ;
if ( p = = MIO_NULL ) return MIO_NULL ;
}
while ( 1 ) ;
htrd - > fed . s . chunk . phase = GET_CHUNK_DONE ;
goto done ;
}
case ' \r ' :
if ( htrd - > fed . s . crlf = = 0 | | htrd - > fed . s . crlf = = 2 )
htrd - > fed . s . crlf + + ;
else htrd - > fed . s . crlf = 1 ;
break ;
default :
/* mark that neither CR nor LF was seen */
htrd - > fed . s . crlf = 0 ;
break ;
}
}
if ( push_to_buffer ( htrd , & htrd - > fed . b . tra , req , ptr - req ) < = - 1 )
return MIO_NULL ;
done :
return ptr ;
}
/* feed the percent encoded string */
2020-05-15 06:18:49 +00:00
int mio_htrd_feed ( mio_htrd_t * htrd , const mio_bch_t * req , mio_oow_t len , mio_oow_t * rem )
2020-03-03 13:47:51 +00:00
{
const mio_bch_t * end = req + len ;
const mio_bch_t * ptr = req ;
int header_completed_during_this_feed = 0 ;
2020-04-30 16:20:31 +00:00
mio_oow_t avail ;
2020-03-03 13:47:51 +00:00
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , len > 0 ) ;
2020-03-03 13:47:51 +00:00
if ( htrd - > flags & FEEDING_SUSPENDED )
{
htrd - > errnum = MIO_HTRD_ESUSPENDED ;
return - 1 ;
}
/*if (htrd->option & MIO_HTRD_DUMMY)*/
if ( htrd - > flags & FEEDING_DUMMIFIED )
{
/* treat everything as contents.
* i don ' t care about headers or whatsoever . */
2020-05-15 06:18:49 +00:00
return push_content ( htrd , req , len ) ;
2020-03-03 13:47:51 +00:00
}
/* does this goto drop code maintainability? */
if ( htrd - > fed . s . need > 0 )
{
/* we're in need of as many octets as htrd->fed.s.need
* for contents body . make a proper jump to resume
* content handling */
goto content_resume ;
}
switch ( htrd - > fed . s . chunk . phase )
{
case GET_CHUNK_LEN :
goto dechunk_resume ;
case GET_CHUNK_DATA :
/* this won't be reached as htrd->fed.s.need
* is greater than 0 if GET_CHUNK_DATA is true */
goto content_resume ;
case GET_CHUNK_CRLF :
goto dechunk_crlf ;
case GET_CHUNK_TRAILERS :
goto dechunk_get_trailers ;
}
htrd - > clean = 0 ; /* mark that htrd is in need of some data */
while ( ptr < end )
{
register mio_bch_t b = * ptr + + ;
#if 0
if ( htrd - > option & MIO_HTRD_SKIPEMPTYLINES & &
htrd - > fed . s . plen < = 0 & & is_whspace_octet ( b ) )
{
/* let's drop leading whitespaces across multiple
* lines */
req + + ;
continue ;
}
# endif
switch ( b )
{
case ' \0 ' :
/* guarantee that the request does not contain
* a null character */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
case ' \n ' :
{
if ( htrd - > fed . s . crlf < = 1 )
{
/* htrd->fed.s.crlf == 0
* = > CR was not seen
* htrd - > fed . s . crlf = = 1
* = > CR was seen
* whatever the current case is ,
* mark the first LF is seen here .
*/
htrd - > fed . s . crlf = 2 ;
}
else
{
/* htrd->fed.s.crlf == 2
* = > no 2 nd CR before LF
* htrd - > fed . s . crlf = = 3
* = > 2 nd CR before LF
*/
/* we got a complete request header. */
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , htrd - > fed . s . crlf < = 3 ) ;
2020-05-15 06:18:49 +00:00
2020-03-03 13:47:51 +00:00
/* reset the crlf state */
htrd - > fed . s . crlf = 0 ;
/* reset the raw request length */
htrd - > fed . s . plen = 0 ;
if ( parse_initial_line_and_headers ( htrd , req , ptr - req ) < = - 1 ) return - 1 ;
/* compelete request header is received */
header_completed_during_this_feed = 1 ;
if ( htrd - > option & MIO_HTRD_PEEKONLY )
{
/* when MIO_HTRD_PEEKONLY is set,
* the peek callback is invoked once
* a complete header is seen . the caller
* should not feed more data by calling
* this function again once the callback is
* invoked . the trailing data is appended
* to the content buffer .
*
* NOTE : if the current feed that completed
* the header contains the next request ,
* the next request is treated as if it
* belongs to the current request .
*
* In priciple , this option was added for
* reading CGI outputs . So it comes with
* awkwardity described above .
*/
2020-05-15 06:18:49 +00:00
if ( ptr < end & & push_content ( htrd , ptr , end - ptr ) < = - 1 ) return - 1 ;
2020-03-03 13:47:51 +00:00
/* i don't really know if it is really completed
* with content . MIO_HTRD_PEEKONLY is not compatible
* with the completed state . anyway , let me complete
* it . */
mio_htre_completecontent ( & htrd - > re ) ;
/* this jump is only to invoke the peek
* callback . this function should not be fed
* more . */
goto feedme_more ;
}
/* carry on processing content body fed together with the header */
if ( htrd - > re . flags & MIO_HTRE_ATTR_CHUNKED )
{
/* transfer-encoding: chunked */
2020-05-15 06:18:49 +00:00
/*MIO_ASSERT (htrd->mio, !(htrd->re.flags & MIO_HTRE_ATTR_LENGTH)); <- this assertion is wrong. non-conforming client may include content-length while transfer-encoding is chunked*/
2020-03-03 13:47:51 +00:00
dechunk_start :
htrd - > fed . s . chunk . phase = GET_CHUNK_LEN ;
htrd - > fed . s . chunk . len = 0 ;
htrd - > fed . s . chunk . count = 0 ;
dechunk_resume :
2020-05-15 06:18:49 +00:00
ptr = getchunklen ( htrd , ptr , end - ptr ) ;
if ( MIO_UNLIKELY ( ! ptr ) ) return - 1 ;
2020-03-03 13:47:51 +00:00
if ( htrd - > fed . s . chunk . phase = = GET_CHUNK_LEN )
{
/* still in the GET_CHUNK_LEN state.
* the length has been partially read . */
goto feedme_more ;
}
else if ( htrd - > fed . s . chunk . phase = = GET_CHUNK_TRAILERS )
{
/* this state is reached after the
* last chunk length 0 is read . The next
* empty line immediately completes
* a content body . so i need to adjust
* this crlf status to 2 as if a trailing
* header line has been read . */
htrd - > fed . s . crlf = 2 ;
dechunk_get_trailers :
2020-05-15 06:18:49 +00:00
ptr = get_trailing_headers ( htrd , ptr , end ) ;
if ( ! MIO_UNLIKELY ( ptr ) ) return - 1 ;
2020-03-03 13:47:51 +00:00
if ( htrd - > fed . s . chunk . phase = = GET_CHUNK_TRAILERS )
{
/* still in the same state.
* the trailers have not been processed fully */
goto feedme_more ;
}
}
}
else
{
/* we need to read as many octets as
* Content - Length */
if ( ( htrd - > option & MIO_HTRD_RESPONSE ) & &
! ( htrd - > re . flags & MIO_HTRE_ATTR_LENGTH ) & &
! ( htrd - > re . flags & MIO_HTRE_ATTR_KEEPALIVE ) )
{
/* for a response, no content-length and
* no chunk are specified and ' connection '
* is to close . i must read until the
* connection is closed . however , there isn ' t
* any good way to know when to stop from
* within this function . so the caller
* can call mio_htrd_halt ( ) for this . */
/* set this to the maximum in a type safe way
* assuming it ' s unsigned . the problem of
* the current implementation is that
* it can ' t receive more than */
htrd - > fed . s . need = 0 ;
htrd - > fed . s . need = ~ htrd - > fed . s . need ;
htrd - > fed . s . flags | = CONSUME_UNTIL_CLOSE ;
}
else if ( ( htrd - > option & MIO_HTRD_RESPONSE ) & &
! ( htrd - > re . flags & MIO_HTRE_ATTR_LENGTH ) & &
( htrd - > re . flags & MIO_HTRE_ATTR_KEEPALIVE ) )
{
/*
* what the hell !
* no content - length , but keep - alive and not chunked .
* there ' s no way to know how large the contents is .
*
* For a request ' http : //php.net/manual/en/function.curl-strerror.php' containing the following header fields:
* If - Modified - Since : Fri , 31 Oct 2014 11 : 12 : 47 GMT
* Accept - Encoding : gzip , deflate
*
* the service gave this response as of this writing :
*
HTTP / 1.1 304 Not Modified
Server : nginx / 1.6 .2
Date : Tue , 04 Nov 2014 15 : 45 : 46 GMT
Connection : keep - alive
Vary : Accept - Encoding
Set - Cookie : LAST_LANG = en ; expires = Wed , 04 - Nov - 2015 15 : 45 : 46 GMT ; Max - Age = 31536000 ; path = / ; domain = . php . net
Set - Cookie : COUNTRY = KOR % 2 C220 .121 .110 .171 ; expires = Tue , 11 - Nov - 2014 15 : 45 : 46 GMT ; Max - Age = 604800 ; path = / ; domain = . php . net
XXXXXXXX
*
* XXXXXXX is some compressed garbage included in the contents - body .
* why does the service behave this way ? is it a server bug or am i doing anything wrong ?
*
* < < WORKAROUND > >
* i decided to drop whatever trailing data avaiable
* after the header fields for this feeding .
* if more contents are fed in later , it will still
* end up with a bad request error . */
ptr = end ;
htrd - > fed . s . need = 0 ;
}
else
{
htrd - > fed . s . need = htrd - > re . attr . content_length ;
}
}
if ( htrd - > fed . s . need > 0 )
{
/* content-length or chunked data length
* specified */
content_resume :
avail = end - ptr ;
if ( avail < = 0 )
{
/* we didn't get a complete content yet */
/* avail can be 0 if data fed ends with
* a chunk length withtout actual data .
* so i check if avail is greater than 0
* in order not to push empty content . */
goto feedme_more ;
}
else if ( avail < htrd - > fed . s . need )
{
/* the data is not as large as needed */
if ( push_content ( htrd , ptr , avail ) < = - 1 ) return - 1 ;
if ( ! ( htrd - > fed . s . flags & CONSUME_UNTIL_CLOSE ) )
{
/* i don't decrement htrd->fed.s.need
* if i should read until connection is closed .
* well , unless set your own callback ,
* push_content ( ) above will fail
* if too much has been received already */
htrd - > fed . s . need - = avail ;
}
/* we didn't get a complete content yet */
goto feedme_more ;
}
else
{
/* we got all or more than needed */
if ( push_content ( htrd , ptr , htrd - > fed . s . need ) < = - 1 ) return - 1 ;
ptr + = htrd - > fed . s . need ;
if ( ! ( htrd - > fed . s . flags & CONSUME_UNTIL_CLOSE ) )
htrd - > fed . s . need = 0 ;
}
}
if ( htrd - > fed . s . chunk . phase = = GET_CHUNK_DATA )
{
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , htrd - > fed . s . need = = 0 ) ;
2020-03-03 13:47:51 +00:00
htrd - > fed . s . chunk . phase = GET_CHUNK_CRLF ;
dechunk_crlf :
while ( ptr < end & & is_space_octet ( * ptr ) ) ptr + + ;
if ( ptr < end )
{
if ( * ptr = = ' \n ' )
{
/* end of chunk data. */
ptr + + ;
/* more octets still available.
* let it decode the next chunk
*/
if ( ptr < end ) goto dechunk_start ;
/* no more octets available after
* chunk data . the chunk state variables
* need to be reset when a jump is made
* to dechunk_resume upon the next call
*/
htrd - > fed . s . chunk . phase = GET_CHUNK_LEN ;
htrd - > fed . s . chunk . len = 0 ;
htrd - > fed . s . chunk . count = 0 ;
goto feedme_more ;
}
else
{
/* redundant character ... */
htrd - > errnum = MIO_HTRD_EBADRE ;
return - 1 ;
}
}
else
{
/* data not enough */
goto feedme_more ;
}
}
/* the content has been received fully */
mio_htre_completecontent ( & htrd - > re ) ;
if ( header_completed_during_this_feed & & htrd - > recbs - > peek )
{
/* the peek handler has not been executed.
* this can happen if this function is fed with
* at least the ending part of a complete header
* plus complete content body and the header
* of the next request . */
int n ;
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ENOERR ;
2020-05-08 09:48:26 +00:00
n = htrd - > recbs - > peek ( htrd , & htrd - > re ) ;
2020-03-03 13:47:51 +00:00
if ( n < = - 1 )
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ERECBS ;
2020-03-03 13:47:51 +00:00
/* need to clear request on error?
clear_feed ( htrd ) ; */
return - 1 ;
}
header_completed_during_this_feed = 0 ;
}
if ( htrd - > recbs - > poke )
{
int n ;
htrd - > errnum = MIO_HTRD_ENOERR ;
2020-05-08 09:48:26 +00:00
n = htrd - > recbs - > poke ( htrd , & htrd - > re ) ;
2020-03-03 13:47:51 +00:00
if ( n < = - 1 )
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ERECBS ;
2020-03-03 13:47:51 +00:00
/* need to clear request on error?
clear_feed ( htrd ) ; */
return - 1 ;
}
}
#if 0
mio_printf ( MIO_T ( " CONTENT_LENGTH %d, RAW HEADER LENGTH %d \n " ) ,
2020-05-01 18:01:29 +00:00
( int ) MIO_BECS_LEN ( & htrd - > re . content ) ,
( int ) MIO_BECS_LEN ( & htrd - > fed . b . raw ) ) ;
2020-03-03 13:47:51 +00:00
# endif
clear_feed ( htrd ) ;
2020-05-15 06:18:49 +00:00
if ( rem )
{
/* stop even if there are fed data left */
* rem = end - ptr ; /* remaining feeds */
return 0 ; /* to indicate completed when the 'rem' is not NULL */
}
else if ( ptr > = end )
{
/* no more feeds to handle */
return 0 ;
}
if ( htrd - > flags & FEEDING_SUSPENDED ) /* in case the callback called mio_htrd_suspend() */
2020-03-03 13:47:51 +00:00
{
htrd - > errnum = MIO_HTRD_ESUSPENDED ;
return - 1 ;
}
/*if (htrd->option & MIO_HTRD_DUMMY)*/
2020-05-15 06:18:49 +00:00
if ( htrd - > flags & FEEDING_DUMMIFIED ) /* in case the callback called mio_htrd_dummify() */
2020-03-03 13:47:51 +00:00
{
/* once the mode changes to RAW in a callback,
* left - over is pushed as contents */
if ( ptr < end )
2020-05-15 06:18:49 +00:00
return push_content ( htrd , ptr , end - ptr ) ;
2020-03-03 13:47:51 +00:00
else
return 0 ;
}
/* let ptr point to the next character to LF or
* the optional contents */
req = ptr ;
/* since there are more to handle, i mark that
* htrd is in need of some data . this may
* not be really compatible with SKIPEMPTYLINES .
* SHOULD I simply remove the option ? */
htrd - > clean = 0 ;
}
break ;
}
case ' \r ' :
if ( htrd - > fed . s . crlf = = 0 | | htrd - > fed . s . crlf = = 2 )
htrd - > fed . s . crlf + + ;
else htrd - > fed . s . crlf = 1 ;
break ;
default :
/* increment length of a request in raw
* excluding crlf */
htrd - > fed . s . plen + + ;
/* mark that neither CR nor LF was seen */
htrd - > fed . s . crlf = 0 ;
}
}
if ( ptr > req )
{
/* enbuffer the incomplete request */
2020-05-15 06:18:49 +00:00
if ( push_to_buffer ( htrd , & htrd - > fed . b . raw , req , ptr - req ) < = - 1 ) return - 1 ;
2020-03-03 13:47:51 +00:00
}
feedme_more :
if ( header_completed_during_this_feed & & htrd - > recbs - > peek )
{
int n ;
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ENOERR ;
n = htrd - > recbs - > peek ( htrd , & htrd - > re ) ;
2020-03-03 13:47:51 +00:00
if ( n < = - 1 )
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ERECBS ;
2020-03-03 13:47:51 +00:00
/* need to clear request on error?
clear_feed ( htrd ) ; */
return - 1 ;
}
}
2020-05-15 06:18:49 +00:00
if ( rem ) * rem = 0 ;
2020-03-03 13:47:51 +00:00
return 0 ;
}
int mio_htrd_halt ( mio_htrd_t * htrd )
{
2020-05-15 06:18:49 +00:00
if ( ( htrd - > fed . s . flags & CONSUME_UNTIL_CLOSE ) | | ! htrd - > clean )
2020-03-03 13:47:51 +00:00
{
mio_htre_completecontent ( & htrd - > re ) ;
if ( htrd - > recbs - > poke )
{
int n ;
htrd - > errnum = MIO_HTRD_ENOERR ;
n = htrd - > recbs - > poke ( htrd , & htrd - > re ) ;
if ( n < = - 1 )
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
2020-05-15 06:18:49 +00:00
htrd - > errnum = MIO_HTRD_ERECBS ;
2020-03-03 13:47:51 +00:00
/* need to clear request on error?
clear_feed ( htrd ) ; */
return - 1 ;
}
}
clear_feed ( htrd ) ;
}
return 0 ;
}
void mio_htrd_suspend ( mio_htrd_t * htrd )
{
htrd - > flags | = FEEDING_SUSPENDED ;
}
void mio_htrd_resume ( mio_htrd_t * htrd )
{
htrd - > flags & = ~ FEEDING_SUSPENDED ;
}
void mio_htrd_dummify ( mio_htrd_t * htrd )
{
htrd - > flags | = FEEDING_DUMMIFIED ;
}
void mio_htrd_undummify ( mio_htrd_t * htrd )
{
htrd - > flags & = ~ FEEDING_DUMMIFIED ;
}
#if 0
2020-05-01 18:01:29 +00:00
int mio_htrd_scanqparam ( mio_htrd_t * htrd , const mio_bcs_t * cstr )
2020-03-03 13:47:51 +00:00
{
2020-05-01 18:01:29 +00:00
mio_bcs_t key , val ;
2020-03-03 13:47:51 +00:00
const mio_bch_t * p , * end ;
mio_bch_t * out ;
if ( cstr = = MIO_NULL ) cstr = mio_htre_getqparamcstr ( & htrd - > re ) ;
p = cstr - > ptr ;
if ( p = = MIO_NULL ) return 0 ; /* no param string to scan */
end = p + cstr - > len ;
/* a key and a value pair including two terminating null
* can ' t exceed the the qparamstrlen + 2. only + 1 below as there is
* one more space for an internal terminating null */
2020-05-01 18:01:29 +00:00
mio_becs_setlen ( & htrd - > tmp . qparam , cstr - > len + 1 ) ;
2020-03-03 13:47:51 +00:00
/* let out point to the beginning of the qparam buffer.
* the loop below emits percent - decode key and value to this buffer . */
2020-05-01 18:01:29 +00:00
out = MIO_BECS_PTR ( & htrd - > tmp . qparam ) ;
2020-03-03 13:47:51 +00:00
key . ptr = out ; key . len = 0 ;
val . ptr = MIO_NULL ; val . len = 0 ;
do
{
if ( p > = end | | * p = = ' & ' | | * p = = ' ; ' )
{
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , key . ptr ! = MIO_NULL ) ;
2020-03-03 13:47:51 +00:00
* out + + = ' \0 ' ;
if ( val . ptr = = MIO_NULL )
{
if ( key . len = = 0 )
{
/* both key and value are empty.
* we don ' t need to do anything */
goto next_octet ;
}
val . ptr = out ;
* out + + = ' \0 ' ;
2020-05-01 18:01:29 +00:00
MIO_ASSERT ( htrd - > mio , val . len = = 0 ) ;
2020-03-03 13:47:51 +00:00
}
2020-05-01 18:01:29 +00:00
/* set request parameter string callback before scanning */
MIO_ASSERT ( htrd - > mio , htrd - > recbs - > qparamstr ! = MIO_NULL ) ;
2020-03-03 13:47:51 +00:00
htrd - > errnum = MIO_HTRD_ENOERR ;
2020-05-15 06:18:49 +00:00
if ( htrd - > recbs - > qparamstr ( htrd , & key , & val ) < = - 1 )
2020-03-03 13:47:51 +00:00
{
if ( htrd - > errnum = = MIO_HTRD_ENOERR )
htrd - > errnum = MIO_HTRD_ERECBS ;
return - 1 ;
}
next_octet :
if ( p > = end ) break ;
p + + ;
2020-05-01 18:01:29 +00:00
out = MIO_BECS_PTR ( & htrd - > tmp . qparam ) ;
2020-03-03 13:47:51 +00:00
key . ptr = out ; key . len = 0 ;
val . ptr = MIO_NULL ; val . len = 0 ;
}
else if ( * p = = ' = ' )
{
* out + + = ' \0 ' ; p + + ;
val . ptr = out ;
/*val.len = 0; */
}
else
{
if ( * p = = ' % ' & & p + 2 < = end )
{
int q = xdigit_to_num ( * ( p + 1 ) ) ;
if ( q > = 0 )
{
int w = xdigit_to_num ( * ( p + 2 ) ) ;
if ( w > = 0 )
{
/* unlike the path part, we don't care if it
* contains a null character */
* out + + = ( ( q < < 4 ) + w ) ;
p + = 3 ;
goto next ;
}
}
}
* out + + = * p + + ;
next :
if ( val . ptr ) val . len + + ;
else key . len + + ;
}
}
while ( 1 ) ;
2020-05-01 18:01:29 +00:00
mio_becs_clear ( & htrd - > tmp . qparam ) ;
2020-03-03 13:47:51 +00:00
return 0 ;
}
# endif