doubango/tinyHTTP/src/parsers/thttp_parser_message.c
c732d49e
 #if HAVE_CRT
 #define _CRTDBG_MAP_ALLOC 
 #include <stdlib.h> 
 #include <crtdbg.h>
 #endif //HAVE_CRT
 
 /* #line 1 "./ragel/thttp_parser_message.rl" */
 /*
74ca6d11
 * Copyright (C) 2020, University of the Basque Country (UPV/EHU)
c732d49e
 * Contact for licensing options: <licensing-mcpttclient(at)mcopenplatform(dot)com>
 *
 * The original file was part of Open Source Doubango Framework
 * Copyright (C) 2010-2011 Mamadou Diop.
 * Copyright (C) 2012 Doubango Telecom <http://doubango.org>
 *
 * This file is part of Open Source Doubango Framework.
 *
 * DOUBANGO is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * DOUBANGO is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with DOUBANGO.
 *
 */
 
 /**@file thttp_parser_message.c
  * @brief HTTP parser.
  *
  */
 #include "tinyhttp/parsers/thttp_parser_message.h"
 #include "tinyhttp/parsers/thttp_parser_header.h"
 
 #include "tinyhttp/parsers/thttp_parser_url.h"
 
 #include "tsk_debug.h"
 #include "tsk_memory.h"
 
 /* Runs the generated state machine over [state->p, state->pe) and fills `message`. */
 static void thttp_message_parser_execute(tsk_ragel_state_t *state, thttp_message_t *message, tsk_bool_t extract_content);
 /* Puts the state machine in its start state (writes state->cs). */
 static void thttp_message_parser_init(tsk_ragel_state_t *state);
 /* End-of-headers handler called from within the state machine; extracts the content when requested. */
 static void thttp_message_parser_eoh(tsk_ragel_state_t *state, thttp_message_t *message, tsk_bool_t extract_content);
 
 /***********************************
 *	Ragel state machine.
 */
 
 /* #line 159 "./ragel/thttp_parser_message.rl" */
 
 
 
 TSK_RAGEL_DISABLE_WARNINGS_BEGIN()
 /* Ragel data */
 
 /* #line 50 "./src/parsers/thttp_parser_message.c" */
 static const char _thttp_machine_parser_message_actions[] = {
 	0, 1, 0, 1, 1, 1, 2, 1, 
 	3, 1, 4, 1, 5, 1, 6, 1, 
 	7, 2, 0, 5, 2, 6, 0
 };
 
 static const unsigned char _thttp_machine_parser_message_key_offsets[] = {
 	0, 0, 16, 31, 31, 32, 34, 36, 
 	38, 40, 41, 43, 46, 48, 51, 52, 
 	53, 54, 55, 56, 57, 74, 91, 108, 
 	122, 124, 127, 129, 132, 134, 136, 138, 
 	139, 155, 171, 177, 183
 };
 
 static const char _thttp_machine_parser_message_trans_keys[] = {
 	33, 37, 39, 72, 104, 126, 42, 43, 
 	45, 46, 48, 57, 65, 90, 95, 122, 
 	32, 33, 37, 39, 126, 42, 43, 45, 
 	46, 48, 57, 65, 90, 95, 122, 32, 
 	72, 104, 84, 116, 84, 116, 80, 112, 
 	47, 48, 57, 46, 48, 57, 48, 57, 
 	13, 48, 57, 10, 13, 13, 10, 13, 
 	10, 32, 33, 37, 39, 84, 116, 126, 
 	42, 43, 45, 46, 48, 57, 65, 90, 
 	95, 122, 32, 33, 37, 39, 84, 116, 
 	126, 42, 43, 45, 46, 48, 57, 65, 
 	90, 95, 122, 32, 33, 37, 39, 80, 
 	112, 126, 42, 43, 45, 46, 48, 57, 
 	65, 90, 95, 122, 32, 33, 37, 39, 
 	47, 126, 42, 43, 45, 57, 65, 90, 
 	95, 122, 48, 57, 46, 48, 57, 48, 
 	57, 32, 48, 57, 48, 57, 48, 57, 
 	48, 57, 32, 13, 37, 60, 62, 96, 
 	127, 0, 8, 10, 31, 34, 35, 91, 
 	94, 123, 125, 13, 37, 60, 62, 96, 
 	127, 0, 8, 10, 31, 34, 35, 91, 
 	94, 123, 125, 48, 57, 65, 70, 97, 
 	102, 48, 57, 65, 70, 97, 102, 0
 };
 
 static const char _thttp_machine_parser_message_single_lengths[] = {
 	0, 6, 5, 0, 1, 2, 2, 2, 
 	2, 1, 0, 1, 0, 1, 1, 1, 
 	1, 1, 1, 1, 7, 7, 7, 6, 
 	0, 1, 0, 1, 0, 0, 0, 1, 
 	6, 6, 0, 0, 0
 };
 
 static const char _thttp_machine_parser_message_range_lengths[] = {
 	0, 5, 5, 0, 0, 0, 0, 0, 
 	0, 0, 1, 1, 1, 1, 0, 0, 
 	0, 0, 0, 0, 5, 5, 5, 4, 
 	1, 1, 1, 1, 1, 1, 1, 0, 
 	5, 5, 3, 3, 0
 };
 
 static const unsigned char _thttp_machine_parser_message_index_offsets[] = {
 	0, 0, 12, 23, 24, 26, 29, 32, 
 	35, 38, 40, 42, 45, 47, 50, 52, 
 	54, 56, 58, 60, 62, 75, 88, 101, 
 	112, 114, 117, 119, 122, 124, 126, 128, 
 	130, 142, 154, 158, 162
 };
 
 static const char _thttp_machine_parser_message_indicies[] = {
 	0, 0, 0, 2, 2, 0, 0, 0, 
 	0, 0, 0, 1, 3, 4, 4, 4, 
 	4, 4, 4, 4, 4, 4, 1, 5, 
 	7, 6, 8, 8, 1, 9, 9, 1, 
 	10, 10, 1, 11, 11, 1, 12, 1, 
 	13, 1, 14, 13, 1, 15, 1, 16, 
 	15, 1, 17, 1, 19, 18, 21, 20, 
 	22, 1, 24, 23, 25, 1, 3, 4, 
 	4, 4, 26, 26, 4, 4, 4, 4, 
 	4, 4, 1, 3, 4, 4, 4, 27, 
 	27, 4, 4, 4, 4, 4, 4, 1, 
 	3, 4, 4, 4, 28, 28, 4, 4, 
 	4, 4, 4, 4, 1, 3, 4, 4, 
 	4, 29, 4, 4, 4, 4, 4, 1, 
 	30, 1, 31, 30, 1, 32, 1, 33, 
 	32, 1, 34, 1, 35, 1, 36, 1, 
 	37, 1, 39, 40, 1, 1, 1, 1, 
 	1, 1, 1, 1, 1, 38, 42, 43, 
 	1, 1, 1, 1, 1, 1, 1, 1, 
 	1, 41, 44, 44, 44, 1, 41, 41, 
 	41, 1, 45, 0
 };
 
 static const char _thttp_machine_parser_message_trans_targs[] = {
 	2, 0, 20, 3, 2, 4, 4, 5, 
 	6, 7, 8, 9, 10, 11, 12, 13, 
 	14, 15, 16, 19, 16, 17, 18, 16, 
 	19, 36, 21, 22, 23, 24, 25, 26, 
 	27, 28, 29, 30, 31, 32, 33, 14, 
 	34, 33, 14, 34, 35, 36
 };
 
 static const char _thttp_machine_parser_message_trans_actions[] = {
 	1, 0, 1, 3, 0, 1, 0, 5, 
 	1, 0, 0, 0, 0, 0, 0, 0, 
 	7, 0, 1, 0, 0, 0, 0, 20, 
 	13, 15, 0, 0, 0, 0, 0, 0, 
 	0, 7, 1, 0, 0, 9, 1, 17, 
 	1, 0, 11, 0, 0, 0
 };
 
 static const int thttp_machine_parser_message_start = 1;
 static const int thttp_machine_parser_message_first_final = 36;
 static const int thttp_machine_parser_message_error = 0;
 
 static const int thttp_machine_parser_message_en_main = 1;
 
 
 /* #line 165 "./ragel/thttp_parser_message.rl" */
 TSK_RAGEL_DISABLE_WARNINGS_END()
 
 /**	Parses raw HTTP buffer.
  *
  * @param state	Ragel state containing the buffer references. Must be non-null and
  * reference a non-empty buffer (state->p < state->pe).
  * @param result	In/out @ref thttp_message_t object representing the raw buffer. Must be
  * non-null. If *result is null a new message is created with thttp_message_create(),
  * otherwise the supplied message is filled. When parsing fails *result is released
  * through TSK_OBJECT_SAFE_FREE().
  * @param	extract_content	Indicates whether to extract the message content or not. The flag
  * is forwarded to the end-of-headers handler: the content is only looked at when it is
  * true; when it is false only the start line and the headers are parsed.
  *
  * @retval	Zero if succeed and non-zero error code otherwise:
  * -1 for invalid parameters, -2 when the buffer is not a valid HTTP message and
  * -3 when the message object could not be created.
 **/
 int thttp_message_parse(tsk_ragel_state_t *state, thttp_message_t **result, tsk_bool_t extract_content)
 {
 	if(!state || !result || state->pe <= state->p){
 		return -1;
 	}
 
 	/* Lazily create the output message; without this check a failed creation
 	 * would hand a null message to the state machine actions. */
 	if(!*result && !(*result = thttp_message_create())){
 		TSK_DEBUG_ERROR("Failed to create HTTP message.");
 		return -3;
 	}
 
 	/* Ragel init */
 	thttp_message_parser_init(state);
 
 	/*
 	*	State machine execution.
 	*/
 	thttp_message_parser_execute(state, *result, extract_content);
 
 	/* Check result: any state below the first final state means the input was rejected or is incomplete. */
 	if(state->cs < thttp_machine_parser_message_first_final){
 		TSK_DEBUG_ERROR("Failed to parse HTTP message.");
 		TSK_OBJECT_SAFE_FREE(*result);
 		return -2;
 	}
 	return 0;
 }
 
 
 /* Prepares `state` for a fresh parse by selecting the start state of the
  * generated machine. Only state->cs is written. */
 static void thttp_message_parser_init(tsk_ragel_state_t *state)
 {
 	/* Ragel machine initialization. */
 	state->cs = thttp_machine_parser_message_start;
 }
 
 /* Returns a zero-terminated heap copy of the `len` bytes starting at `start`.
  * Returns NULL when `len` is negative or when the allocation fails. */
 static void *thttp_message_parser_dup_tag(const char *start, int len)
 {
 	void *copy;
 
 	if(len < 0){
 		return NULL;
 	}
 #if HAVE_CRT //Debug memory
 	copy = calloc(1, (size_t)len + 1);
 #else
 	copy = tsk_calloc(1, (size_t)len + 1);
 #endif //HAVE_CRT
 	if(copy){
 		memcpy(copy, start, (size_t)len);
 	}
 	return copy;
 }
 
 /* Runs the table-driven state machine over the buffer referenced by `state`.
  *
  * state           : in/out Ragel state. cs, p, pe and eof are read on entry and written
  *                   back on exit; tag_start/tag_end are updated by the actions.
  * message         : message filled by the actions (start line, headers, content).
  * extract_content : forwarded to thttp_message_parser_eoh() at the end of the headers.
  *
  * The function returns nothing; the caller inspects state->cs. An action aborts the
  * parse by moving the local `cs` to the error state, which makes the driver leave
  * its loop at the `_again` label.
  */
 static void thttp_message_parser_execute(tsk_ragel_state_t *state, thttp_message_t *message, tsk_bool_t extract_content)
 {
 	int cs = state->cs;
 	const char *p = state->p;
 	const char *pe = state->pe;
 	const char *eof = state->eof;
 
 	TSK_RAGEL_DISABLE_WARNINGS_BEGIN()
 	
 /* #line 234 "./src/parsers/thttp_parser_message.c" */
 	{
 	int _klen;
 	unsigned int _trans;
 	const char *_acts;
 	unsigned int _nacts;
 	const char *_keys;
 
 	if ( p == pe )
 		goto _test_eof;
 	if ( cs == 0 )
 		goto _out;
 _resume:
 	_keys = _thttp_machine_parser_message_trans_keys + _thttp_machine_parser_message_key_offsets[cs];
 	_trans = _thttp_machine_parser_message_index_offsets[cs];
 
 	/* Binary search among the single keys of the current state. */
 	_klen = _thttp_machine_parser_message_single_lengths[cs];
 	if ( _klen > 0 ) {
 		const char *_lower = _keys;
 		const char *_mid;
 		const char *_upper = _keys + _klen - 1;
 		while (1) {
 			if ( _upper < _lower )
 				break;
 
 			_mid = _lower + ((_upper-_lower) >> 1);
 			if ( (*p) < *_mid )
 				_upper = _mid - 1;
 			else if ( (*p) > *_mid )
 				_lower = _mid + 1;
 			else {
 				_trans += (_mid - _keys);
 				goto _match;
 			}
 		}
 		_keys += _klen;
 		_trans += _klen;
 	}
 
 	/* Binary search among the (low, high) range keys of the current state. */
 	_klen = _thttp_machine_parser_message_range_lengths[cs];
 	if ( _klen > 0 ) {
 		const char *_lower = _keys;
 		const char *_mid;
 		const char *_upper = _keys + (_klen<<1) - 2;
 		while (1) {
 			if ( _upper < _lower )
 				break;
 
 			_mid = _lower + (((_upper-_lower) >> 1) & ~1);
 			if ( (*p) < _mid[0] )
 				_upper = _mid - 2;
 			else if ( (*p) > _mid[1] )
 				_lower = _mid + 2;
 			else {
 				_trans += ((_mid - _keys)>>1);
 				goto _match;
 			}
 		}
 		_trans += _klen;
 	}
 
 _match:
 	_trans = _thttp_machine_parser_message_indicies[_trans];
 	cs = _thttp_machine_parser_message_trans_targs[_trans];
 
 	if ( _thttp_machine_parser_message_trans_actions[_trans] == 0 )
 		goto _again;
 
 	_acts = _thttp_machine_parser_message_actions + _thttp_machine_parser_message_trans_actions[_trans];
 	_nacts = (unsigned int) *_acts++;
 	while ( _nacts-- > 0 )
 	{
 		switch ( *_acts++ )
 		{
 	case 0:
 /* #line 43 "./ragel/thttp_parser_message.rl" */
 	{
 		/* tag: remember where the current token starts */
 		state->tag_start = p;
 	}
 	break;
 	case 1:
 /* #line 48 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_method: the token is the request method */
 		int len;
 		state->tag_end = p;
 		len = (int)(state->tag_end  - state->tag_start);
 
 		if(message->type == thttp_unknown){
 			message->type = thttp_request;
 			if(!message->line.request.method){
 				message->line.request.method = thttp_message_parser_dup_tag(state->tag_start, len);
 				if(!message->line.request.method){
 					/* allocation failure: abort the parse */
 					cs = thttp_machine_parser_message_error;
 				}
 			}
 		}
 		else{
 			/* The message type is already known: abort. The driver works on the local
 			 * `cs` and copies it to state->cs on exit, so the local must be updated. */
 			cs = thttp_machine_parser_message_error;
 		}
 	}
 	break;
 	case 2:
 /* #line 66 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_requesturl: the token is the request URL */
 		int len;
 		state->tag_end = p;
 		len = (int)(state->tag_end  - state->tag_start);
 		
 		if(!message->line.request.url){
 			message->line.request.url = thttp_url_parse(state->tag_start, (tsk_size_t)len);
 		}
 	}
 	break;
 	case 3:
 /* #line 77 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_version: the token is the HTTP version */
 		int len;
 		state->tag_end = p;
 		len = (int)(state->tag_end  - state->tag_start);
 
 		if(!message->http_version){
 			message->http_version = thttp_message_parser_dup_tag(state->tag_start, len);
 			if(!message->http_version){
 				/* allocation failure: abort the parse */
 				cs = thttp_machine_parser_message_error;
 			}
 		}
 	}
 	break;
 	case 4:
 /* #line 89 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_status_code: the token is the response status code */
 		state->tag_end = p;
 		
 		if(message->type == thttp_unknown){
 			message->type = thttp_response;
 			message->line.response.status_code = atoi(state->tag_start);
 		}
 		else{
 			/* Same as for the method: abort through the local `cs`. */
 			cs = thttp_machine_parser_message_error;
 		}
 	}
 	break;
 	case 5:
 /* #line 104 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_reason_phrase: the token is the response reason phrase */
 		int len;
 		state->tag_end = p;
 		len = (int)(state->tag_end  - state->tag_start);
 
 		if(!message->line.response.reason_phrase){
 			message->line.response.reason_phrase = thttp_message_parser_dup_tag(state->tag_start, len);
 			if(!message->line.response.reason_phrase){
 				/* allocation failure: abort the parse */
 				cs = thttp_machine_parser_message_error;
 			}
 		}
 	}
 	break;
 	case 6:
 /* #line 116 "./ragel/thttp_parser_message.rl" */
 	{
 		/* parse_header: hand the [tag_start, tag_end) span to the header parser */
 		int len;
 		state->tag_end = p;
 		len = (int)(state->tag_end  - state->tag_start);
 		
 		if(thttp_header_parse(state, message)){
 			/* Bound the output to the header itself: tag_start points into the raw
 			 * buffer and is not terminated at the end of the header. */
 			TSK_DEBUG_ERROR("Failed to parse header - %.*s", len, state->tag_start);
 		}
 	}
 	break;
 	case 7:
 /* #line 139 "./ragel/thttp_parser_message.rl" */
 	{
 		/* eoh: publish the local cursor, let the handler move it, then reload it */
 		state->cs = cs;
 		state->p = p;
 		state->pe = pe;
 		state->eof = eof;
 
 		thttp_message_parser_eoh(state, message, extract_content);
 
 		cs = state->cs;
 		p = state->p;
 		pe = state->pe;
 		eof = state->eof;
 	}
 	break;
 /* #line 418 "./src/parsers/thttp_parser_message.c" */
 		}
 	}
 
 _again:
 	if ( cs == 0 )
 		goto _out;
 	if ( ++p != pe )
 		goto _resume;
 	_test_eof: {}
 	_out: {}
 	}
 
 /* #line 224 "./ragel/thttp_parser_message.rl" */
 	TSK_RAGEL_DISABLE_WARNINGS_END()
 
 	state->cs = cs;
 	state->p = p;
 	state->pe = pe;
 	state->eof = eof;
 }
 
 /* End-of-headers handler, called by the state machine with state->p on the last
  * character of the header section.
  *
  * state           : in/out Ragel state; only state->p may be modified.
  * message         : message being built; nothing is done when it is null.
  * extract_content : when false the function leaves the state untouched.
  *
  * When content extraction is requested and THTTP_MESSAGE_CONTENT_LENGTH() is non-zero:
  *  - if the whole content is available after the cursor and message->Content is not
  *    set yet, the content is copied into message->Content and the cursor is moved
  *    onto its last byte;
  *  - otherwise the cursor is moved onto the last byte of the buffer.
  */
 static void thttp_message_parser_eoh(tsk_ragel_state_t *state, thttp_message_t *message, tsk_bool_t extract_content)
 {
 	const char *p = state->p;
 	const char *pe = state->pe;
 
 	if(extract_content && message){
 		uint32_t clen = THTTP_MESSAGE_CONTENT_LENGTH(message);
 		if(clen){
 			/* Compare lengths rather than pointers: the content length comes from the
 			 * peer, and computing (p + clen) beyond the end of the buffer is undefined
 			 * behaviour that may wrap around and defeat the bounds check. */
 			if(!message->Content && pe > p && (uint64_t)clen < (uint64_t)(pe - p)){
 				message->Content = tsk_buffer_create((p+1), clen);
 				p = (p + clen);
 			}
 			else{
 				p = (pe - 1);
 			}
 		}
 	}
 	//%%write eof;
 
 	/* cs, pe and eof are never changed here, only the cursor has to be published. */
 	state->p = p;
 }