flush WIP
[m6w6/ext-http] / php_http_header_parser.c
1 /*
2 +--------------------------------------------------------------------+
3 | PECL :: http |
4 +--------------------------------------------------------------------+
5 | Redistribution and use in source and binary forms, with or without |
6 | modification, are permitted provided that the conditions mentioned |
7 | in the accompanying LICENSE file are met. |
8 +--------------------------------------------------------------------+
9 | Copyright (c) 2004-2014, Michael Wallner <mike@php.net> |
10 +--------------------------------------------------------------------+
11 */
12
13 #include "php_http_api.h"
14
15 typedef struct php_http_header_parser_state_spec {
16 php_http_header_parser_state_t state;
17 unsigned need_data:1;
18 } php_http_header_parser_state_spec_t;
19
20 static const php_http_header_parser_state_spec_t php_http_header_parser_states[] = {
21 {PHP_HTTP_HEADER_PARSER_STATE_START, 1},
22 {PHP_HTTP_HEADER_PARSER_STATE_KEY, 1},
23 {PHP_HTTP_HEADER_PARSER_STATE_VALUE, 1},
24 {PHP_HTTP_HEADER_PARSER_STATE_VALUE_EX, 1},
25 {PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE, 0},
26 {PHP_HTTP_HEADER_PARSER_STATE_DONE, 0}
27 };
28
29 php_http_header_parser_t *php_http_header_parser_init(php_http_header_parser_t *parser)
30 {
31 if (!parser) {
32 parser = emalloc(sizeof(*parser));
33 }
34 memset(parser, 0, sizeof(*parser));
35
36 return parser;
37 }
38
39 php_http_header_parser_state_t php_http_header_parser_state_push(php_http_header_parser_t *parser, unsigned argc, ...)
40 {
41 va_list va_args;
42 unsigned i;
43 php_http_header_parser_state_t state = 0;
44
45 /* short circuit */
46 ZEND_PTR_STACK_RESIZE_IF_NEEDED((&parser->stack), argc);
47
48 va_start(va_args, argc);
49 for (i = 0; i < argc; ++i) {
50 state = va_arg(va_args, php_http_header_parser_state_t);
51 zend_ptr_stack_push(&parser->stack, (void *) state);
52 }
53 va_end(va_args);
54
55 return state;
56 }
57
58 php_http_header_parser_state_t php_http_header_parser_state_is(php_http_header_parser_t *parser)
59 {
60 if (parser->stack.top) {
61 return (php_http_header_parser_state_t) parser->stack.elements[parser->stack.top - 1];
62 }
63
64 return PHP_HTTP_HEADER_PARSER_STATE_START;
65 }
66
67 php_http_header_parser_state_t php_http_header_parser_state_pop(php_http_header_parser_t *parser)
68 {
69 if (parser->stack.top) {
70 return (php_http_header_parser_state_t) zend_ptr_stack_pop(&parser->stack);
71 }
72
73 return PHP_HTTP_HEADER_PARSER_STATE_START;
74 }
75
76 void php_http_header_parser_dtor(php_http_header_parser_t *parser)
77 {
78 zend_ptr_stack_destroy(&parser->stack);
79 php_http_info_dtor(&parser->info);
80 PTR_FREE(parser->_key.str);
81 PTR_FREE(parser->_val.str);
82 }
83
84 void php_http_header_parser_free(php_http_header_parser_t **parser)
85 {
86 if (*parser) {
87 php_http_header_parser_dtor(*parser);
88 efree(*parser);
89 *parser = NULL;
90 }
91 }
92
93 php_http_header_parser_state_t php_http_header_parser_parse(php_http_header_parser_t *parser, php_http_buffer_t *buffer, unsigned flags, HashTable *headers, php_http_info_callback_t callback_func, void *callback_arg)
94 {
95 while (buffer->used || !php_http_header_parser_states[php_http_header_parser_state_is(parser)].need_data) {
96 #if 0
97 const char *state[] = {"START", "KEY", "VALUE", "HEADER_DONE", "DONE"};
98 fprintf(stderr, "#HP: %s (avail:%zu, num:%d)\n", php_http_header_parser_state_is(parser) < 0 ? "FAILURE" : state[php_http_header_parser_state_is(parser)], buffer->used, headers?zend_hash_num_elements(headers):0);
99 _dpf(0, buffer->data, buffer->used);
100 #endif
101 switch (php_http_header_parser_state_pop(parser)) {
102 case PHP_HTTP_HEADER_PARSER_STATE_FAILURE:
103 return php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_FAILURE);
104
105 case PHP_HTTP_HEADER_PARSER_STATE_START: {
106 char *ptr = buffer->data;
107
108 while (ptr - buffer->data < buffer->used && PHP_HTTP_IS_CTYPE(space, *ptr)) {
109 ++ptr;
110 }
111
112 php_http_buffer_cut(buffer, 0, ptr - buffer->data);
113 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_KEY);
114 break;
115 }
116
117 case PHP_HTTP_HEADER_PARSER_STATE_KEY: {
118 const char *colon, *eol_str = NULL;
119 int eol_len = 0;
120
121 if (buffer->data == (eol_str = php_http_locate_bin_eol(buffer->data, buffer->used, &eol_len))) {
122 /* end of headers */
123 php_http_buffer_cut(buffer, 0, eol_len);
124 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_DONE);
125 } else if (php_http_info_parse(&parser->info, php_http_buffer_fix(buffer)->data)) {
126 /* new message starting with request/response line */
127 if (callback_func) {
128 callback_func(callback_arg, &headers, &parser->info);
129 }
130 php_http_info_dtor(&parser->info);
131 php_http_buffer_cut(buffer, 0, eol_str + eol_len - buffer->data);
132 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE);
133 } else if ((colon = memchr(buffer->data, ':', buffer->used)) && (!eol_str || eol_str > colon)) {
134 /* header: string */
135 parser->_key.str = estrndup(buffer->data, parser->_key.len = colon - buffer->data);
136 while (PHP_HTTP_IS_CTYPE(space, *++colon) && *colon != '\n' && *colon != '\r');
137 php_http_buffer_cut(buffer, 0, colon - buffer->data);
138 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_VALUE);
139 } else {
140 /* neither reqeust/response line nor header: string */
141 return php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_FAILURE);
142 }
143 break;
144 }
145
146 case PHP_HTTP_HEADER_PARSER_STATE_VALUE: {
147 const char *eol_str;
148 int eol_len;
149
150 #define SET_ADD_VAL(slen, eol_len) \
151 do { \
152 const char *ptr = buffer->data; \
153 size_t len = slen; \
154 \
155 while (len > 0 && PHP_HTTP_IS_CTYPE(space, *ptr)) { \
156 ++ptr; \
157 --len; \
158 } \
159 while (len > 0 && PHP_HTTP_IS_CTYPE(space, ptr[len - 1])) { \
160 --len; \
161 } \
162 \
163 if (len > 0) { \
164 if (parser->_val.str) { \
165 parser->_val.str = erealloc(parser->_val.str, parser->_val.len + len + 2); \
166 parser->_val.str[parser->_val.len++] = ' '; \
167 memcpy(&parser->_val.str[parser->_val.len], ptr, len); \
168 parser->_val.len += len; \
169 parser->_val.str[parser->_val.len] = '\0'; \
170 } else { \
171 parser->_val.len = len; \
172 parser->_val.str = estrndup(ptr, len); \
173 } \
174 } \
175 php_http_buffer_cut(buffer, 0, slen + eol_len); \
176 } while (0)
177
178 if ((eol_str = php_http_locate_bin_eol(buffer->data, buffer->used, &eol_len))) {
179 SET_ADD_VAL(eol_str - buffer->data, eol_len);
180
181 if (buffer->used) {
182 if (*buffer->data != '\t' && *buffer->data != ' ') {
183 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE);
184 break;
185 } else {
186 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_VALUE);
187 break;
188 }
189 }
190 }
191
192 if (flags & PHP_HTTP_HEADER_PARSER_CLEANUP) {
193 if (buffer->used) {
194 SET_ADD_VAL(buffer->used, 0);
195 }
196 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE);
197 } else {
198 return php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_VALUE_EX);
199 }
200 break;
201 }
202
203 case PHP_HTTP_HEADER_PARSER_STATE_VALUE_EX:
204 if (*buffer->data == ' ' || *buffer->data == '\t') {
205 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_VALUE);
206 } else {
207 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE);
208 }
209 break;
210
211 case PHP_HTTP_HEADER_PARSER_STATE_HEADER_DONE:
212 if (parser->_key.str && parser->_val.str) {
213 zval tmp, *exist;
214
215 if (!headers && callback_func) {
216 callback_func(callback_arg, &headers, NULL);
217 }
218
219 php_http_pretty_key(parser->_key.str, parser->_key.len, 1, 1);
220 if ((exist = zend_symtable_str_find(headers, parser->_key.str, parser->_key.len))) {
221 convert_to_array(exist);
222 add_next_index_str(exist, php_http_cs2zs(parser->_val.str, parser->_val.len));
223 } else {
224 ZVAL_STR(&tmp, php_http_cs2zs(parser->_val.str, parser->_val.len));
225 zend_symtable_str_update(headers, parser->_key.str, parser->_key.len, &tmp);
226 }
227 parser->_val.str = NULL;
228 }
229
230 PTR_SET(parser->_key.str, NULL);
231 PTR_SET(parser->_val.str, NULL);
232
233 php_http_header_parser_state_push(parser, 1, PHP_HTTP_HEADER_PARSER_STATE_KEY);
234 break;
235
236 case PHP_HTTP_HEADER_PARSER_STATE_DONE:
237 return PHP_HTTP_HEADER_PARSER_STATE_DONE;
238 }
239 }
240
241 return php_http_header_parser_state_is(parser);
242 }
243
244 /*
245 * Local variables:
246 * tab-width: 4
247 * c-basic-offset: 4
248 * End:
249 * vim600: noet sw=4 ts=4 fdm=marker
250 * vim<600: noet sw=4 ts=4
251 */
252