/*
 * Descriptor for one message parser state, used as the element type of the
 * php_http_message_parser_states table.
 *
 * NOTE(review): only the `state` member is visible in this view, but the
 * table initialisers supply a second value per entry and the parse loop reads
 * a `.need_data` member. A second member appears to be missing here; confirm
 * against the complete file.
 */
3 typedef struct php_http_message_parser_state_spec
{
4 php_http_message_parser_state_t state
;
6 } php_http_message_parser_state_spec_t
;
/*
 * State table: one entry per parser state, each pairing the state with a
 * 0/1 value that the parse loop reads as `need_data`.
 *
 * The parse loop indexes this array directly with the current state value
 * and keeps iterating while the buffer is non-empty OR the current state's
 * need_data value is 0. States marked 1 therefore stop the loop once the
 * buffer has been drained; states marked 0 are processed even with an empty
 * buffer.
 *
 * NOTE(review): because the array is indexed by state value, the entry order
 * presumably has to match the numeric values of the state enum, and a state
 * with no entry (e.g. the FAILURE state handled in the parse switch) must
 * never be used as an index. The enum is not visible here; confirm.
 */
8 static const php_http_message_parser_state_spec_t php_http_message_parser_states
[] = {
9 {PHP_HTTP_MESSAGE_PARSER_STATE_START
, 1},
10 {PHP_HTTP_MESSAGE_PARSER_STATE_HEADER
, 1},
11 {PHP_HTTP_MESSAGE_PARSER_STATE_HEADER_DONE
, 0},
12 {PHP_HTTP_MESSAGE_PARSER_STATE_BODY
, 0},
13 {PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DUMB
, 1},
14 {PHP_HTTP_MESSAGE_PARSER_STATE_BODY_LENGTH
, 1},
15 {PHP_HTTP_MESSAGE_PARSER_STATE_BODY_CHUNKED
, 1},
16 {PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DONE
, 0},
17 {PHP_HTTP_MESSAGE_PARSER_STATE_DONE
, 0}
/*
 * Initialise a message parser.
 *
 * The visible steps are: allocate the parser with emalloc, zero the whole
 * structure, store the thread-safety context in parser->ts, initialise the
 * embedded header parser and initialise the state stack.
 *
 * NOTE(review): the emalloc is presumably guarded by a check for a NULL
 * `parser` argument, and the function presumably returns `parser`; neither
 * the guard nor the return statement is visible in this view.
 */
20 PHP_HTTP_API php_http_message_parser_t
*php_http_message_parser_init(php_http_message_parser_t
*parser TSRMLS_DC
)
23 parser
= emalloc(sizeof(*parser
));
/* Zeroing also leaves parser->dechunk and parser->inflate as NULL, which the
 * destructor relies on when deciding whether to free them. */
25 memset(parser
, 0, sizeof(*parser
));
27 TSRMLS_SET_CTX(parser
->ts
);
29 php_http_header_parser_init(&parser
->header TSRMLS_CC
);
30 zend_stack_init(&parser
->stack
);
/*
 * Push `argc` states onto the parser's state stack.
 *
 * The states are read from the variadic arguments in call order and pushed
 * one by one, so the LAST argument ends up on top of the stack and is the
 * next state the parse loop will pop.
 *
 * NOTE(review): the declarations of `va_args` and `i`, a matching va_end and
 * the return statement are not visible in this view. Callers use the return
 * value as a parser state; confirm which state is returned and that va_end
 * is called.
 */
35 PHP_HTTP_API php_http_message_parser_state_t
php_http_message_parser_state_push(php_http_message_parser_t
*parser
, unsigned argc
, ...)
39 va_start(va_args
, argc
);
40 php_http_message_parser_state_t state
;
42 for (i
= 0; i
< argc
; ++i
) {
43 state
= va_arg(va_args
, php_http_message_parser_state_t
);
/* The stack is handed the address and size of the local, i.e. it is asked
 * to store the state by value. */
44 zend_stack_push(&parser
->stack
, &state
, sizeof(state
));
/*
 * Report the parser's current state without modifying the stack.
 *
 * Looks at the top element of parser->stack. The final visible statement
 * returns PHP_HTTP_MESSAGE_PARSER_STATE_START, which presumably is the
 * fallback when the stack has no top element.
 *
 * NOTE(review): the body of the success branch (presumably returning the
 * state that `state` points to) is not visible in this view.
 */
51 PHP_HTTP_API php_http_message_parser_state_t
php_http_message_parser_state_is(php_http_message_parser_t
*parser
)
53 php_http_message_parser_state_t
*state
;
55 if (SUCCESS
== zend_stack_top(&parser
->stack
, (void *) &state
)) {
58 return PHP_HTTP_MESSAGE_PARSER_STATE_START
;
/*
 * Remove the current state from the parser's state stack.
 *
 * When the stack has a top element it is deleted from the stack. The final
 * visible statement returns PHP_HTTP_MESSAGE_PARSER_STATE_START, which
 * presumably is the fallback for an empty stack.
 *
 * NOTE(review): the statements that copy the top element into `state` before
 * it is deleted, and that return it, are not visible in this view; confirm
 * the value is copied before zend_stack_del_top runs.
 */
61 PHP_HTTP_API php_http_message_parser_state_t
php_http_message_parser_state_pop(php_http_message_parser_t
*parser
)
63 php_http_message_parser_state_t state
, *state_ptr
;
64 if (SUCCESS
== zend_stack_top(&parser
->stack
, (void *) &state_ptr
)) {
66 zend_stack_del_top(&parser
->stack
);
69 return PHP_HTTP_MESSAGE_PARSER_STATE_START
;
/*
 * Release everything owned by a message parser, but not the parser itself.
 *
 * Destroys the embedded header parser and the state stack, then frees the
 * dechunk and inflate encoding streams if they were created.
 *
 * NOTE(review): TSRMLS_CC is used below but no thread-safety context fetch
 * for this function is visible in this view; confirm one precedes these
 * calls.
 */
72 PHP_HTTP_API
void php_http_message_parser_dtor(php_http_message_parser_t
*parser
)
74 php_http_header_parser_dtor(&parser
->header
);
75 zend_stack_destroy(&parser
->stack
);
/* The streams are only created on demand by the parse function, so either
 * pointer may still be NULL here. */
76 if (parser
->dechunk
) {
77 php_http_encoding_stream_free(&parser
->dechunk TSRMLS_CC
);
79 if (parser
->inflate
) {
80 php_http_encoding_stream_free(&parser
->inflate TSRMLS_CC
);
/*
 * Destroy the parser referenced through `parser`.
 *
 * The only visible step runs php_http_message_parser_dtor on *parser.
 *
 * NOTE(review): given the pointer-to-pointer parameter, this presumably also
 * checks *parser for NULL, releases the parser's memory and resets *parser;
 * none of that is visible in this view.
 */
84 PHP_HTTP_API
void php_http_message_parser_free(php_http_message_parser_t
**parser
)
87 php_http_message_parser_dtor(*parser
);
/*
 * Run the message parser state machine over `buffer`, filling `*message`.
 *
 * Each loop iteration pops the current state and dispatches on it; the
 * handler for that state pushes the follow-up state(s). The loop continues
 * while the buffer holds data or the current state's need_data table value
 * is 0. The function returns the state on top of the stack when the loop
 * ends, or returns early on failure and from the header state.
 *
 * parser  - parser whose stack, header parser and encoding streams are used
 * buffer  - input data; consumed portions are cut from its front
 * flags   - PHP_HTTP_MESSAGE_PARSER_CLEANUP is forwarded to the header parser
 * message - message being populated (headers, body, type)
 *
 * NOTE(review): this view of the function is missing lines. Locals such as
 * str, len, cut, stop, dec_len and zcl are used without visible
 * declarations, and no break statements or closing braces are visible. The
 * comments below describe only what can be seen.
 */
94 PHP_HTTP_API php_http_message_parser_state_t
php_http_message_parser_parse(php_http_message_parser_t
*parser
, php_http_buffer
*buffer
, unsigned flags
, php_http_message_t
**message
)
96 TSRMLS_FETCH_FROM_CTX(parser
->ts
);
/* Keep going while there is input left, or while the current state is one
 * that can make progress without input (need_data == 0 in the table). */
101 while (buffer
->used
|| !php_http_message_parser_states
[php_http_message_parser_state_is(parser
)].need_data
) {
/* Debug trace: state name, message type and number of buffered bytes.
 * The name array is indexed by the current state value; note that the
 * chunked state is labelled "BODY_CHUNK" here. Presumably compiled only in
 * debug builds; the guarding preprocessor lines are not visible. */
103 const char *state
[] = {"START", "HEADER", "HEADER_DONE", "BODY", "BODY_DUMB", "BODY_LENGTH", "BODY_CHUNK", "BODY_DONE", "DONE"};
104 fprintf(stderr
, "#MP: %s (%d) %zu\n",
105 state
[php_http_message_parser_state_is(parser
)], (*message
)->type
, buffer
->used
);
/* The current state is removed from the stack here; every handler below is
 * responsible for pushing whatever state should come next. */
108 switch (php_http_message_parser_state_pop(parser
))
/* FAILURE: push the failure state back so it stays on the stack, and
 * return what the push returns. */
110 case PHP_HTTP_MESSAGE_PARSER_STATE_FAILURE
:
111 return php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_FAILURE
);
/* START: skip leading whitespace in the buffer, cut it off, then move on
 * to header parsing. */
113 case PHP_HTTP_MESSAGE_PARSER_STATE_START
:
115 char *ptr
= buffer
->data
;
117 while (ptr
- buffer
->data
< buffer
->used
&& PHP_HTTP_IS_CTYPE(space
, *ptr
)) {
121 php_http_buffer_cut(buffer
, 0, ptr
- buffer
->data
);
124 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_HEADER
);
/* HEADER: delegate to the header parser, which fills (*message)->hdrs and
 * reports the request/response info line through the info callback. */
129 case PHP_HTTP_MESSAGE_PARSER_STATE_HEADER
:
131 unsigned header_parser_flags
= (flags
& PHP_HTTP_MESSAGE_PARSER_CLEANUP
) ? PHP_HTTP_HEADER_PARSER_CLEANUP
: 0;
133 switch (php_http_header_parser_parse(&parser
->header
, buffer
, header_parser_flags
, &(*message
)->hdrs
, (php_http_info_callback_t
) php_http_message_info_callback
, message
)) {
/* NOTE(review): this path returns FAILURE without pushing it onto the
 * stack, unlike the other failure paths in this function, which return
 * the result of pushing FAILURE. Confirm that is intended. */
134 case PHP_HTTP_HEADER_PARSER_STATE_FAILURE
:
135 return PHP_HTTP_MESSAGE_PARSER_STATE_FAILURE
;
137 case PHP_HTTP_HEADER_PARSER_STATE_DONE
:
138 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_HEADER_DONE
);
/* Presumably the default branch (headers not finished yet): HEADER is
 * pushed back and returned to the caller. The case label is not visible. */
142 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_HEADER
);
144 return PHP_HTTP_MESSAGE_PARSER_STATE_HEADER
;
/* HEADER_DONE: inspect the framing headers, preserve them under
 * "X-Original-*" names, and decide how the body will be read. */
150 case PHP_HTTP_MESSAGE_PARSER_STATE_HEADER_DONE
:
152 zval
*h
, **h_cl
= NULL
, **h_cr
= NULL
, **h_te
= NULL
;
/* Transfer-Encoding: copy to X-Original-Transfer-Encoding (h_te receives
 * the stored slot) and remove the original header. */
154 if ((h
= php_http_message_header(*message
, ZEND_STRL("Transfer-Encoding"), 1))) {
155 zend_hash_update(&(*message
)->hdrs
, "X-Original-Transfer-Encoding", sizeof("X-Original-Transfer-Encoding"), &h
, sizeof(zval
*), (void *) &h_te
);
156 zend_hash_del(&(*message
)->hdrs
, "Transfer-Encoding", sizeof("Transfer-Encoding"));
/* Content-Length: copy to X-Original-Content-Length (h_cl receives the
 * stored slot). No deletion of the original is visible for this header. */
158 if ((h
= php_http_message_header(*message
, ZEND_STRL("Content-Length"), 1))) {
159 zend_hash_update(&(*message
)->hdrs
, "X-Original-Content-Length", sizeof("X-Original-Content-Length"), &h
, sizeof(zval
*), (void *) &h_cl
);
/* Content-Range: copy to X-Original-Content-Range (h_cr receives the
 * stored slot) and remove the original header. */
161 if ((h
= php_http_message_header(*message
, ZEND_STRL("Content-Range"), 1))) {
162 zend_hash_update(&(*message
)->hdrs
, "X-Original-Content-Range", sizeof("X-Original-Content-Range"), &h
, sizeof(zval
*), (void *) &h_cr
);
163 zend_hash_del(&(*message
)->hdrs
, "Content-Range", sizeof("Content-Range"));
/* Content-Encoding: for gzip/deflate bodies create the inflate stream, then
 * move the header to X-Original-Content-Encoding.
 * NOTE(review): the "x-gzip" test is redundant, since any value containing
 * "x-gzip" already matches the "gzip" substring test before it. */
166 if ((h
= php_http_message_header(*message
, ZEND_STRL("Content-Encoding"), 1))) {
167 if (strstr(Z_STRVAL_P(h
), "gzip") || strstr(Z_STRVAL_P(h
), "x-gzip") || strstr(Z_STRVAL_P(h
), "deflate")) {
168 parser
->inflate
= php_http_encoding_stream_init(parser
->inflate
, php_http_encoding_stream_get_inflate_ops(), 0 TSRMLS_CC
);
169 zend_hash_update(&(*message
)->hdrs
, "X-Original-Content-Encoding", sizeof("X-Original-Content-Encoding"), &h
, sizeof(zval
*), NULL
);
170 zend_hash_del(&(*message
)->hdrs
, "Content-Encoding", sizeof("Content-Encoding"));
/* Stores `h` as the message's Content-Length header.
 * NOTE(review): the statements that give `h` its value for this update are
 * not visible in this view. */
179 zend_hash_update(&(*message
)->hdrs
, "Content-Length", sizeof("Content-Length"), &h
, sizeof(zval
*), NULL
);
/* Chunked transfer encoding: create the dechunk stream and read the body
 * in the chunked state.
 * NOTE(review): h_te is NULL when no Transfer-Encoding header was found;
 * presumably an `if (h_te)` guard precedes this, but it is not visible. */
182 if (strstr(Z_STRVAL_PP(h_te
), "chunked")) {
183 parser
->dechunk
= php_http_encoding_stream_init(parser
->dechunk
, php_http_encoding_stream_get_dechunk_ops(), 0 TSRMLS_CC
);
184 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_CHUNKED
);
/* Content-Length framing: parse the decimal length; `stop` differing from
 * the start of the string means at least one digit was consumed.
 * NOTE(review): h_cl is NULL when no Content-Length header was found;
 * presumably guarded by a check that is not visible. */
192 parser
->body_length
= strtoul(Z_STRVAL_PP(h_cl
), &stop
, 10);
194 if (stop
!= Z_STRVAL_PP(h_cl
)) {
195 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_LENGTH
);
/* Content-Range framing: derive the body length from a
 * "bytes<sep>start-end/total" value. */
201 ulong total
= 0, start
= 0, end
= 0;
/* NOTE(review): the prefix test reads *h_cr, but the three separator tests
 * below read `h`. The last visible assignment to `h` is the Content-Encoding
 * lookup above, so here `h` may be NULL or refer to a different header.
 * This looks like it should be Z_STRVAL_PP(h_cr) in all three places. */
203 if (!strncasecmp(Z_STRVAL_PP(h_cr
), "bytes", lenof("bytes"))
204 && ( Z_STRVAL_P(h
)[lenof("bytes")] == ':'
205 || Z_STRVAL_P(h
)[lenof("bytes")] == ' '
206 || Z_STRVAL_P(h
)[lenof("bytes")] == '='
209 char *total_at
= NULL
, *end_at
= NULL
;
/* sizeof("bytes") counts the terminating NUL, so this skips the word
 * "bytes" plus the single separator character tested above. */
210 char *start_at
= Z_STRVAL_PP(h_cr
) + sizeof("bytes");
212 start
= strtoul(start_at
, &end_at
, 10);
/* end_at + 1 steps over the character that ended the first number
 * (presumably the '-' between start and end). */
214 end
= strtoul(end_at
+ 1, &total_at
, 10);
/* A total of "*" means unknown; in that case `total` stays 0. */
215 if (total_at
&& strncmp(total_at
+ 1, "*", 1)) {
216 total
= strtoul(total_at
+ 1, NULL
, 10);
/* Accept the range only if it is ordered and, when a total is known, ends
 * before it. The range is inclusive, hence end + 1 - start bytes. */
219 if (end
>= start
&& (!total
|| end
< total
)) {
220 parser
->body_length
= end
+ 1 - start
;
221 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_LENGTH
);
/* No usable framing information: a request is treated as complete, anything
 * else is read in the dumb body state (presumably the else branch; the
 * `else` itself is not visible). */
229 if ((*message
)->type
== PHP_HTTP_REQUEST
) {
230 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_DONE
);
232 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DUMB
);
/* BODY: write the pending data (str/len, set up by the body state that
 * pushed BODY) to the message body, optionally inflating it first. */
237 case PHP_HTTP_MESSAGE_PARSER_STATE_BODY
:
241 if (parser
->inflate
) {
242 char *dec_str
= NULL
;
245 if (SUCCESS
!= php_http_encoding_stream_update(parser
->inflate
, str
, len
, &dec_str
, &dec_len TSRMLS_CC
)) {
246 return php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_FAILURE
);
/* str no longer pointing into the buffer presumably means it is a
 * separately allocated decoded string; the branch body is not visible. */
249 if (str
!= buffer
->data
) {
/* Append to the body stream, then drop the `cut` consumed bytes from the
 * front of the input buffer. */
256 php_stream_write(php_http_message_body_stream(&(*message
)->body
), str
, len
);
257 php_http_buffer_cut(buffer
, 0, cut
);
/* Keep the Content-Length header in sync with the body size so far. */
261 ZVAL_LONG(zcl
, php_http_message_body_size(&(*message
)->body
));
262 zend_hash_update(&(*message
)->hdrs
, "Content-Length", sizeof("Content-Length"), &zcl
, sizeof(zval
*), NULL
);
264 if (str
!= buffer
->data
) {
/* BODY_DUMB: no framing known. BODY is pushed last so it runs next; under
 * it goes BODY_DONE if the buffer is empty, otherwise BODY_DUMB again. */
273 case PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DUMB
:
279 php_http_message_parser_state_push(parser
, 2, !buffer
->used
?PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DONE
:PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DUMB
, PHP_HTTP_MESSAGE_PARSER_STATE_BODY
);
/* BODY_LENGTH: take at most the remaining body length from the buffer and
 * decrement the remainder. BODY runs next; under it goes BODY_DONE when
 * nothing remains, otherwise BODY_LENGTH again. */
283 case PHP_HTTP_MESSAGE_PARSER_STATE_BODY_LENGTH
:
285 len
= MIN(parser
->body_length
, buffer
->used
);
289 parser
->body_length
-= len
;
291 php_http_message_parser_state_push(parser
, 2, !parser
->body_length
?PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DONE
:PHP_HTTP_MESSAGE_PARSER_STATE_BODY_LENGTH
, PHP_HTTP_MESSAGE_PARSER_STATE_BODY
);
/* BODY_CHUNKED: the four lines that follow the case label are the remains
 * of the original explanatory comment (its delimiters are not visible). */
295 case PHP_HTTP_MESSAGE_PARSER_STATE_BODY_CHUNKED
:
298 * - pass available data through the dechunk stream
299 * - pass decoded data along
300 * - if stream zeroed:
301 * Y: - cut processed string out of buffer, but leave length of unprocessed dechunk stream data untouched
305 char *dec_str
= NULL
;
/* Feed everything currently buffered into the dechunk stream. */
308 if (SUCCESS
!= php_http_encoding_stream_update(parser
->dechunk
, buffer
->data
, buffer
->used
, &dec_str
, &dec_len TSRMLS_CC
)) {
/* Stream finished: whatever the dechunk stream still holds unprocessed is
 * left in the input buffer; only the rest is cut. BODY runs next, then
 * BODY_DONE. */
315 if (php_http_encoding_stream_done(parser
->dechunk
)) {
316 cut
= buffer
->used
- PHP_HTTP_BUFFER_LEN(parser
->dechunk
->ctx
);
317 php_http_message_parser_state_push(parser
, 2, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DONE
, PHP_HTTP_MESSAGE_PARSER_STATE_BODY
);
/* Stream not finished (presumably the else branch): BODY runs next, then
 * BODY_CHUNKED again. */
320 php_http_message_parser_state_push(parser
, 2, PHP_HTTP_MESSAGE_PARSER_STATE_BODY_CHUNKED
, PHP_HTTP_MESSAGE_PARSER_STATE_BODY
);
/* BODY_DONE: queue DONE, then flush the dechunk stream if one was used. */
325 case PHP_HTTP_MESSAGE_PARSER_STATE_BODY_DONE
:
327 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_DONE
);
329 if (parser
->dechunk
) {
330 char *dec_str
= NULL
;
333 if (SUCCESS
!= php_http_encoding_stream_finish(parser
->dechunk
, &dec_str
, &dec_len TSRMLS_CC
)) {
334 return php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_FAILURE
);
/* NOTE(review): parser->dechunk is not reset after this dtor call, so the
 * parser destructor will later pass it to php_http_encoding_stream_free.
 * Confirm that dtor followed by free is safe for these streams. */
336 php_http_encoding_stream_dtor(parser
->dechunk
);
/* Leftover decoded data goes through BODY once more; BODY is pushed on top
 * of the DONE state queued above. */
338 if (dec_str
&& dec_len
) {
342 php_http_message_parser_state_push(parser
, 1, PHP_HTTP_MESSAGE_PARSER_STATE_BODY
);
/* DONE: skip whitespace at the front of the buffer and cut it off, the same
 * trimming the START state performs. */
349 case PHP_HTTP_MESSAGE_PARSER_STATE_DONE
: {
350 char *ptr
= buffer
->data
;
352 while (ptr
- buffer
->data
< buffer
->used
&& PHP_HTTP_IS_CTYPE(space
, *ptr
)) {
356 php_http_buffer_cut(buffer
, 0, ptr
- buffer
->data
);
/* Loop finished: report whichever state is now on top of the stack. */
362 return php_http_message_parser_state_is(parser
);