ac663afa0eaf5b2bfaee6ec05b9c2a8fd4175b50
[m6w6/ext-psi] / src / context.c
1 #ifdef HAVE_CONFIG_H
2 # include "config.h"
3 #endif
4
5 #include "php.h"
6
7 #include <stdio.h>
8 #ifdef HAVE_SYS_TYPES_H
9 # include <sys/types.h>
10 #endif
11 #ifdef HAVE_SYS_STAT_H
12 # include <sys/stat.h>
13 #endif
14 #ifdef STDC_HEADERS
15 # include <stdlib.h>
16 # include <stddef.h>
17 #else
18 # ifdef HAVE_STDLIB_H
19 # include <stdlib.h>
20 # endif
21 #endif
22 #ifdef HAVE_STRING_H
23 # if !defined STDC_HEADERS && defined HAVE_MEMORY_H
24 # include <memory.h>
25 # endif
26 # include <string.h>
27 #endif
28 #ifdef HAVE_STRINGS_H
29 # include <strings.h>
30 #endif
31 #ifdef HAVE_INTTYPES_H
32 # include <inttypes.h>
33 #endif
34 #ifdef HAVE_STDINT_H
35 # include <stdint.h>
36 #endif
37 #ifdef HAVE_UNISTD_H
38 # include <unistd.h>
39 #endif
40
41 #ifdef HAVE_ERRNO_H
42 # include <errno.h>
43 #endif
44 #ifdef HAVE_GLOB_H
45 # include <glob.h>
46 #endif
47 #ifdef HAVE_NETINET_IN_H
48 # include <netinet/in.h>
49 #endif
50 #ifdef HAVE_ARPA_NAMESER_H
51 # include <arpa/nameser.h>
52 #endif
53 #ifdef HAVE_NETDB_H
54 # include <netdb.h>
55 #endif
56 #ifdef HAVE_RESOLV_H
57 # include <resolv.h>
58 #endif
59 #ifdef HAVE_SYS_SELECT_H
60 # include <sys/select.h>
61 #endif
62 #ifdef HAVE_SYS_SOCKET_H
63 # include <sys/socket.h>
64 #endif
65 #ifdef HAVE_SYS_TIME_H
66 # include <sys/time.h>
67 #endif
68 #ifdef HAVE_SYS_TIMES_H
69 # include <sys/times.h>
70 #endif
71 #ifdef HAVE_SYS_UIO_H
72 # include <sys/uio.h>
73 #endif
74 #ifdef HAVE_SYS_UTSNAME_H
75 # include <sys/utsname.h>
76 #endif
77 #ifdef HAVE_TIME_H
78 # include <time.h>
79 #endif
80 #ifdef HAVE_WCHAR_H
81 # include <wchar.h>
82 #endif
83
84 #ifdef HAVE_DIRENT_H
85 # include <dirent.h>
86 # define NAMLEN(dirent) strlen ((dirent)->d_name)
87 #else
88 # define dirent direct
89 # define NAMLEN(dirent) ((dirent)->d_namlen)
90 # ifdef HAVE_SYS_NDIR_H
91 # include <sys/ndir.h>
92 # endif
93 # ifdef HAVE_SYS_DIR_H
94 # include <sys/dir.h>
95 # endif
96 # ifdef HAVE_NDIR_H
97 # include <ndir.h>
98 # endif
99 #endif
100
101 #include <sys/param.h>
102 #include <dlfcn.h>
103 #include <fnmatch.h>
104
105 #include "php.h"
106 #include "php_scandir.h"
107 #include "php_psi.h"
108 #include "context.h"
109 #include "parser.h"
110
111 #include "libjit.h"
112 #include "libffi.h"
113
114 static struct psi_std_type {
115 token_t type_tag;
116 const char *type_name;
117 } psi_std_types[] = {
118 {PSI_T_FLOAT, "float"},
119 {PSI_T_DOUBLE, "double"},
120 {PSI_T_INT8, "int8_t"},
121 {PSI_T_INT16, "int16_t"},
122 {PSI_T_INT32, "int32_t"},
123 {PSI_T_INT64, "int64_t"},
124 {PSI_T_UINT8, "uint8_t"},
125 {PSI_T_UINT16, "uint16_t"},
126 {PSI_T_UINT32, "uint32_t"},
127 {PSI_T_UINT64, "uint64_t"},
128 {0}
129 };
130
131 static struct psi_predef_type {
132 token_t type_tag;
133 const char *type_name;
134 const char *alias;
135 } psi_predef_types[] = {
136 PSI_TYPES
137 {0}
138 };
139
140 static struct psi_predef_const {
141 token_t type_tag;
142 const char *type_name;
143 const char *var_name;
144 const char *val_text;
145 token_t val_type_tag;
146 } psi_predef_consts[] = {
147 PSI_CONSTS
148 {0}
149 };
150
151 PSI_MACROS
152
153 static struct psi_func_redir {
154 const char *name;
155 void (*func)(void);
156 } psi_func_redirs[] = {
157 PSI_REDIRS
158 {0}
159 };
160
161 static struct psi_predef_decl {
162 token_t type_tag;
163 const char *type_name;
164 const char *var_name;
165 size_t pointer_level;
166 size_t array_size;
167 } psi_predef_decls[] = {
168 PSI_DECLS
169 {0}
170 };
171
172 static struct psi_predef_struct {
173 token_t type_tag;
174 const char *type_name;
175 const char *var_name;
176 size_t offset;
177 size_t size;
178 size_t pointer_level;
179 size_t array_size;
180 } psi_predef_structs[] = {
181 PSI_STRUCTS
182 {0}
183 };
184
185 static int validate_lib(PSI_Data *data, void **dlopened) {
186 char lib[MAXPATHLEN];
187 const char *ptr = data->psi.file.ln;
188 size_t len;
189
190 if (!ptr) {
191 /* FIXME: assume stdlib */
192 return 1;
193 } else if (!strchr(ptr, '/')) {
194 len = snprintf(lib, MAXPATHLEN, "lib%s.%s", ptr, PHP_PSI_SHLIB_SUFFIX);
195 if (MAXPATHLEN == len) {
196 data->error(PSI_WARNING, "Library name too long: '%s'", ptr);
197 }
198 lib[len] = 0;
199 ptr = lib;
200 }
201 if (!(*dlopened = dlopen(ptr, RTLD_LAZY|RTLD_LOCAL))) {
202 data->error(PSI_WARNING, "Could not open library '%s': %s.",
203 data->psi.file.ln, dlerror());
204 return 0;
205 }
206 return 1;
207 }
208
209 static inline int locate_decl_type_alias(decl_typedefs *defs, decl_type *type) {
210 size_t i;
211 struct psi_std_type *stdtyp;
212
213 if (type->real) {
214 return 1;
215 }
216 for (i = 0; i < defs->count; ++i) {
217 decl_typedef *def = defs->list[i];
218
219 if (def->type->type != type->type && !strcmp(def->alias, type->name)) {
220 type->real = def->type;
221 return 1;
222 }
223 }
224 for (stdtyp = &psi_std_types[0]; stdtyp->type_tag; ++stdtyp) {
225 if (!strcmp(type->name, stdtyp->type_name)) {
226 type->type = stdtyp->type_tag;
227 return 1;
228 }
229 }
230
231 return 0;
232 }
233 static inline int locate_decl_type_struct(decl_structs *structs, decl_type *type) {
234 size_t i;
235
236 if (type->strct) {
237 return 1;
238 }
239 for (i = 0; i < structs->count; ++i) {
240 if (!strcmp(structs->list[i]->name, type->name)) {
241 type->strct = structs->list[i];
242 return 1;
243 }
244 }
245 return 0;
246 }
247
248 static inline int validate_decl_type(PSI_Data *data, decl_type *type) {
249 switch (type->type) {
250 case PSI_T_NAME:
251 if (!data->defs || !locate_decl_type_alias(data->defs, type)) {
252 return 0;
253 }
254 if (type->real) {
255 return validate_decl_type(data, type->real);
256 }
257 return 1;
258 case PSI_T_STRUCT:
259 if (!data->structs || !locate_decl_type_struct(data->structs, type)) {
260 return 0;
261 }
262 break;
263 }
264 return 1;
265 }
266 static inline int validate_decl_typedef(PSI_Data *data, decl_typedef *def) {
267 if (!validate_decl_type(data, def->type)) {
268 data->error(PSI_WARNING, "Type '%s' cannot be aliased to %s'%s'",
269 def->type->name, def->type->type == PSI_T_STRUCT?"struct ":"",def->alias);
270 return 0;
271 }
272 /* FIXME: check def->alias */
273 return 1;
274 }
275
276 static inline int validate_constant(PSI_Data *data, constant *c) {
277 /* FIXME */
278 return 1;
279 }
280
281 static inline int validate_decl_arg(PSI_Data *data, decl_arg *arg) {
282 if (!validate_decl_type(data, arg->type)) {
283 data->error(PSI_WARNING, "Cannot use '%s'(%d) as type for '%s'",
284 arg->type->name, arg->type->type, arg->var->name);
285 return 0;
286 }
287 return 1;
288 }
289
290 static inline int validate_decl_struct(PSI_Data *data, decl_struct *s) {
291 size_t i;
292
293 for (i = 0; i < s->args->count; ++i) {
294 if (!validate_decl_arg(data, s->args->args[i])) {
295 return 0;
296 }
297 }
298
299 for (i = 0; i < s->args->count; ++i) {
300 decl_arg *darg = s->args->args[i];
301
302 if (!validate_decl_arg(data, darg)) {
303 return 0;
304 }
305
306 ZEND_ASSERT(!darg->var->arg || darg->var->arg == darg);
307 darg->var->arg = darg;
308
309 if (!darg->layout) {
310 token_t t;
311
312 if (darg->var->pointer_level && (!darg->var->array_size || darg->var->pointer_level == 1)) {
313 t = PSI_T_POINTER;
314 } else {
315 t = real_decl_type(darg->type)->type;
316 }
317
318 if (i) {
319 decl_arg *last = s->args->args[i-1];
320 darg->layout = init_decl_struct_layout(
321 psi_t_align(t, last->layout->pos + last->layout->len),
322 psi_t_size(t) * darg->var->array_size);
323 } else {
324 darg->layout = init_decl_struct_layout(0, psi_t_size(t));
325 }
326 }
327 if (s->size < darg->layout->pos + darg->layout->len) {
328 s->size = darg->layout->pos + darg->layout->len;
329 }
330 }
331 return 1;
332 }
333
334 static const char * const abi_ccs[] = {
335 "default", /* \ */
336 "extern", /* > - all the same */
337 "cdecl", /* / */
338 "stdcall",
339 "fastcall",
340 };
341 static inline int validate_decl_abi(PSI_Data *data, decl_abi *abi) {
342 size_t i;
343
344 for (i = 0; i < sizeof(abi_ccs)/sizeof(char*); ++i) {
345 if (strcasecmp(abi->convention, abi_ccs[i])) {
346 return 1;
347 }
348 }
349 data->error(PSI_WARNING, "Invalid calling convention: '%s'", abi->convention);
350 return 0;
351 }
352 static inline int validate_decl_func(PSI_Data *data, void *dl, decl *decl, decl_arg *func)
353 {
354 struct psi_func_redir *redir;
355
356 if (!strcmp(func->var->name, "dlsym")) {
357 data->error(PSI_WARNING, "Cannot dlsym dlsym (sic!)");
358 return 0;
359 }
360
361 if (!validate_decl_arg(data, func)) {
362 return 0;
363 }
364 for (redir = &psi_func_redirs[0]; redir->name; ++redir) {
365 if (!strcmp(func->var->name, redir->name)) {
366 decl->call.sym = redir->func;
367 }
368 }
369 if (!decl->call.sym) {
370 #ifndef RTLD_NEXT
371 # define RTLD_NEXT ((void *) -1l)
372 #endif
373 decl->call.sym = dlsym(dl ?: RTLD_NEXT, func->var->name);
374 if (!decl->call.sym) {
375 data->error(PSI_WARNING, "Failed to locate symbol '%s': %s",
376 func->var->name, dlerror());
377 }
378 }
379 return 1;
380 }
381
382 static inline int validate_decl(PSI_Data *data, void *dl, decl *decl) {
383 if (!validate_decl_abi(data, decl->abi)) {
384 return 0;
385 }
386 if (!validate_decl_func(data, dl, decl, decl->func)) {
387 return 0;
388 }
389 if (decl->args) {
390 size_t i;
391
392 for (i = 0; i < decl->args->count; ++i) {
393 if (!validate_decl_arg(data, decl->args->args[i])) {
394 return 0;
395 }
396 }
397 }
398 return 1;
399 }
400 static inline decl_arg *locate_decl_var_arg(decl_var *var, decl_args *args, decl_arg *func) {
401 size_t i;
402
403 for (i = 0; i < args->count; ++i) {
404 decl_arg *arg = args->args[i];
405
406 if (!strcmp(var->name, arg->var->name)) {
407 ZEND_ASSERT(!var->arg || var->arg == arg);
408 return var->arg = arg;
409 }
410 }
411 if (func && !strcmp(var->name, func->var->name)) {
412 return var->arg = func;
413 }
414
415 return NULL;
416 }
417 static inline decl_arg *locate_struct_member(decl_struct *s, decl_var *var) {
418 if (s->args) {
419 return locate_decl_var_arg(var, s->args, NULL);
420 }
421
422 return NULL;
423 }
424 static inline constant *locate_num_exp_constant(num_exp *exp, constants *consts) {
425 size_t i;
426
427 for (i = 0; i < consts->count; ++i) {
428 constant *cnst = consts->list[i];
429
430 if (!strcmp(cnst->name, exp->u.numb)) {
431 free(exp->u.numb);
432 return exp->u.cnst = cnst;
433 }
434 }
435
436 return NULL;
437 }
438 static inline int validate_num_exp(PSI_Data *data, decl_args *dargs, decl_arg *func, num_exp *exp) {
439 if (exp->operand) {
440 switch (exp->operator) {
441 case PSI_T_PLUS:
442 exp->calculator = psi_calc_add;
443 break;
444 case PSI_T_MINUS:
445 exp->calculator = psi_calc_sub;
446 break;
447 case PSI_T_ASTERISK:
448 exp->calculator = psi_calc_mul;
449 break;
450 case PSI_T_SLASH:
451 exp->calculator = psi_calc_div;
452 break;
453 EMPTY_SWITCH_DEFAULT_CASE();
454 }
455 if (!validate_num_exp(data, dargs, func, exp->operand)) {
456 return 0;
457 }
458 }
459 switch (exp->t) {
460 case PSI_T_NAME:
461 if (!locate_decl_var_arg(exp->u.dvar, dargs, func)) {
462 data->error(PSI_WARNING, "Unknown variable '%s' in numeric expression",
463 exp->u.dvar->name);
464 return 0;
465 }
466 return 1;
467 case PSI_T_NSNAME:
468 if (!locate_num_exp_constant(exp, data->consts)) {
469 data->error(PSI_WARNING, "Unknown constant '%s' in numeric expression",
470 exp->u.numb);
471 return 0;
472 }
473 return 1;
474 case PSI_T_NUMBER:
475 return 1;
476 default:
477 return 0;
478 }
479 }
480 static inline int validate_set_value(PSI_Data *data, set_value *set, decl_arg *ref, decl_args *ref_list) {
481 size_t i;
482 decl_type *ref_type = real_decl_type(ref->type);
483 decl_var *set_var = set->vars->vars[0];
484
485 switch (set->func->type) {
486 case PSI_T_TO_BOOL:
487 set->func->handler = psi_to_bool;
488 break;
489 case PSI_T_TO_INT:
490 set->func->handler = psi_to_int;
491 break;
492 case PSI_T_TO_FLOAT:
493 set->func->handler = psi_to_double;
494 break;
495 case PSI_T_TO_STRING:
496 set->func->handler = psi_to_string;
497 break;
498 case PSI_T_TO_ARRAY:
499 set->func->handler = psi_to_array;
500 break;
501 case PSI_T_TO_OBJECT:
502 set->func->handler = psi_to_object;
503 break;
504 case PSI_T_VOID:
505 set->func->handler = psi_to_void;
506 break;
507 EMPTY_SWITCH_DEFAULT_CASE();
508 }
509
510 for (i = 1; i < set->vars->count; ++i) {
511 if (!locate_decl_var_arg(set->vars->vars[i], ref_list, ref)) {
512 return 0;
513 }
514 }
515 set_var->arg = ref;
516
517 if (set->count) {
518 int is_to_array = (set->func->type == PSI_T_TO_ARRAY);
519 int is_pointer_to_struct = (ref_type->type == PSI_T_STRUCT && ref->var->pointer_level);
520
521 if (!is_to_array && !is_pointer_to_struct) {
522 data->error(E_WARNING, "Inner `set` statement casts only work with "
523 "to_array() casts on structs or pointers: %s(%s...", set->func->name, set->vars->vars[0]->name);
524 return 0;
525 }
526 }
527 if (set->num) {
528 if (!validate_num_exp(data, ref_list, ref, set->num)) {
529 return 0;
530 }
531 }
532
533 if (ref_type->type == PSI_T_STRUCT) {
534 /* to_array(struct, to_...) */
535 for (i = 0; i < set->count; ++i) {
536 decl_var *sub_var = set->inner[i]->vars->vars[0];
537 decl_arg *sub_ref = locate_struct_member(ref_type->strct, sub_var);
538
539 set->inner[i]->outer.set = set;
540 if (sub_ref) {
541 if (!validate_set_value(data, set->inner[i], sub_ref, ref_type->strct->args)) {
542 return 0;
543 }
544 }
545 }
546 } else if (set->count == 1) {
547 /* to_array(ptr, to_string(*ptr)) */
548 decl_var *sub_var = set->inner[0]->vars->vars[0];
549 decl_arg *sub_ref = locate_decl_var_arg(sub_var, ref_list, ref);
550
551 set->inner[0]->outer.set = set;
552 if (sub_ref) {
553 if (strcmp(sub_var->name, set_var->name)) {
554 data->error(E_WARNING, "Inner `set` statement casts on pointers must reference the same variable");
555 return 0;
556 }
557 if (!validate_set_value(data, set->inner[0], sub_ref, ref_list)) {
558 return 0;
559 }
560 }
561 } else if (set->count > 1) {
562 data->error(E_WARNING, "Inner `set` statement casts on pointers may only occur once");
563 return 0;
564 }
565
566 return 1;
567 }
568 static inline decl *locate_impl_decl(decls *decls, return_stmt *ret) {
569 if (decls) {
570 size_t i;
571
572 for (i = 0; i < decls->count; ++i) {
573 if (!strcmp(decls->list[i]->func->var->name, ret->set->vars->vars[0]->name)) {
574 ret->decl = decls->list[i]->func;
575 return decls->list[i];
576 }
577 }
578 }
579
580 return NULL;
581 }
582 static inline int validate_impl_ret_stmt(PSI_Data *data, impl *impl) {
583 return_stmt *ret;
584
585 /* we must have exactly one ret stmt delcaring the native func to call */
586 /* and which type cast to apply */
587 if (impl->stmts->ret.count != 1) {
588 if (impl->stmts->ret.count > 1) {
589 data->error(PSI_WARNING, "Too many `return` statements for implmentation %s;"
590 " found %zu, exactly one is needed",
591 impl->func->name, impl->stmts->ret.count);
592 } else {
593 data->error(PSI_WARNING, "Missing `return` statement for implementation %s",
594 impl->func->name);
595 }
596 return 0;
597 }
598
599 ret = impl->stmts->ret.list[0];
600
601 if (!(impl->decl = locate_impl_decl(data->decls, ret))) {
602 data->error(PSI_WARNING, "Missing declaration for implementation %s",
603 impl->func->name);
604 return 0;
605 }
606
607 if (!validate_set_value(data, ret->set, ret->decl, impl->decl->args)) {
608 return 0;
609 }
610
611 impl->decl->impl = impl;
612
613 return 1;
614 }
615
616 static inline int validate_impl_let_stmts(PSI_Data *data, impl *impl) {
617 size_t i, j;
618 /* we can have multiple let stmts */
619 /* check that we have a let stmt for every decl arg */
620 if (impl->decl->args) for (i = 0; i < impl->decl->args->count; ++i) {
621 decl_arg *darg = impl->decl->args->args[i];
622 int check = 0;
623
624 for (j = 0; j < impl->stmts->let.count; ++j) {
625 let_stmt *let = impl->stmts->let.list[j];
626
627 if (!strcmp(let->var->name, darg->var->name)) {
628 darg->let = let;
629 check = 1;
630 break;
631 }
632 }
633 if (!check) {
634 data->error(PSI_WARNING, "Missing `let` statement for arg '%s %.*s%s'"
635 " of declaration '%s' for implementation '%s'",
636 darg->type->name, (int) darg->var->pointer_level, "*****",
637 darg->var->name, impl->decl->func->var->name, impl->func->name);
638 return 0;
639 }
640 }
641 /* check that the let_value references a known variable or NULL */
642 for (i = 0; i < impl->stmts->let.count; ++i) {
643 let_stmt *let = impl->stmts->let.list[i];
644 int check = 0;
645
646 if (let->val && let->val->func && let->val->func->alloc) {
647 if (!validate_num_exp(data, impl->decl->args, impl->decl->func, let->val->func->alloc->nmemb)) {
648 return 0;
649 }
650 if (!validate_num_exp(data, impl->decl->args, impl->decl->func, let->val->func->alloc->size)) {
651 return 0;
652 }
653 }
654 if (let->val && let->val->var) {
655 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
656 impl_arg *iarg = impl->func->args->args[j];
657
658 if (!strcmp(let->val->var->name, iarg->var->name)) {
659 let->arg = iarg;
660 check = 1;
661 break;
662 }
663 }
664 if (!check) {
665 data->error(PSI_WARNING, "Unknown value '$%s' of `let` statement"
666 " for variable '%s' of implementation '%s'",
667 let->val->var->name, let->var->name, impl->func->name);
668 return 0;
669 }
670 }
671 }
672 return 1;
673 }
674 static inline int validate_impl_set_stmts(PSI_Data *data, impl *impl) {
675 size_t i, j, k;
676 /* we can have any count of set stmts; processing out vars */
677 /* check that set stmts reference known variables */
678 for (i = 0; i < impl->stmts->set.count; ++i) {
679 set_stmt *set = impl->stmts->set.list[i];
680 int check = 0;
681
682 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
683 impl_arg *iarg = impl->func->args->args[j];
684
685 if (!strcmp(set->var->name, iarg->var->name)) {
686 set->arg = iarg;
687 check = 1;
688 break;
689 }
690 }
691 if (!check) {
692 data->error(PSI_WARNING, "Unknown variable '$%s' of `set` statement"
693 " of implementation '%s'",
694 set->var->name, impl->func->name);
695 return 0;
696 }
697
698 for (j = 0; j < set->val->vars->count; ++j) {
699 decl_var *set_var = set->val->vars->vars[j];
700
701 check = 0;
702 if (impl->decl->args) for (k = 0; k < impl->decl->args->count; ++k) {
703 decl_arg *set_arg = impl->decl->args->args[k];
704
705 if (!strcmp(set_var->name, set_arg->var->name)) {
706 check = 1;
707 set_var->arg = set_arg;
708 if (!validate_set_value(data, set->val, set_arg, impl->decl->args)) {
709 return 0;
710 }
711 break;
712 }
713 }
714
715 if (!check) {
716 data->error(PSI_WARNING, "Unknown value '%s' of `set` statement"
717 " for variable '$%s' of implementation '%s'",
718 set_var->name, set->arg->var->name, impl->func->name);
719 return 0;
720 }
721 }
722 }
723 return 1;
724 }
725 static inline decl *locate_free_decl(decls *decls, free_call *f) {
726 if (decls) {
727 size_t i;
728
729 for (i = 0; i < decls->count; ++i) {
730 if (!strcmp(decls->list[i]->func->var->name, f->func)) {
731 f->decl = decls->list[i];
732 return decls->list[i];
733 }
734 }
735 }
736
737 return NULL;
738 }
739 static inline int validate_impl_free_stmts(PSI_Data *data, impl *impl) {
740 size_t i, j, k, l;
741 /* we can have any count of free stmts; freeing any out vars */
742 for (i = 0; i < impl->stmts->fre.count; ++i) {
743 free_stmt *fre = impl->stmts->fre.list[i];
744
745 for (j = 0; j < fre->calls->count; ++j) {
746 free_call *free_call = fre->calls->list[j];
747
748 /* first find the decl of the free func */
749 if (!locate_free_decl(data->decls, free_call)) {
750 data->error(PSI_WARNING, "Unknown function '%s' in `free` statement"
751 " of implementation '%s'", free_call->func, impl->func->name);
752 return 0;
753 }
754 if (!impl->decl->args) {
755 data->error(PSI_WARNING, "Declaration '%s' of implementation '%s'"
756 " does not have any arguments to free",
757 impl->decl->func->var->name, impl->func->name);
758 }
759
760 /* now check for known vars */
761 for (l = 0; l < free_call->vars->count; ++l) {
762 int check = 0;
763 decl_var *free_var = free_call->vars->vars[l];
764
765 for (k = 0; k < impl->decl->args->count; ++k) {
766 decl_arg *free_arg = impl->decl->args->args[k];
767
768 if (!strcmp(free_var->name, free_arg->var->name)) {
769 check = 1;
770 free_var->arg = free_arg;
771 break;
772 }
773 }
774
775 if (!check) {
776 data->error(PSI_WARNING, "Unknown variable '%s' of `free` statement"
777 " of implementation '%s'",
778 free_var->name, impl->func->name);
779 return 0;
780 }
781 }
782 }
783 }
784 return 1;
785 }
786 static inline int validate_impl_stmts(PSI_Data *data, impl *impl) {
787 if (!impl->stmts) {
788 data->error(PSI_WARNING, "Missing body for implementation %s!",
789 impl->func->name);
790 return 0;
791 }
792
793 if (!validate_impl_ret_stmt(data, impl)) {
794 return 0;
795 }
796
797 if (!validate_impl_let_stmts(data, impl)) {
798 return 0;
799 }
800 if (!validate_impl_set_stmts(data, impl)) {
801 return 0;
802 }
803 if (!validate_impl_free_stmts(data, impl)) {
804 return 0;
805 }
806
807 return 1;
808 }
809
810 PSI_Context *PSI_ContextInit(PSI_Context *C, PSI_ContextOps *ops, PSI_ContextErrorFunc error)
811 {
812 size_t i;
813 PSI_Data T;
814 struct psi_predef_type *predef_type;
815 struct psi_predef_const *predef_const;
816 struct psi_predef_struct *predef_struct;
817 struct psi_predef_decl *predef_decl;
818
819 if (!C) {
820 C = malloc(sizeof(*C));
821 }
822 memset(C, 0, sizeof(*C));
823
824 C->error = error;
825 C->ops = ops;
826
827 if (ops->init) {
828 ops->init(C);
829 }
830
831 ZEND_ASSERT(ops->call != NULL);
832 ZEND_ASSERT(ops->compile != NULL);
833
834 /* build up predefs in a temporary PSI_Data for validation */
835 memset(&T, 0, sizeof(T));
836 T.error = error;
837
838 for (predef_type = &psi_predef_types[0]; predef_type->type_tag; ++predef_type) {
839 decl_type *type = init_decl_type(predef_type->type_tag, predef_type->type_name);
840 decl_typedef *def = init_decl_typedef(predef_type->alias, type);
841
842 T.defs = add_decl_typedef(T.defs, def);
843 }
844 for (predef_const = &psi_predef_consts[0]; predef_const->type_tag; ++predef_const) {
845 impl_def_val *val = init_impl_def_val(predef_const->val_type_tag, predef_const->val_text);
846 const_type *type = init_const_type(predef_const->type_tag, predef_const->type_name);
847 constant *constant = init_constant(type, predef_const->var_name, val);
848
849 T.consts = add_constant(T.consts, constant);
850 }
851 for (predef_struct = &psi_predef_structs[0]; predef_struct->type_tag; ++predef_struct) {
852 struct psi_predef_struct *member;
853 decl_args *dargs = init_decl_args(NULL);
854 decl_struct *dstruct = init_decl_struct(predef_struct->var_name, dargs);
855
856 dstruct->size = predef_struct->size;
857 for (member = &predef_struct[1]; member->type_tag; ++member) {
858 decl_type *type;
859 decl_var *dvar;
860 decl_arg *darg;
861
862 type = init_decl_type(member->type_tag, member->type_name);
863 dvar = init_decl_var(member->var_name, member->pointer_level, member->array_size);
864 darg = init_decl_arg(type, dvar);
865 darg->layout = init_decl_struct_layout(member->offset, member->size);
866 dargs = add_decl_arg(dargs, darg);
867 }
868
869 T.structs = add_decl_struct(T.structs, dstruct);
870 predef_struct = member;
871 }
872 for (predef_decl = &psi_predef_decls[0]; predef_decl->type_tag; ++predef_decl) {
873 struct psi_predef_decl *farg;
874 decl_type *ftype = init_decl_type(predef_decl->type_tag, predef_decl->type_name);
875 decl_var *fname = init_decl_var(predef_decl->var_name, predef_decl->pointer_level, predef_decl->array_size);
876 decl_arg *func = init_decl_arg(ftype, fname);
877 decl_args *args = init_decl_args(NULL);
878 decl *decl = init_decl(init_decl_abi("default"), func, args);
879
880
881 for (farg = &predef_decl[1]; farg->type_tag; ++farg) {
882 decl_type *arg_type = init_decl_type(farg->type_tag, farg->type_name);
883 decl_var *arg_var = init_decl_var(farg->var_name, farg->pointer_level, farg->array_size);
884 decl_arg *darg = init_decl_arg(arg_type, arg_var);
885 args = add_decl_arg(args, darg);
886 }
887
888 T.decls = add_decl(T.decls, decl);
889 predef_decl = farg;
890 }
891
892 for (i = 0; i < T.defs->count; ++i) {
893 decl_typedef *def = T.defs->list[i];
894
895 if (validate_decl_typedef(&T, def)) {
896 C->defs = add_decl_typedef(C->defs, def);
897 }
898 }
899
900 for (i = 0; i < T.consts->count; ++i) {
901 constant *constant = T.consts->list[i];
902
903 if (validate_constant(&T, constant)) {
904 C->consts = add_constant(C->consts, constant);
905 }
906 }
907
908 for (i = 0; i < T.structs->count; ++i) {
909 decl_struct *dstruct = T.structs->list[i];
910
911 if (validate_decl_struct(&T, dstruct)) {
912 C->structs = add_decl_struct(C->structs, dstruct);
913 }
914 }
915
916 for (i = 0; i < T.decls->count; ++i) {
917 decl *decl = T.decls->list[i];
918
919 if (validate_decl(&T, NULL, decl)) {
920 C->decls = add_decl(C->decls, decl);
921 }
922 }
923
924 C->count = 1;
925 C->data = malloc(sizeof(*C->data));
926 PSI_DataExchange(C->data, &T);
927
928 return C;
929 }
930
931 int PSI_ContextValidate(PSI_Context *C, PSI_Parser *P)
932 {
933 PSI_Data *D;
934 void *dlopened = NULL;
935 size_t count = C->count++;
936
937 C->data = realloc(C->data, C->count * sizeof(*C->data));
938 D = PSI_DataExchange(&C->data[count], PSI_DATA(P));
939
940 if (D->defs) {
941 size_t i;
942
943 for (i = 0; i < D->defs->count; ++i) {
944 if (validate_decl_typedef(PSI_DATA(C), D->defs->list[i])) {
945 C->defs = add_decl_typedef(C->defs, D->defs->list[i]);
946 }
947 }
948 }
949 if (D->structs) {
950 size_t i;
951
952 for (i = 0; i < D->structs->count; ++i) {
953 if (validate_decl_struct(PSI_DATA(C), D->structs->list[i])) {
954 C->structs = add_decl_struct(C->structs, D->structs->list[i]);
955 }
956 }
957 }
958 if (D->consts) {
959 size_t i;
960
961 for (i = 0; i < D->consts->count; ++i) {
962 if (validate_constant(PSI_DATA(C), D->consts->list[i])) {
963 C->consts = add_constant(C->consts, D->consts->list[i]);
964 }
965 }
966 }
967
968 if (!validate_lib(D, &dlopened)) {
969 return 0;
970 }
971
972 add_decl_lib(&C->psi.libs, dlopened);
973
974 if (D->decls) {
975 size_t i;
976
977 for (i = 0; i < D->decls->count; ++i) {
978 if (validate_decl(PSI_DATA(C), dlopened, D->decls->list[i])) {
979 C->decls = add_decl(C->decls, D->decls->list[i]);
980 }
981 }
982 }
983 if (D->impls) {
984 size_t i;
985
986 for (i = 0; i < D->impls->count; ++i) {
987 if (validate_impl_stmts(PSI_DATA(C), D->impls->list[i])) {
988 C->impls = add_impl(C->impls, D->impls->list[i]);
989 }
990 }
991 }
992
993 return 1;
994 }
995
#ifndef FNM_CASEFOLD
# define FNM_CASEFOLD 0
#endif
/*
 * Directory entry filter: returns 1 for names matching "*.psi" (ignoring
 * case where FNM_CASEFOLD is available) and 0 for everything else.
 */
static int psi_select_dirent(const struct dirent *entry)
{
	int rc = fnmatch("*.psi", entry->d_name, FNM_CASEFOLD);

	return rc == 0;
}
1003
1004 void PSI_ContextBuild(PSI_Context *C, const char *paths)
1005 {
1006 int i, n, flags = psi_check_env("PSI_DEBUG") ? PSI_PARSER_DEBUG : 0;
1007 char *sep = NULL, *cpy = strdup(paths), *ptr = cpy;
1008 struct dirent **entries = NULL;
1009
1010
1011 do {
1012 sep = strchr(ptr, ':');
1013
1014 if (sep) {
1015 *sep = 0;
1016 }
1017
1018 n = php_scandir(ptr, &entries, psi_select_dirent, alphasort);
1019
1020 if (n > 0) {
1021 for (i = 0; i < n; ++i) {
1022 char psi[MAXPATHLEN];
1023 PSI_Parser P;
1024
1025 if (MAXPATHLEN <= slprintf(psi, MAXPATHLEN, "%s/%s", ptr, entries[i]->d_name)) {
1026 C->error(PSI_WARNING, "Path to PSI file too long: %s/%s",
1027 ptr, entries[i]->d_name);
1028 }
1029 if (!PSI_ParserInit(&P, psi, C->error, flags)) {
1030 C->error(PSI_WARNING, "Failed to init PSI parser (%s): %s",
1031 psi, strerror(errno));
1032 continue;
1033 }
1034
1035 while (0 < PSI_ParserScan(&P)) {
1036 PSI_ParserParse(&P, PSI_TokenAlloc(&P));
1037 if (P.num == PSI_T_EOF) {
1038 break;
1039 }
1040 }
1041
1042 PSI_ParserParse(&P, NULL);
1043 PSI_ContextValidate(C, &P);
1044 PSI_ParserDtor(&P);
1045 }
1046 }
1047
1048 if (entries) {
1049 for (i = 0; i < n; ++i) {
1050 free(entries[i]);
1051 }
1052 free(entries);
1053 }
1054
1055 ptr = sep + 1;
1056 } while (sep);
1057
1058
1059 if (PSI_ContextCompile(C) && SUCCESS != zend_register_functions(NULL, C->closures, NULL, MODULE_PERSISTENT)) {
1060 C->error(PSI_WARNING, "Failed to register functions!");
1061 }
1062
1063 free(cpy);
1064
1065 }
1066
1067 zend_function_entry *PSI_ContextCompile(PSI_Context *C)
1068 {
1069 size_t i;
1070
1071 if (C->consts) {
1072 zend_constant zc;
1073
1074 zc.flags = CONST_PERSISTENT|CONST_CS;
1075 zc.module_number = EG(current_module)->module_number;
1076
1077 for (i = 0; i < C->consts->count; ++i) {
1078 constant *c = C->consts->list[i];
1079
1080 zc.name = zend_string_init(c->name + (c->name[0] == '\\'), strlen(c->name) - (c->name[0] == '\\'), 1);
1081 ZVAL_NEW_STR(&zc.value, zend_string_init(c->val->text, strlen(c->val->text), 1));
1082
1083 switch (c->type->type) {
1084 case PSI_T_BOOL:
1085 convert_to_boolean(&zc.value);
1086 break;
1087 case PSI_T_INT:
1088 convert_to_long(&zc.value);
1089 break;
1090 case PSI_T_FLOAT:
1091 convert_to_double(&zc.value);
1092 break;
1093 }
1094 zend_register_constant(&zc);
1095 }
1096 }
1097
1098 return C->closures = C->ops->compile(C);
1099 }
1100
1101
1102 void PSI_ContextCall(PSI_Context *C, impl_val *ret_val, decl *decl)
1103 {
1104 errno = 0;
1105 C->ops->call(C, ret_val, decl);
1106 }
1107
1108 static inline void dump_decl_type(int fd, decl_type *t) {
1109 const char *pre;
1110
1111 switch (t->type) {
1112 case PSI_T_STRUCT:
1113 pre = "struct ";
1114 break;
1115 default:
1116 pre = "";
1117 }
1118 dprintf(fd, "%s%s", pre, t->name);
1119 }
1120 static inline void dump_decl_var(int fd, decl_var *v) {
1121 dprintf(fd, "%.*s%s", v->pointer_level-!!v->array_size, "**********", v->name);
1122 if (v->array_size) {
1123 dprintf(fd, "[%u]", v->array_size);
1124 }
1125 }
1126 static inline void dump_decl_arg(int fd, decl_arg *a) {
1127 dump_decl_type(fd, a->type);
1128 dprintf(fd, " ");
1129 dump_decl_var(fd, a->var);
1130 }
/* Write `level` tabs of indentation to fd; at most nine tabs are written. */
static inline void dump_level(int fd, unsigned level) {
	/* the precision argument of "%.*s" has to be an int */
	dprintf(fd, "%.*s", (int) level, "\t\t\t\t\t\t\t\t\t");
}
1134 static inline void dump_impl_set_value(int fd, set_value *set, unsigned level) {
1135 size_t i;
1136
1137 if (level > 1) {
1138 /* only if not directly after `set ...` */
1139 dump_level(fd, level);
1140 }
1141 dprintf(fd, "%s(", set->func->name);
1142
1143 for (i = 0; i < set->vars->count; ++i) {
1144 decl_var *svar = set->vars->vars[i];
1145 if (i) {
1146 dprintf(fd, ", ");
1147 }
1148 dump_decl_var(fd, svar);
1149 }
1150 if (set->inner) {
1151 dprintf(fd, ",\n");
1152 for (i = 0; i < set->count; ++i) {
1153 dump_impl_set_value(fd, set->inner[i], level+1);
1154 }
1155 /* only if inner stmts, i.e. with new lines, were dumped */
1156 dump_level(fd, level);
1157 }
1158 if (level > 1) {
1159 dprintf(fd, "),\n");
1160 } else {
1161 dprintf(fd, ");\n");
1162 }
1163 }
1164 static inline void dump_num_exp(int fd, num_exp *exp) {
1165 switch (exp->t) {
1166 case PSI_T_NUMBER:
1167 dprintf(fd, "%s", exp->u.numb);
1168 break;
1169 case PSI_T_NAME:
1170 dump_decl_var(fd, exp->u.dvar);
1171 break;
1172 case PSI_T_NSNAME:
1173 dprintf(fd, "%s", exp->u.cnst->name);
1174 break;
1175 EMPTY_SWITCH_DEFAULT_CASE();
1176 }
1177 }
1178 void PSI_ContextDump(PSI_Context *C, int fd)
1179 {
1180 size_t i, j, k, l;
1181
1182 #ifdef HAVE_LIBJIT
1183 if (C->ops == PSI_Libjit()) {
1184 dprintf(fd, "// psi.engine=jit\n");
1185 }
1186 #endif
1187 #ifdef HAVE_LIBFFI
1188 if (C->ops == PSI_Libffi()) {
1189 dprintf(fd, "// psi.engine=ffi\n");
1190 }
1191 #endif
1192 dprintf(fd, "\n");
1193
1194 if (C->defs) {
1195 for (i = 0; i < C->defs->count; ++i) {
1196 decl_typedef *tdef = C->defs->list[i];
1197
1198 dprintf(fd, "typedef ");
1199 dump_decl_type(fd, tdef->type);
1200 dprintf(fd, " %s;\n", tdef->alias);
1201 }
1202 dprintf(fd, "\n");
1203 }
1204
1205 if (C->structs) {
1206 for (i = 0; i < C->structs->count; ++i) {
1207 decl_struct *strct = C->structs->list[i];
1208
1209 dprintf(fd, "struct %s::(%zu) {\n", strct->name, strct->size);
1210 if (strct->args) for (j = 0; j < strct->args->count; ++j) {
1211 decl_arg *sarg = strct->args->args[j];
1212
1213 dprintf(fd, "\t");
1214 dump_decl_arg(fd, sarg);
1215 dprintf(fd, "::(%zu, %zu);\n", sarg->layout->pos, sarg->layout->len);
1216 }
1217 dprintf(fd, "}\n");
1218 }
1219 dprintf(fd, "\n");
1220 }
1221 if (C->consts) {
1222 for (i = 0; i < C->consts->count; ++i) {
1223 constant *cnst = C->consts->list[i];
1224
1225 dprintf(fd, "const %s %s = ", cnst->type->name, cnst->name);
1226 if (cnst->val->type == PSI_T_QUOTED_STRING) {
1227 dprintf(fd, "\"%s\";\n", cnst->val->text);
1228 } else {
1229 dprintf(fd, "%s;\n", cnst->val->text);
1230 }
1231 }
1232 dprintf(fd, "\n");
1233 }
1234 if (C->decls) {
1235 for (i = 0; i < C->decls->count; ++i) {
1236 decl *decl = C->decls->list[i];
1237
1238 dprintf(fd, "%s ", decl->abi->convention);
1239 dump_decl_arg(fd, decl->func);
1240 dprintf(fd, "(");
1241 if (decl->args) for (j = 0; j < decl->args->count; ++j) {
1242 if (j) {
1243 dprintf(fd, ", ");
1244 }
1245 dump_decl_arg(fd, decl->args->args[j]);
1246 }
1247 dprintf(fd, ");\n");
1248 }
1249 dprintf(fd, "\n");
1250 }
1251 if (C->impls) {
1252 for (i = 0; i < C->impls->count; ++i) {
1253 impl *impl = C->impls->list[i];
1254
1255 dprintf(fd, "function %s(", impl->func->name);
1256 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
1257 impl_arg *iarg = impl->func->args->args[j];
1258
1259 dprintf(fd, "%s%s %s$%s",
1260 j ? ", " : "",
1261 iarg->type->name,
1262 iarg->var->reference ? "&" : "",
1263 iarg->var->name);
1264 if (iarg->def) {
1265 dprintf(fd, " = %s", iarg->def->text);
1266 }
1267 }
1268 dprintf(fd, ") : %s%s {\n",
1269 impl->func->return_reference ? "&":"",
1270 impl->func->return_type->name);
1271 if (impl->stmts) {
1272 for (j = 0; j < impl->stmts->let.count; ++j) {
1273 let_stmt *let = impl->stmts->let.list[j];
1274
1275 dprintf(fd, "\tlet %s", let->var->name);
1276 if (let->val) {
1277 dprintf(fd, " = %s", let->val->is_reference ? "&" : "");
1278 if (let->val->func) {
1279 dprintf(fd, "%s(", let->val->func->name);
1280 if (let->val->func->alloc) {
1281 dump_num_exp(fd, let->val->func->alloc->nmemb);
1282 dprintf(fd, ", ");
1283 dump_num_exp(fd, let->val->func->alloc->size);
1284 } else {
1285 dprintf(fd, "$%s", let->val->var->name);
1286 }
1287 dprintf(fd, ");\n");
1288 } else {
1289 dprintf(fd, "NULL;\n");
1290 }
1291 }
1292 }
1293 for (j = 0; j < impl->stmts->ret.count; ++j) {
1294 return_stmt *ret = impl->stmts->ret.list[j];
1295
1296 dprintf(fd, "\treturn ");
1297 dump_impl_set_value(fd, ret->set, 1);
1298 }
1299 for (j = 0; j < impl->stmts->set.count; ++j) {
1300 set_stmt *set = impl->stmts->set.list[j];
1301
1302 dprintf(fd, "\tset $%s = ", set->var->name);
1303 dump_impl_set_value(fd, set->val, 1);
1304 }
1305 for (j = 0; j < impl->stmts->fre.count; ++j) {
1306 free_stmt *fre = impl->stmts->fre.list[j];
1307
1308 dprintf(fd, "\tfree ");
1309 for (k = 0; k < fre->calls->count; ++k) {
1310 free_call *call = fre->calls->list[k];
1311
1312 if (k) {
1313 dprintf(fd, ", ");
1314 }
1315 dprintf(fd, "%s(", call->func);
1316 for (l = 0; l < call->vars->count; ++l) {
1317 decl_var *fvar = call->vars->vars[l];
1318
1319 dump_decl_var(fd, fvar);
1320 }
1321 dprintf(fd, ");\n");
1322 }
1323 }
1324 }
1325 dprintf(fd, "}\n");
1326 }
1327 dprintf(fd, "\n");
1328 }
1329 }
1330
1331 void PSI_ContextDtor(PSI_Context *C)
1332 {
1333 size_t i;
1334 zend_function_entry *zfe;
1335
1336 if (C->ops->dtor) {
1337 C->ops->dtor(C);
1338 }
1339
1340 free_decl_libs(&C->psi.libs);
1341
1342 if (C->data) {
1343 for (i = 0; i < C->count; ++i) {
1344 PSI_DataDtor(&C->data[i]);
1345 }
1346 free(C->data);
1347 }
1348
1349 if (C->closures) {
1350 for (zfe = C->closures; zfe->fname; ++zfe) {
1351 free((void *) zfe->arg_info);
1352 }
1353 free(C->closures);
1354 }
1355
1356 if (C->consts) {
1357 if (C->consts->list) {
1358 free(C->consts->list);
1359 }
1360 free(C->consts);
1361 }
1362 if (C->defs) {
1363 if (C->defs->list) {
1364 free(C->defs->list);
1365 }
1366 free(C->defs);
1367 }
1368 if (C->structs) {
1369 if (C->structs->list) {
1370 free(C->structs->list);
1371 }
1372 free(C->structs);
1373 }
1374 if (C->decls) {
1375 if (C->decls->list) {
1376 free(C->decls->list);
1377 }
1378 free(C->decls);
1379 }
1380 if (C->impls) {
1381 if (C->impls->list) {
1382 free(C->impls->list);
1383 }
1384 free(C->impls);
1385 }
1386
1387 memset(C, 0, sizeof(*C));
1388 }
1389
1390 void PSI_ContextFree(PSI_Context **C)
1391 {
1392 if (*C) {
1393 PSI_ContextDtor(*C);
1394 free(*C);
1395 *C = NULL;
1396 }
1397 }