44f82992e6e0ee1f739ea2aaa11aec137fc5f4ca
[m6w6/ext-psi] / src / context.c
1 #ifdef HAVE_CONFIG_H
2 # include "config.h"
3 #endif
4
5 #include "php.h"
6
7 #include <stdio.h>
8 #ifdef HAVE_SYS_TYPES_H
9 # include <sys/types.h>
10 #endif
11 #ifdef HAVE_SYS_STAT_H
12 # include <sys/stat.h>
13 #endif
14 #ifdef STDC_HEADERS
15 # include <stdlib.h>
16 # include <stddef.h>
17 #else
18 # ifdef HAVE_STDLIB_H
19 # include <stdlib.h>
20 # endif
21 #endif
22 #ifdef HAVE_STRING_H
23 # if !defined STDC_HEADERS && defined HAVE_MEMORY_H
24 # include <memory.h>
25 # endif
26 # include <string.h>
27 #endif
28 #ifdef HAVE_STRINGS_H
29 # include <strings.h>
30 #endif
31 #ifdef HAVE_INTTYPES_H
32 # include <inttypes.h>
33 #endif
34 #ifdef HAVE_STDINT_H
35 # include <stdint.h>
36 #endif
37 #ifdef HAVE_UNISTD_H
38 # include <unistd.h>
39 #endif
40
41 #ifdef HAVE_ERRNO_H
42 # include <errno.h>
43 #endif
44 #ifdef HAVE_GLOB_H
45 # include <glob.h>
46 #endif
47 #ifdef HAVE_NETINET_IN_H
48 # include <netinet/in.h>
49 #endif
50 #ifdef HAVE_ARPA_NAMESER_H
51 # include <arpa/nameser.h>
52 #endif
53 #ifdef HAVE_NETDB_H
54 # include <netdb.h>
55 #endif
56 #ifdef HAVE_RESOLV_H
57 # include <resolv.h>
58 #endif
59 #ifdef HAVE_SYS_SELECT_H
60 # include <sys/select.h>
61 #endif
62 #ifdef HAVE_SYS_SOCKET_H
63 # include <sys/socket.h>
64 #endif
65 #ifdef HAVE_SYS_TIME_H
66 # include <sys/time.h>
67 #endif
68 #ifdef HAVE_SYS_TIMES_H
69 # include <sys/times.h>
70 #endif
71 #ifdef HAVE_SYS_UIO_H
72 # include <sys/uio.h>
73 #endif
74 #ifdef HAVE_SYS_UTSNAME_H
75 # include <sys/utsname.h>
76 #endif
77 #ifdef HAVE_TIME_H
78 # include <time.h>
79 #endif
80 #ifdef HAVE_WCHAR_H
81 # include <wchar.h>
82 #endif
83
84 #ifdef HAVE_DIRENT_H
85 # include <dirent.h>
86 # define NAMLEN(dirent) strlen ((dirent)->d_name)
87 #else
88 # define dirent direct
89 # define NAMLEN(dirent) ((dirent)->d_namlen)
90 # ifdef HAVE_SYS_NDIR_H
91 # include <sys/ndir.h>
92 # endif
93 # ifdef HAVE_SYS_DIR_H
94 # include <sys/dir.h>
95 # endif
96 # ifdef HAVE_NDIR_H
97 # include <ndir.h>
98 # endif
99 #endif
100
101 #include <sys/param.h>
102 #include <dlfcn.h>
103 #include <fnmatch.h>
104
105 #include "php.h"
106 #include "php_scandir.h"
107 #include "php_psi.h"
108 #include "context.h"
109 #include "parser.h"
110
111 #include "libjit.h"
112 #include "libffi.h"
113
114 static struct psi_std_type {
115 token_t type_tag;
116 const char *type_name;
117 } psi_std_types[] = {
118 {PSI_T_FLOAT, "float"},
119 {PSI_T_DOUBLE, "double"},
120 {PSI_T_INT8, "int8_t"},
121 {PSI_T_INT16, "int16_t"},
122 {PSI_T_INT32, "int32_t"},
123 {PSI_T_INT64, "int64_t"},
124 {PSI_T_UINT8, "uint8_t"},
125 {PSI_T_UINT16, "uint16_t"},
126 {PSI_T_UINT32, "uint32_t"},
127 {PSI_T_UINT64, "uint64_t"},
128 {0}
129 };
130
131 static struct psi_predef_type {
132 token_t type_tag;
133 const char *type_name;
134 const char *alias;
135 } psi_predef_types[] = {
136 PSI_TYPES
137 {0}
138 };
139
140 static struct psi_predef_const {
141 token_t type_tag;
142 const char *type_name;
143 const char *var_name;
144 const char *val_text;
145 token_t val_type_tag;
146 } psi_predef_consts[] = {
147 PSI_CONSTS
148 {0}
149 };
150
151 PSI_MACROS
152
153 static struct psi_func_redir {
154 const char *name;
155 void (*func)(void);
156 } psi_func_redirs[] = {
157 PSI_REDIRS
158 {0}
159 };
160
161 static struct psi_predef_decl {
162 token_t type_tag;
163 const char *type_name;
164 const char *var_name;
165 size_t pointer_level;
166 size_t array_size;
167 } psi_predef_decls[] = {
168 PSI_DECLS
169 {0}
170 };
171
172 static struct psi_predef_struct {
173 token_t type_tag;
174 const char *type_name;
175 const char *var_name;
176 size_t offset;
177 size_t size;
178 size_t pointer_level;
179 size_t array_size;
180 } psi_predef_structs[] = {
181 PSI_STRUCTS
182 {0}
183 };
184
185 static int validate_lib(PSI_Data *data, void **dlopened) {
186 char lib[MAXPATHLEN];
187 const char *ptr = data->psi.file.ln;
188 size_t len;
189
190 if (!ptr) {
191 /* FIXME: assume stdlib */
192 return 1;
193 } else if (!strchr(ptr, '/')) {
194 len = snprintf(lib, MAXPATHLEN, "lib%s.%s", ptr, PHP_PSI_SHLIB_SUFFIX);
195 if (MAXPATHLEN == len) {
196 data->error(PSI_WARNING, "Library name too long: '%s'", ptr);
197 }
198 lib[len] = 0;
199 ptr = lib;
200 }
201 if (!(*dlopened = dlopen(ptr, RTLD_LAZY|RTLD_LOCAL))) {
202 data->error(PSI_WARNING, "Could not open library '%s': %s.",
203 data->psi.file.ln, dlerror());
204 return 0;
205 }
206 return 1;
207 }
208
209 static inline int locate_decl_type_alias(decl_typedefs *defs, decl_type *type) {
210 size_t i;
211 struct psi_std_type *stdtyp;
212
213 if (type->real) {
214 return 1;
215 }
216 for (i = 0; i < defs->count; ++i) {
217 decl_typedef *def = defs->list[i];
218
219 if (def->type->type != type->type && !strcmp(def->alias, type->name)) {
220 type->real = def->type;
221 return 1;
222 }
223 }
224 for (stdtyp = &psi_std_types[0]; stdtyp->type_tag; ++stdtyp) {
225 if (!strcmp(type->name, stdtyp->type_name)) {
226 type->type = stdtyp->type_tag;
227 return 1;
228 }
229 }
230
231 return 0;
232 }
233 static inline int locate_decl_type_struct(decl_structs *structs, decl_type *type) {
234 size_t i;
235
236 if (type->strct) {
237 return 1;
238 }
239 for (i = 0; i < structs->count; ++i) {
240 if (!strcmp(structs->list[i]->name, type->name)) {
241 type->strct = structs->list[i];
242 return 1;
243 }
244 }
245 return 0;
246 }
247
248 static inline int validate_decl_type(PSI_Data *data, decl_type *type) {
249 switch (type->type) {
250 case PSI_T_NAME:
251 if (!data->defs || !locate_decl_type_alias(data->defs, type)) {
252 return 0;
253 }
254 if (type->real) {
255 return validate_decl_type(data, type->real);
256 }
257 return 1;
258 case PSI_T_STRUCT:
259 if (!data->structs || !locate_decl_type_struct(data->structs, type)) {
260 return 0;
261 }
262 break;
263 }
264 return 1;
265 }
266 static inline int validate_decl_typedef(PSI_Data *data, decl_typedef *def) {
267 if (!validate_decl_type(data, def->type)) {
268 data->error(PSI_WARNING, "Type '%s' cannot be aliased to %s'%s'",
269 def->type->name, def->type->type == PSI_T_STRUCT?"struct ":"",def->alias);
270 return 0;
271 }
272 /* FIXME: check def->alias */
273 return 1;
274 }
275
276 static inline int validate_constant(PSI_Data *data, constant *c) {
277 /* FIXME */
278 return 1;
279 }
280
281 static inline int validate_decl_arg(PSI_Data *data, decl_arg *arg) {
282 if (!validate_decl_type(data, arg->type)) {
283 data->error(PSI_WARNING, "Cannot use '%s'(%d) as type for '%s'",
284 arg->type->name, arg->type->type, arg->var->name);
285 return 0;
286 }
287 return 1;
288 }
289
290 static inline int validate_decl_struct(PSI_Data *data, decl_struct *s) {
291 size_t i;
292
293 for (i = 0; i < s->args->count; ++i) {
294 if (!validate_decl_arg(data, s->args->args[i])) {
295 return 0;
296 }
297 }
298
299 for (i = 0; i < s->args->count; ++i) {
300 decl_arg *darg = s->args->args[i];
301
302 if (!validate_decl_arg(data, darg)) {
303 return 0;
304 }
305
306 ZEND_ASSERT(!darg->var->arg || darg->var->arg == darg);
307 darg->var->arg = darg;
308
309 if (!darg->layout) {
310 token_t t;
311
312 if (darg->var->pointer_level && (!darg->var->array_size || darg->var->pointer_level == 1)) {
313 t = PSI_T_POINTER;
314 } else {
315 t = real_decl_type(darg->type)->type;
316 }
317
318 if (i) {
319 decl_arg *last = s->args->args[i-1];
320 darg->layout = init_decl_struct_layout(
321 psi_t_align(t, last->layout->pos + last->layout->len),
322 psi_t_size(t) * darg->var->array_size);
323 } else {
324 darg->layout = init_decl_struct_layout(0, psi_t_size(t));
325 }
326 }
327 if (s->size < darg->layout->pos + darg->layout->len) {
328 s->size = darg->layout->pos + darg->layout->len;
329 }
330 }
331 return 1;
332 }
333
334 static const char * const abi_ccs[] = {
335 "default", /* \ */
336 "extern", /* > - all the same */
337 "cdecl", /* / */
338 "stdcall",
339 "fastcall",
340 };
341 static inline int validate_decl_abi(PSI_Data *data, decl_abi *abi) {
342 size_t i;
343
344 for (i = 0; i < sizeof(abi_ccs)/sizeof(char*); ++i) {
345 if (strcasecmp(abi->convention, abi_ccs[i])) {
346 return 1;
347 }
348 }
349 data->error(PSI_WARNING, "Invalid calling convention: '%s'", abi->convention);
350 return 0;
351 }
352 static inline int validate_decl_func(PSI_Data *data, void *dl, decl *decl, decl_arg *func)
353 {
354 struct psi_func_redir *redir;
355
356 if (!strcmp(func->var->name, "dlsym")) {
357 data->error(PSI_WARNING, "Cannot dlsym dlsym (sic!)");
358 return 0;
359 }
360
361 if (!validate_decl_arg(data, func)) {
362 return 0;
363 }
364 for (redir = &psi_func_redirs[0]; redir->name; ++redir) {
365 if (!strcmp(func->var->name, redir->name)) {
366 decl->call.sym = redir->func;
367 }
368 }
369 if (!decl->call.sym) {
370 #ifndef RTLD_NEXT
371 # define RTLD_NEXT ((void *) -1l)
372 #endif
373 decl->call.sym = dlsym(dl ?: RTLD_NEXT, func->var->name);
374 if (!decl->call.sym) {
375 data->error(PSI_WARNING, "Failed to locate symbol '%s': %s",
376 func->var->name, dlerror());
377 }
378 }
379 return 1;
380 }
381
382 static inline int validate_decl(PSI_Data *data, void *dl, decl *decl) {
383 if (!validate_decl_abi(data, decl->abi)) {
384 return 0;
385 }
386 if (!validate_decl_func(data, dl, decl, decl->func)) {
387 return 0;
388 }
389 if (decl->args) {
390 size_t i;
391
392 for (i = 0; i < decl->args->count; ++i) {
393 if (!validate_decl_arg(data, decl->args->args[i])) {
394 return 0;
395 }
396 }
397 }
398 return 1;
399 }
400 static inline decl_arg *locate_decl_var_arg(decl_var *var, decl_args *args) {
401 size_t i;
402
403 for (i = 0; i < args->count; ++i) {
404 decl_arg *arg = args->args[i];
405
406 if (!strcmp(var->name, arg->var->name)) {
407 ZEND_ASSERT(!var->arg || var->arg == arg);
408 return var->arg = arg;
409 }
410 }
411
412 return NULL;
413 }
414 static inline decl_arg *locate_struct_member(decl_struct *s, decl_var *var) {
415 if (s->args) {
416 return locate_decl_var_arg(var, s->args);
417 }
418
419 return NULL;
420 }
421 static inline int validate_set_value(PSI_Data *data, set_value *set, decl_arg *ref, decl_args *ref_list) {
422 size_t i;
423 decl_type *ref_type = real_decl_type(ref->type);
424 decl_var *set_var = set->vars->vars[0];
425
426 switch (set->func->type) {
427 case PSI_T_TO_BOOL:
428 set->func->handler = psi_to_bool;
429 break;
430 case PSI_T_TO_INT:
431 set->func->handler = psi_to_int;
432 break;
433 case PSI_T_TO_FLOAT:
434 set->func->handler = psi_to_double;
435 break;
436 case PSI_T_TO_STRING:
437 set->func->handler = psi_to_string;
438 break;
439 case PSI_T_TO_ARRAY:
440 set->func->handler = psi_to_array;
441 break;
442 EMPTY_SWITCH_DEFAULT_CASE();
443 }
444
445 for (i = 1; i < set->vars->count; ++i) {
446 if (!locate_decl_var_arg(set->vars->vars[i], ref_list)) {
447 return 0;
448 }
449 }
450 set_var->arg = ref;
451
452 if (set->count) {
453 int is_to_array = (set->func->type == PSI_T_TO_ARRAY);
454 int is_pointer_to_struct = (ref_type->type == PSI_T_STRUCT && ref->var->pointer_level);
455 if (is_to_array && !is_pointer_to_struct) {
456 data->error(E_WARNING, "Inner `set` statement casts only work with "
457 "to_array() casts on structs or pointers: %s(%s...", set->func->name, set->vars->vars[0]->name);
458 return 0;
459 }
460 }
461
462 if (ref_type->type == PSI_T_STRUCT) {
463 /* to_array(struct, to_...) */
464 for (i = 0; i < set->count; ++i) {
465 decl_var *sub_var = set->inner[i]->vars->vars[0];
466 decl_arg *sub_ref = locate_struct_member(ref_type->strct, sub_var);
467
468 set->inner[i]->outer.set = set;
469 if (sub_ref) {
470 if (!validate_set_value(data, set->inner[i], sub_ref, ref_type->strct->args)) {
471 return 0;
472 }
473 }
474 }
475 } else if (set->count == 1) {
476 /* to_array(ptr, to_string(*ptr)) */
477 decl_var *sub_var = set->inner[0]->vars->vars[0];
478 decl_arg *sub_ref = locate_decl_var_arg(sub_var, ref_list);
479
480 set->inner[0]->outer.set = set;
481 if (sub_ref) {
482 if (strcmp(sub_var->name, set_var->name)) {
483 data->error(E_WARNING, "Inner `set` statement casts on pointers must reference the same variable");
484 return 0;
485 }
486 if (!validate_set_value(data, set->inner[0], sub_ref, ref_list)) {
487 return 0;
488 }
489 }
490 } else if (set->count > 1) {
491 data->error(E_WARNING, "Inner `set` statement casts on pointers may only occur once");
492 return 0;
493 }
494
495 return 1;
496 }
497 static inline decl *locate_impl_decl(decls *decls, return_stmt *ret) {
498 if (decls) {
499 size_t i;
500
501 for (i = 0; i < decls->count; ++i) {
502 if (!strcmp(decls->list[i]->func->var->name, ret->set->vars->vars[0]->name)) {
503 ret->decl = decls->list[i]->func;
504 return decls->list[i];
505 }
506 }
507 }
508
509 return NULL;
510 }
511 static inline int validate_impl_ret_stmt(PSI_Data *data, impl *impl) {
512 return_stmt *ret;
513
514 /* we must have exactly one ret stmt delcaring the native func to call */
515 /* and which type cast to apply */
516 if (impl->stmts->ret.count != 1) {
517 if (impl->stmts->ret.count > 1) {
518 data->error(PSI_WARNING, "Too many `return` statements for implmentation %s;"
519 " found %zu, exactly one is needed",
520 impl->func->name, impl->stmts->ret.count);
521 } else {
522 data->error(PSI_WARNING, "Missing `return` statement for implementation %s",
523 impl->func->name);
524 }
525 return 0;
526 }
527
528 ret = impl->stmts->ret.list[0];
529
530 if (!(impl->decl = locate_impl_decl(data->decls, ret))) {
531 data->error(PSI_WARNING, "Missing declaration for implementation %s",
532 impl->func->name);
533 return 0;
534 }
535
536 if (!validate_set_value(data, ret->set, ret->decl, impl->decl->args)) {
537 return 0;
538 }
539
540 impl->decl->impl = impl;
541
542 return 1;
543 }
544 static inline int validate_impl_let_stmts(PSI_Data *data, impl *impl) {
545 size_t i, j;
546 /* we can have multiple let stmts */
547 /* check that we have a let stmt for every decl arg */
548 if (impl->decl->args) for (i = 0; i < impl->decl->args->count; ++i) {
549 decl_arg *darg = impl->decl->args->args[i];
550 int check = 0;
551
552 for (j = 0; j < impl->stmts->let.count; ++j) {
553 let_stmt *let = impl->stmts->let.list[j];
554
555 if (!strcmp(let->var->name, darg->var->name)) {
556 darg->let = let;
557 check = 1;
558 break;
559 }
560 }
561 if (!check) {
562 data->error(PSI_WARNING, "Missing `let` statement for arg '%s %.*s%s'"
563 " of declaration '%s' for implementation '%s'",
564 darg->type->name, (int) darg->var->pointer_level, "*****",
565 darg->var->name, impl->decl->func->var->name, impl->func->name);
566 return 0;
567 }
568 }
569 /* check that the let_value references a known variable or NULL */
570 for (i = 0; i < impl->stmts->let.count; ++i) {
571 let_stmt *let = impl->stmts->let.list[i];
572 int check = 0;
573
574 if (let->val && let->val->func && let->val->func->alloc) {
575 if (!validate_decl_type(data, let->val->func->alloc->type)) {
576 data->error(PSI_WARNING, "Cannot use '%s' as type for calloc in `let` statement",
577 let->val->func->alloc->type->name);
578 return 0;
579 }
580 }
581 if (let->val && let->val->var) {
582 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
583 impl_arg *iarg = impl->func->args->args[j];
584
585 if (!strcmp(let->val->var->name, iarg->var->name)) {
586 let->arg = iarg;
587 check = 1;
588 break;
589 }
590 }
591 if (!check) {
592 data->error(PSI_WARNING, "Unknown value '$%s' of `let` statement"
593 " for variable '%s' of implementation '%s'",
594 let->val->var->name, let->var->name, impl->func->name);
595 return 0;
596 }
597 }
598 }
599 return 1;
600 }
601 static inline int validate_impl_set_stmts(PSI_Data *data, impl *impl) {
602 size_t i, j, k;
603 /* we can have any count of set stmts; processing out vars */
604 /* check that set stmts reference known variables */
605 for (i = 0; i < impl->stmts->set.count; ++i) {
606 set_stmt *set = impl->stmts->set.list[i];
607 int check = 0;
608
609 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
610 impl_arg *iarg = impl->func->args->args[j];
611
612 if (!strcmp(set->var->name, iarg->var->name)) {
613 set->arg = iarg;
614 check = 1;
615 break;
616 }
617 }
618 if (!check) {
619 data->error(PSI_WARNING, "Unknown variable '$%s' of `set` statement"
620 " of implementation '%s'",
621 set->var->name, impl->func->name);
622 return 0;
623 }
624
625 for (j = 0; j < set->val->vars->count; ++j) {
626 decl_var *set_var = set->val->vars->vars[j];
627
628 check = 0;
629 if (impl->decl->args) for (k = 0; k < impl->decl->args->count; ++k) {
630 decl_arg *set_arg = impl->decl->args->args[k];
631
632 if (!strcmp(set_var->name, set_arg->var->name)) {
633 check = 1;
634 set_var->arg = set_arg;
635 if (!validate_set_value(data, set->val, set_arg, impl->decl->args)) {
636 return 0;
637 }
638 break;
639 }
640 }
641
642 if (!check) {
643 data->error(PSI_WARNING, "Unknown value '%s' of `set` statement"
644 " for variable '$%s' of implementation '%s'",
645 set_var->name, set->arg->var->name, impl->func->name);
646 return 0;
647 }
648 }
649 }
650 return 1;
651 }
652 static inline decl *locate_free_decl(decls *decls, free_call *f) {
653 if (decls) {
654 size_t i;
655
656 for (i = 0; i < decls->count; ++i) {
657 if (!strcmp(decls->list[i]->func->var->name, f->func)) {
658 f->decl = decls->list[i];
659 return decls->list[i];
660 }
661 }
662 }
663
664 return NULL;
665 }
666 static inline int validate_impl_free_stmts(PSI_Data *data, impl *impl) {
667 size_t i, j, k, l;
668 /* we can have any count of free stmts; freeing any out vars */
669 for (i = 0; i < impl->stmts->fre.count; ++i) {
670 free_stmt *fre = impl->stmts->fre.list[i];
671
672 for (j = 0; j < fre->calls->count; ++j) {
673 free_call *free_call = fre->calls->list[j];
674
675 /* first find the decl of the free func */
676 if (!locate_free_decl(data->decls, free_call)) {
677 data->error(PSI_WARNING, "Unknown function '%s' in `free` statement"
678 " of implementation '%s'", free_call->func, impl->func->name);
679 return 0;
680 }
681 if (!impl->decl->args) {
682 data->error(PSI_WARNING, "Declaration '%s' of implementation '%s'"
683 " does not have any arguments to free",
684 impl->decl->func->var->name, impl->func->name);
685 }
686
687 /* now check for known vars */
688 for (l = 0; l < free_call->vars->count; ++l) {
689 int check = 0;
690 decl_var *free_var = free_call->vars->vars[l];
691
692 for (k = 0; k < impl->decl->args->count; ++k) {
693 decl_arg *free_arg = impl->decl->args->args[k];
694
695 if (!strcmp(free_var->name, free_arg->var->name)) {
696 check = 1;
697 free_var->arg = free_arg;
698 break;
699 }
700 }
701
702 if (!check) {
703 data->error(PSI_WARNING, "Unknown variable '%s' of `free` statement"
704 " of implementation '%s'",
705 free_var->name, impl->func->name);
706 return 0;
707 }
708 }
709 }
710 }
711 return 1;
712 }
713 static inline int validate_impl_stmts(PSI_Data *data, impl *impl) {
714 if (!impl->stmts) {
715 data->error(PSI_WARNING, "Missing body for implementation %s!",
716 impl->func->name);
717 return 0;
718 }
719
720 if (!validate_impl_ret_stmt(data, impl)) {
721 return 0;
722 }
723
724 if (!validate_impl_let_stmts(data, impl)) {
725 return 0;
726 }
727 if (!validate_impl_set_stmts(data, impl)) {
728 return 0;
729 }
730 if (!validate_impl_free_stmts(data, impl)) {
731 return 0;
732 }
733
734 return 1;
735 }
736
737 PSI_Context *PSI_ContextInit(PSI_Context *C, PSI_ContextOps *ops, PSI_ContextErrorFunc error)
738 {
739 size_t i;
740 PSI_Data T;
741 struct psi_predef_type *predef_type;
742 struct psi_predef_const *predef_const;
743 struct psi_predef_struct *predef_struct;
744 struct psi_predef_decl *predef_decl;
745
746 if (!C) {
747 C = malloc(sizeof(*C));
748 }
749 memset(C, 0, sizeof(*C));
750
751 C->error = error;
752 C->ops = ops;
753
754 if (ops->init) {
755 ops->init(C);
756 }
757
758 ZEND_ASSERT(ops->call != NULL);
759 ZEND_ASSERT(ops->compile != NULL);
760
761 /* build up predefs in a temporary PSI_Data for validation */
762 memset(&T, 0, sizeof(T));
763 T.error = error;
764
765 for (predef_type = &psi_predef_types[0]; predef_type->type_tag; ++predef_type) {
766 decl_type *type = init_decl_type(predef_type->type_tag, predef_type->type_name);
767 decl_typedef *def = init_decl_typedef(predef_type->alias, type);
768
769 T.defs = add_decl_typedef(T.defs, def);
770 }
771 for (predef_const = &psi_predef_consts[0]; predef_const->type_tag; ++predef_const) {
772 impl_def_val *val = init_impl_def_val(predef_const->val_type_tag, predef_const->val_text);
773 const_type *type = init_const_type(predef_const->type_tag, predef_const->type_name);
774 constant *constant = init_constant(type, predef_const->var_name, val);
775
776 T.consts = add_constant(T.consts, constant);
777 }
778 for (predef_struct = &psi_predef_structs[0]; predef_struct->type_tag; ++predef_struct) {
779 struct psi_predef_struct *member;
780 decl_args *dargs = init_decl_args(NULL);
781 decl_struct *dstruct = init_decl_struct(predef_struct->var_name, dargs);
782
783 dstruct->size = predef_struct->size;
784 for (member = &predef_struct[1]; member->type_tag; ++member) {
785 decl_type *type;
786 decl_var *dvar;
787 decl_arg *darg;
788
789 type = init_decl_type(member->type_tag, member->type_name);
790 dvar = init_decl_var(member->var_name, member->pointer_level, member->array_size);
791 darg = init_decl_arg(type, dvar);
792 darg->layout = init_decl_struct_layout(member->offset, member->size);
793 dargs = add_decl_arg(dargs, darg);
794 }
795
796 T.structs = add_decl_struct(T.structs, dstruct);
797 predef_struct = member;
798 }
799 for (predef_decl = &psi_predef_decls[0]; predef_decl->type_tag; ++predef_decl) {
800 struct psi_predef_decl *farg;
801 decl_type *ftype = init_decl_type(predef_decl->type_tag, predef_decl->type_name);
802 decl_var *fname = init_decl_var(predef_decl->var_name, predef_decl->pointer_level, predef_decl->array_size);
803 decl_arg *func = init_decl_arg(ftype, fname);
804 decl_args *args = init_decl_args(NULL);
805 decl *decl = init_decl(init_decl_abi("default"), func, args);
806
807
808 for (farg = &predef_decl[1]; farg->type_tag; ++farg) {
809 decl_type *arg_type = init_decl_type(farg->type_tag, farg->type_name);
810 decl_var *arg_var = init_decl_var(farg->var_name, farg->pointer_level, farg->array_size);
811 decl_arg *darg = init_decl_arg(arg_type, arg_var);
812 args = add_decl_arg(args, darg);
813 }
814
815 T.decls = add_decl(T.decls, decl);
816 predef_decl = farg;
817 }
818
819 for (i = 0; i < T.defs->count; ++i) {
820 decl_typedef *def = T.defs->list[i];
821
822 if (validate_decl_typedef(&T, def)) {
823 C->defs = add_decl_typedef(C->defs, def);
824 }
825 }
826
827 for (i = 0; i < T.consts->count; ++i) {
828 constant *constant = T.consts->list[i];
829
830 if (validate_constant(&T, constant)) {
831 C->consts = add_constant(C->consts, constant);
832 }
833 }
834
835 for (i = 0; i < T.structs->count; ++i) {
836 decl_struct *dstruct = T.structs->list[i];
837
838 if (validate_decl_struct(&T, dstruct)) {
839 C->structs = add_decl_struct(C->structs, dstruct);
840 }
841 }
842
843 for (i = 0; i < T.decls->count; ++i) {
844 decl *decl = T.decls->list[i];
845
846 if (validate_decl(&T, NULL, decl)) {
847 C->decls = add_decl(C->decls, decl);
848 }
849 }
850
851 C->count = 1;
852 C->data = malloc(sizeof(*C->data));
853 PSI_DataExchange(C->data, &T);
854
855 return C;
856 }
857
858 int PSI_ContextValidate(PSI_Context *C, PSI_Parser *P)
859 {
860 PSI_Data *D;
861 void *dlopened = NULL;
862 size_t count = C->count++;
863
864 C->data = realloc(C->data, C->count * sizeof(*C->data));
865 D = PSI_DataExchange(&C->data[count], PSI_DATA(P));
866
867 if (D->defs) {
868 size_t i;
869
870 for (i = 0; i < D->defs->count; ++i) {
871 if (validate_decl_typedef(PSI_DATA(C), D->defs->list[i])) {
872 C->defs = add_decl_typedef(C->defs, D->defs->list[i]);
873 }
874 }
875 }
876 if (D->structs) {
877 size_t i;
878
879 for (i = 0; i < D->structs->count; ++i) {
880 if (validate_decl_struct(PSI_DATA(C), D->structs->list[i])) {
881 C->structs = add_decl_struct(C->structs, D->structs->list[i]);
882 }
883 }
884 }
885 if (D->consts) {
886 size_t i;
887
888 for (i = 0; i < D->consts->count; ++i) {
889 if (validate_constant(PSI_DATA(C), D->consts->list[i])) {
890 C->consts = add_constant(C->consts, D->consts->list[i]);
891 }
892 }
893 }
894
895 if (!validate_lib(D, &dlopened)) {
896 return 0;
897 }
898
899 add_decl_lib(&C->psi.libs, dlopened);
900
901 if (D->decls) {
902 size_t i;
903
904 for (i = 0; i < D->decls->count; ++i) {
905 if (validate_decl(PSI_DATA(C), dlopened, D->decls->list[i])) {
906 C->decls = add_decl(C->decls, D->decls->list[i]);
907 }
908 }
909 }
910 if (D->impls) {
911 size_t i;
912
913 for (i = 0; i < D->impls->count; ++i) {
914 if (validate_impl_stmts(PSI_DATA(C), D->impls->list[i])) {
915 C->impls = add_impl(C->impls, D->impls->list[i]);
916 }
917 }
918 }
919
920 return 1;
921 }
922
#ifndef FNM_CASEFOLD
#define FNM_CASEFOLD 0
#endif

/*
 * Directory scan filter: returns 1 for entries whose name matches
 * "*.psi" (case-insensitively where FNM_CASEFOLD is available), else 0.
 */
static int psi_select_dirent(const struct dirent *entry)
{
	int mismatch = fnmatch("*.psi", entry->d_name, FNM_CASEFOLD);

	return mismatch == 0;
}
930
931 void PSI_ContextBuild(PSI_Context *C, const char *paths)
932 {
933 int i, n, flags = psi_check_env("PSI_DEBUG") ? PSI_PARSER_DEBUG : 0;
934 char *sep = NULL, *cpy = strdup(paths), *ptr = cpy;
935 struct dirent **entries = NULL;
936
937
938 do {
939 sep = strchr(ptr, ':');
940
941 if (sep) {
942 *sep = 0;
943 }
944
945 n = php_scandir(ptr, &entries, psi_select_dirent, alphasort);
946
947 if (n > 0) {
948 for (i = 0; i < n; ++i) {
949 char psi[MAXPATHLEN];
950 PSI_Parser P;
951
952 if (MAXPATHLEN <= slprintf(psi, MAXPATHLEN, "%s/%s", ptr, entries[i]->d_name)) {
953 C->error(PSI_WARNING, "Path to PSI file too long: %s/%s",
954 ptr, entries[i]->d_name);
955 }
956 if (!PSI_ParserInit(&P, psi, C->error, flags)) {
957 C->error(PSI_WARNING, "Failed to init PSI parser (%s): %s",
958 psi, strerror(errno));
959 continue;
960 }
961
962 while (-1 != PSI_ParserScan(&P)) {
963 PSI_ParserParse(&P, PSI_TokenAlloc(&P));
964 };
965 PSI_ParserParse(&P, NULL);
966 PSI_ContextValidate(C, &P);
967 PSI_ParserDtor(&P);
968 }
969 }
970
971 if (entries) {
972 for (i = 0; i < n; ++i) {
973 free(entries[i]);
974 }
975 free(entries);
976 }
977
978 ptr = sep + 1;
979 } while (sep);
980
981
982 if (PSI_ContextCompile(C) && SUCCESS != zend_register_functions(NULL, C->closures, NULL, MODULE_PERSISTENT)) {
983 C->error(PSI_WARNING, "Failed to register functions!");
984 }
985
986 free(cpy);
987
988 }
989
990 zend_function_entry *PSI_ContextCompile(PSI_Context *C)
991 {
992 size_t i;
993
994 if (C->consts) {
995 zend_constant zc;
996
997 zc.flags = CONST_PERSISTENT|CONST_CS;
998 zc.module_number = EG(current_module)->module_number;
999
1000 for (i = 0; i < C->consts->count; ++i) {
1001 constant *c = C->consts->list[i];
1002
1003 zc.name = zend_string_init(c->name + (c->name[0] == '\\'), strlen(c->name) - (c->name[0] == '\\'), 1);
1004 ZVAL_NEW_STR(&zc.value, zend_string_init(c->val->text, strlen(c->val->text), 1));
1005
1006 switch (c->type->type) {
1007 case PSI_T_BOOL:
1008 convert_to_boolean(&zc.value);
1009 break;
1010 case PSI_T_INT:
1011 convert_to_long(&zc.value);
1012 break;
1013 case PSI_T_FLOAT:
1014 convert_to_double(&zc.value);
1015 break;
1016 }
1017 zend_register_constant(&zc);
1018 }
1019 }
1020
1021 return C->closures = C->ops->compile(C);
1022 }
1023
1024
1025 void PSI_ContextCall(PSI_Context *C, impl_val *ret_val, decl *decl)
1026 {
1027 C->ops->call(C, ret_val, decl);
1028 }
1029
1030 static inline void dump_decl_type(int fd, decl_type *t) {
1031 const char *pre;
1032
1033 switch (t->type) {
1034 case PSI_T_STRUCT:
1035 pre = "struct ";
1036 break;
1037 default:
1038 pre = "";
1039 }
1040 dprintf(fd, "%s%s", pre, t->name);
1041 }
1042 static inline void dump_decl_var(int fd, decl_var *v) {
1043 dprintf(fd, "%.*s%s", v->pointer_level-!!v->array_size, "**********", v->name);
1044 if (v->array_size) {
1045 dprintf(fd, "[%u]", v->array_size);
1046 }
1047 }
1048 static inline void dump_decl_arg(int fd, decl_arg *a) {
1049 dump_decl_type(fd, a->type);
1050 dprintf(fd, " ");
1051 dump_decl_var(fd, a->var);
1052 }
/* Write `level` tab characters to fd (at most nine). */
static inline void dump_level(int fd, unsigned level) {
	static const char tabs[] = "\t\t\t\t\t\t\t\t\t";

	dprintf(fd, "%.*s", level, tabs);
}
1056 static inline void dump_impl_set_value(int fd, set_value *set, unsigned level) {
1057 size_t i;
1058
1059 if (level > 1) {
1060 /* only if not directly after `set ...` */
1061 dump_level(fd, level);
1062 }
1063 dprintf(fd, "%s(", set->func->name);
1064
1065 for (i = 0; i < set->vars->count; ++i) {
1066 decl_var *svar = set->vars->vars[i];
1067 if (i) {
1068 dprintf(fd, ", ");
1069 }
1070 dump_decl_var(fd, svar);
1071 }
1072 if (set->inner) {
1073 dprintf(fd, ",\n");
1074 for (i = 0; i < set->count; ++i) {
1075 dump_impl_set_value(fd, set->inner[i], level+1);
1076 }
1077 /* only if inner stmts, i.e. with new lines, were dumped */
1078 dump_level(fd, level);
1079 }
1080 if (level > 1) {
1081 dprintf(fd, "),\n");
1082 } else {
1083 dprintf(fd, ");\n");
1084 }
1085 }
1086 void PSI_ContextDump(PSI_Context *C, int fd)
1087 {
1088 size_t i, j, k, l;
1089
1090 #ifdef HAVE_LIBJIT
1091 if (C->ops == PSI_Libjit()) {
1092 dprintf(fd, "// psi.engine=jit\n");
1093 }
1094 #endif
1095 #ifdef HAVE_LIBFFI
1096 if (C->ops == PSI_Libffi()) {
1097 dprintf(fd, "// psi.engine=ffi\n");
1098 }
1099 #endif
1100 dprintf(fd, "\n");
1101
1102 if (C->defs) {
1103 for (i = 0; i < C->defs->count; ++i) {
1104 decl_typedef *tdef = C->defs->list[i];
1105
1106 dprintf(fd, "typedef ");
1107 dump_decl_type(fd, tdef->type);
1108 dprintf(fd, " %s;\n", tdef->alias);
1109 }
1110 dprintf(fd, "\n");
1111 }
1112
1113 if (C->structs) {
1114 for (i = 0; i < C->structs->count; ++i) {
1115 decl_struct *strct = C->structs->list[i];
1116
1117 dprintf(fd, "struct %s::(%zu) {\n", strct->name, strct->size);
1118 if (strct->args) for (j = 0; j < strct->args->count; ++j) {
1119 decl_arg *sarg = strct->args->args[j];
1120
1121 dprintf(fd, "\t");
1122 dump_decl_arg(fd, sarg);
1123 dprintf(fd, "::(%zu, %zu);\n", sarg->layout->pos, sarg->layout->len);
1124 }
1125 dprintf(fd, "}\n");
1126 }
1127 dprintf(fd, "\n");
1128 }
1129 if (C->consts) {
1130 for (i = 0; i < C->consts->count; ++i) {
1131 constant *cnst = C->consts->list[i];
1132
1133 dprintf(fd, "const %s %s = ", cnst->type->name, cnst->name);
1134 if (cnst->val->type == PSI_T_QUOTED_STRING) {
1135 dprintf(fd, "\"%s\";\n", cnst->val->text);
1136 } else {
1137 dprintf(fd, "%s;\n", cnst->val->text);
1138 }
1139 }
1140 dprintf(fd, "\n");
1141 }
1142 if (C->decls) {
1143 for (i = 0; i < C->decls->count; ++i) {
1144 decl *decl = C->decls->list[i];
1145
1146 dprintf(fd, "%s ", decl->abi->convention);
1147 dump_decl_arg(fd, decl->func);
1148 dprintf(fd, "(");
1149 if (decl->args) for (j = 0; j < decl->args->count; ++j) {
1150 if (j) {
1151 dprintf(fd, ", ");
1152 }
1153 dump_decl_arg(fd, decl->args->args[j]);
1154 }
1155 dprintf(fd, ");\n");
1156 }
1157 dprintf(fd, "\n");
1158 }
1159 if (C->impls) {
1160 for (i = 0; i < C->impls->count; ++i) {
1161 impl *impl = C->impls->list[i];
1162
1163 dprintf(fd, "function %s(", impl->func->name);
1164 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
1165 impl_arg *iarg = impl->func->args->args[j];
1166
1167 dprintf(fd, "%s%s %s$%s",
1168 j ? ", " : "",
1169 iarg->type->name,
1170 iarg->var->reference ? "&" : "",
1171 iarg->var->name);
1172 if (iarg->def) {
1173 dprintf(fd, " = %s", iarg->def->text);
1174 }
1175 }
1176 dprintf(fd, ") : %s%s {\n",
1177 impl->func->return_reference ? "&":"",
1178 impl->func->return_type->name);
1179 if (impl->stmts) {
1180 for (j = 0; j < impl->stmts->let.count; ++j) {
1181 let_stmt *let = impl->stmts->let.list[j];
1182
1183 dprintf(fd, "\tlet %s", let->var->name);
1184 if (let->val) {
1185 dprintf(fd, " = %s", let->val->is_reference ? "&" : "");
1186 if (let->val->func) {
1187 dprintf(fd, "%s(", let->val->func->name);
1188 if (let->val->func->alloc) {
1189 dprintf(fd, "%zu, ", let->val->func->alloc->n);
1190 dump_decl_type(fd, let->val->func->alloc->type);
1191 } else {
1192 dprintf(fd, "$%s", let->val->var->name);
1193 }
1194 dprintf(fd, ");\n");
1195 } else {
1196 dprintf(fd, "NULL;\n");
1197 }
1198 }
1199 }
1200 for (j = 0; j < impl->stmts->ret.count; ++j) {
1201 return_stmt *ret = impl->stmts->ret.list[j];
1202
1203 dprintf(fd, "\treturn ");
1204 dump_impl_set_value(fd, ret->set, 1);
1205 }
1206 for (j = 0; j < impl->stmts->set.count; ++j) {
1207 set_stmt *set = impl->stmts->set.list[j];
1208
1209 dprintf(fd, "\tset $%s = ", set->var->name);
1210 dump_impl_set_value(fd, set->val, 1);
1211 }
1212 for (j = 0; j < impl->stmts->fre.count; ++j) {
1213 free_stmt *fre = impl->stmts->fre.list[j];
1214
1215 dprintf(fd, "\tfree ");
1216 for (k = 0; k < fre->calls->count; ++k) {
1217 free_call *call = fre->calls->list[k];
1218
1219 if (k) {
1220 dprintf(fd, ", ");
1221 }
1222 dprintf(fd, "%s(", call->func);
1223 for (l = 0; l < call->vars->count; ++l) {
1224 decl_var *fvar = call->vars->vars[l];
1225
1226 dump_decl_var(fd, fvar);
1227 }
1228 dprintf(fd, ");\n");
1229 }
1230 }
1231 }
1232 dprintf(fd, "}\n");
1233 }
1234 dprintf(fd, "\n");
1235 }
1236 }
1237
1238 void PSI_ContextDtor(PSI_Context *C)
1239 {
1240 size_t i;
1241 zend_function_entry *zfe;
1242
1243 if (C->ops->dtor) {
1244 C->ops->dtor(C);
1245 }
1246
1247 free_decl_libs(&C->psi.libs);
1248
1249 if (C->data) {
1250 for (i = 0; i < C->count; ++i) {
1251 PSI_DataDtor(&C->data[i]);
1252 }
1253 free(C->data);
1254 }
1255
1256 if (C->closures) {
1257 for (zfe = C->closures; zfe->fname; ++zfe) {
1258 free((void *) zfe->arg_info);
1259 }
1260 free(C->closures);
1261 }
1262
1263 if (C->consts) {
1264 if (C->consts->list) {
1265 free(C->consts->list);
1266 }
1267 free(C->consts);
1268 }
1269 if (C->defs) {
1270 if (C->defs->list) {
1271 free(C->defs->list);
1272 }
1273 free(C->defs);
1274 }
1275 if (C->structs) {
1276 if (C->structs->list) {
1277 free(C->structs->list);
1278 }
1279 free(C->structs);
1280 }
1281 if (C->decls) {
1282 if (C->decls->list) {
1283 free(C->decls->list);
1284 }
1285 free(C->decls);
1286 }
1287 if (C->impls) {
1288 if (C->impls->list) {
1289 free(C->impls->list);
1290 }
1291 free(C->impls);
1292 }
1293
1294 memset(C, 0, sizeof(*C));
1295 }
1296
1297 void PSI_ContextFree(PSI_Context **C)
1298 {
1299 if (*C) {
1300 PSI_ContextDtor(*C);
1301 free(*C);
1302 *C = NULL;
1303 }
1304 }