cbcfbc6b1d6ecd6e32ab0a2a099cf557cad958f1
[m6w6/ext-psi] / src / context.c
1 #ifdef HAVE_CONFIG_H
2 # include "config.h"
3 #endif
4
5 #include "php.h"
6
7 #include <stdio.h>
8 #ifdef HAVE_SYS_TYPES_H
9 # include <sys/types.h>
10 #endif
11 #ifdef HAVE_SYS_STAT_H
12 # include <sys/stat.h>
13 #endif
14 #ifdef STDC_HEADERS
15 # include <stdlib.h>
16 # include <stddef.h>
17 #else
18 # ifdef HAVE_STDLIB_H
19 # include <stdlib.h>
20 # endif
21 #endif
22 #ifdef HAVE_STRING_H
23 # if !defined STDC_HEADERS && defined HAVE_MEMORY_H
24 # include <memory.h>
25 # endif
26 # include <string.h>
27 #endif
28 #ifdef HAVE_STRINGS_H
29 # include <strings.h>
30 #endif
31 #ifdef HAVE_INTTYPES_H
32 # include <inttypes.h>
33 #endif
34 #ifdef HAVE_STDINT_H
35 # include <stdint.h>
36 #endif
37 #ifdef HAVE_UNISTD_H
38 # include <unistd.h>
39 #endif
40
41 #ifdef HAVE_ERRNO_H
42 # include <errno.h>
43 #endif
44 #ifdef HAVE_GLOB_H
45 # include <glob.h>
46 #endif
47 #ifdef HAVE_NETINET_IN_H
48 # include <netinet/in.h>
49 #endif
50 #ifdef HAVE_ARPA_NAMESER_H
51 # include <arpa/nameser.h>
52 #endif
53 #ifdef HAVE_NETDB_H
54 # include <netdb.h>
55 #endif
56 #ifdef HAVE_RESOLV_H
57 # include <resolv.h>
58 #endif
59 #ifdef HAVE_SYS_SELECT_H
60 # include <sys/select.h>
61 #endif
62 #ifdef HAVE_SYS_SOCKET_H
63 # include <sys/socket.h>
64 #endif
65 #ifdef HAVE_SYS_TIME_H
66 # include <sys/time.h>
67 #endif
68 #ifdef HAVE_SYS_TIMES_H
69 # include <sys/times.h>
70 #endif
71 #ifdef HAVE_SYS_UIO_H
72 # include <sys/uio.h>
73 #endif
74 #ifdef HAVE_SYS_UTSNAME_H
75 # include <sys/utsname.h>
76 #endif
77 #ifdef HAVE_TIME_H
78 # include <time.h>
79 #endif
80 #ifdef HAVE_WCHAR_H
81 # include <wchar.h>
82 #endif
83
84 #ifdef HAVE_DIRENT_H
85 # include <dirent.h>
86 # define NAMLEN(dirent) strlen ((dirent)->d_name)
87 #else
88 # define dirent direct
89 # define NAMLEN(dirent) ((dirent)->d_namlen)
90 # ifdef HAVE_SYS_NDIR_H
91 # include <sys/ndir.h>
92 # endif
93 # ifdef HAVE_SYS_DIR_H
94 # include <sys/dir.h>
95 # endif
96 # ifdef HAVE_NDIR_H
97 # include <ndir.h>
98 # endif
99 #endif
100
101 #include <sys/param.h>
102 #include <dlfcn.h>
103 #include <fnmatch.h>
104
105 #include "php.h"
106 #include "php_scandir.h"
107 #include "php_psi.h"
108 #include "context.h"
109 #include "parser.h"
110
111 #include "libjit.h"
112 #include "libffi.h"
113
114 static struct psi_std_type {
115 token_t type_tag;
116 const char *type_name;
117 } psi_std_types[] = {
118 {PSI_T_FLOAT, "float"},
119 {PSI_T_DOUBLE, "double"},
120 {PSI_T_INT8, "int8_t"},
121 {PSI_T_INT16, "int16_t"},
122 {PSI_T_INT32, "int32_t"},
123 {PSI_T_INT64, "int64_t"},
124 {PSI_T_UINT8, "uint8_t"},
125 {PSI_T_UINT16, "uint16_t"},
126 {PSI_T_UINT32, "uint32_t"},
127 {PSI_T_UINT64, "uint64_t"},
128 {0}
129 };
130
131 static struct psi_predef_type {
132 token_t type_tag;
133 const char *type_name;
134 const char *alias;
135 } psi_predef_types[] = {
136 PSI_TYPES
137 {0}
138 };
139
140 static struct psi_predef_const {
141 token_t type_tag;
142 const char *type_name;
143 const char *var_name;
144 const char *val_text;
145 token_t val_type_tag;
146 } psi_predef_consts[] = {
147 PSI_CONSTS
148 {0}
149 };
150
151 PSI_MACROS
152
153 static struct psi_func_redir {
154 const char *name;
155 void (*func)(void);
156 } psi_func_redirs[] = {
157 PSI_REDIRS
158 {0}
159 };
160
161 static struct psi_predef_decl {
162 token_t type_tag;
163 const char *type_name;
164 const char *var_name;
165 size_t pointer_level;
166 size_t array_size;
167 } psi_predef_decls[] = {
168 PSI_DECLS
169 {0}
170 };
171
172 static struct psi_predef_struct {
173 token_t type_tag;
174 const char *type_name;
175 const char *var_name;
176 size_t offset;
177 size_t size;
178 size_t pointer_level;
179 size_t array_size;
180 } psi_predef_structs[] = {
181 PSI_STRUCTS
182 {0}
183 };
184
185 static int validate_lib(PSI_Data *data, void **dlopened) {
186 char lib[MAXPATHLEN];
187 const char *ptr = data->psi.file.ln;
188 size_t len;
189
190 if (!ptr) {
191 /* FIXME: assume stdlib */
192 return 1;
193 } else if (!strchr(ptr, '/')) {
194 len = snprintf(lib, MAXPATHLEN, "lib%s.%s", ptr, PHP_PSI_SHLIB_SUFFIX);
195 if (MAXPATHLEN == len) {
196 data->error(PSI_WARNING, "Library name too long: '%s'", ptr);
197 }
198 lib[len] = 0;
199 ptr = lib;
200 }
201 if (!(*dlopened = dlopen(ptr, RTLD_LAZY|RTLD_LOCAL))) {
202 data->error(PSI_WARNING, "Could not open library '%s': %s.",
203 data->psi.file.ln, dlerror());
204 return 0;
205 }
206 return 1;
207 }
208
209 static inline int locate_decl_type_alias(decl_typedefs *defs, decl_type *type) {
210 size_t i;
211 struct psi_std_type *stdtyp;
212
213 if (type->real) {
214 return 1;
215 }
216 for (i = 0; i < defs->count; ++i) {
217 decl_typedef *def = defs->list[i];
218
219 if (def->type->type != type->type && !strcmp(def->alias, type->name)) {
220 type->real = def->type;
221 return 1;
222 }
223 }
224 for (stdtyp = &psi_std_types[0]; stdtyp->type_tag; ++stdtyp) {
225 if (!strcmp(type->name, stdtyp->type_name)) {
226 type->type = stdtyp->type_tag;
227 return 1;
228 }
229 }
230
231 return 0;
232 }
233 static inline int locate_decl_type_struct(decl_structs *structs, decl_type *type) {
234 size_t i;
235
236 if (type->strct) {
237 return 1;
238 }
239 for (i = 0; i < structs->count; ++i) {
240 if (!strcmp(structs->list[i]->name, type->name)) {
241 type->strct = structs->list[i];
242 return 1;
243 }
244 }
245 return 0;
246 }
247
248 static inline int validate_decl_type(PSI_Data *data, decl_type *type) {
249 switch (type->type) {
250 case PSI_T_NAME:
251 if (!data->defs || !locate_decl_type_alias(data->defs, type)) {
252 return 0;
253 }
254 if (type->real) {
255 return validate_decl_type(data, type->real);
256 }
257 return 1;
258 case PSI_T_STRUCT:
259 if (!data->structs || !locate_decl_type_struct(data->structs, type)) {
260 return 0;
261 }
262 break;
263 }
264 return 1;
265 }
266 static inline int validate_decl_typedef(PSI_Data *data, decl_typedef *def) {
267 if (!validate_decl_type(data, def->type)) {
268 data->error(PSI_WARNING, "Type '%s' cannot be aliased to %s'%s'",
269 def->type->name, def->type->type == PSI_T_STRUCT?"struct ":"",def->alias);
270 return 0;
271 }
272 /* FIXME: check def->alias */
273 return 1;
274 }
275
276 static inline int validate_constant(PSI_Data *data, constant *c) {
277 /* FIXME */
278 return 1;
279 }
280
281 static inline int validate_decl_arg(PSI_Data *data, decl_arg *arg) {
282 if (!validate_decl_type(data, arg->type)) {
283 data->error(PSI_WARNING, "Cannot use '%s'(%d) as type for '%s'",
284 arg->type->name, arg->type->type, arg->var->name);
285 return 0;
286 }
287 return 1;
288 }
289
290 static inline int validate_decl_struct(PSI_Data *data, decl_struct *s) {
291 size_t i;
292
293 for (i = 0; i < s->args->count; ++i) {
294 if (!validate_decl_arg(data, s->args->args[i])) {
295 return 0;
296 }
297 }
298
299 for (i = 0; i < s->args->count; ++i) {
300 decl_arg *darg = s->args->args[i];
301
302 if (!validate_decl_arg(data, darg)) {
303 return 0;
304 }
305
306 ZEND_ASSERT(!darg->var->arg || darg->var->arg == darg);
307 darg->var->arg = darg;
308
309 if (!darg->layout) {
310 token_t t;
311
312 if (darg->var->pointer_level && (!darg->var->array_size || darg->var->pointer_level == 1)) {
313 t = PSI_T_POINTER;
314 } else {
315 t = real_decl_type(darg->type)->type;
316 }
317
318 if (i) {
319 decl_arg *last = s->args->args[i-1];
320 darg->layout = init_decl_struct_layout(
321 psi_t_align(t, last->layout->pos + last->layout->len),
322 psi_t_size(t) * darg->var->array_size);
323 } else {
324 darg->layout = init_decl_struct_layout(0, psi_t_size(t));
325 }
326 }
327 if (s->size < darg->layout->pos + darg->layout->len) {
328 s->size = darg->layout->pos + darg->layout->len;
329 }
330 }
331 return 1;
332 }
333
334 static const char * const abi_ccs[] = {
335 "default", /* \ */
336 "extern", /* > - all the same */
337 "cdecl", /* / */
338 "stdcall",
339 "fastcall",
340 };
341 static inline int validate_decl_abi(PSI_Data *data, decl_abi *abi) {
342 size_t i;
343
344 for (i = 0; i < sizeof(abi_ccs)/sizeof(char*); ++i) {
345 if (strcasecmp(abi->convention, abi_ccs[i])) {
346 return 1;
347 }
348 }
349 data->error(PSI_WARNING, "Invalid calling convention: '%s'", abi->convention);
350 return 0;
351 }
352 static inline int validate_decl_func(PSI_Data *data, void *dl, decl *decl, decl_arg *func)
353 {
354 struct psi_func_redir *redir;
355
356 if (!strcmp(func->var->name, "dlsym")) {
357 data->error(PSI_WARNING, "Cannot dlsym dlsym (sic!)");
358 return 0;
359 }
360
361 if (!validate_decl_arg(data, func)) {
362 return 0;
363 }
364 for (redir = &psi_func_redirs[0]; redir->name; ++redir) {
365 if (!strcmp(func->var->name, redir->name)) {
366 decl->call.sym = redir->func;
367 }
368 }
369 if (!decl->call.sym) {
370 #ifndef RTLD_NEXT
371 # define RTLD_NEXT ((void *) -1l)
372 #endif
373 decl->call.sym = dlsym(dl ?: RTLD_NEXT, func->var->name);
374 if (!decl->call.sym) {
375 data->error(PSI_WARNING, "Failed to locate symbol '%s': %s",
376 func->var->name, dlerror());
377 }
378 }
379 return 1;
380 }
381
382 static inline int validate_decl(PSI_Data *data, void *dl, decl *decl) {
383 if (!validate_decl_abi(data, decl->abi)) {
384 return 0;
385 }
386 if (!validate_decl_func(data, dl, decl, decl->func)) {
387 return 0;
388 }
389 if (decl->args) {
390 size_t i;
391
392 for (i = 0; i < decl->args->count; ++i) {
393 if (!validate_decl_arg(data, decl->args->args[i])) {
394 return 0;
395 }
396 }
397 }
398 return 1;
399 }
400 static inline decl_arg *locate_decl_var_arg(decl_var *var, decl_args *args) {
401 size_t i;
402
403 for (i = 0; i < args->count; ++i) {
404 decl_arg *arg = args->args[i];
405
406 if (!strcmp(var->name, arg->var->name)) {
407 ZEND_ASSERT(!var->arg || var->arg == arg);
408 return var->arg = arg;
409 }
410 }
411
412 return NULL;
413 }
414 static inline decl_arg *locate_struct_member(decl_struct *s, decl_var *var) {
415 if (s->args) {
416 return locate_decl_var_arg(var, s->args);
417 }
418
419 return NULL;
420 }
421 static inline int validate_set_value(PSI_Data *data, set_value *set, decl_arg *ref, decl_args *ref_list) {
422 size_t i;
423 decl_type *ref_type = real_decl_type(ref->type);
424 decl_var *set_var = set->vars->vars[0];
425
426 switch (set->func->type) {
427 case PSI_T_TO_BOOL:
428 set->func->handler = psi_to_bool;
429 break;
430 case PSI_T_TO_INT:
431 set->func->handler = psi_to_int;
432 break;
433 case PSI_T_TO_FLOAT:
434 set->func->handler = psi_to_double;
435 break;
436 case PSI_T_TO_STRING:
437 set->func->handler = psi_to_string;
438 break;
439 case PSI_T_TO_ARRAY:
440 set->func->handler = psi_to_array;
441 break;
442 EMPTY_SWITCH_DEFAULT_CASE();
443 }
444
445 for (i = 1; i < set->vars->count; ++i) {
446 if (!locate_decl_var_arg(set->vars->vars[i], ref_list)) {
447 return 0;
448 }
449 }
450 set_var->arg = ref;
451
452 if (set->count) {
453 int is_to_array = (set->func->type == PSI_T_TO_ARRAY);
454 int is_pointer_to_struct = (ref_type->type == PSI_T_STRUCT && ref->var->pointer_level);
455
456 if (!is_to_array && !is_pointer_to_struct) {
457 data->error(E_WARNING, "Inner `set` statement casts only work with "
458 "to_array() casts on structs or pointers: %s(%s...", set->func->name, set->vars->vars[0]->name);
459 return 0;
460 }
461 }
462
463 if (ref_type->type == PSI_T_STRUCT) {
464 /* to_array(struct, to_...) */
465 for (i = 0; i < set->count; ++i) {
466 decl_var *sub_var = set->inner[i]->vars->vars[0];
467 decl_arg *sub_ref = locate_struct_member(ref_type->strct, sub_var);
468
469 set->inner[i]->outer.set = set;
470 if (sub_ref) {
471 if (!validate_set_value(data, set->inner[i], sub_ref, ref_type->strct->args)) {
472 return 0;
473 }
474 }
475 }
476 } else if (set->count == 1) {
477 /* to_array(ptr, to_string(*ptr)) */
478 decl_var *sub_var = set->inner[0]->vars->vars[0];
479 decl_arg *sub_ref = locate_decl_var_arg(sub_var, ref_list);
480
481 set->inner[0]->outer.set = set;
482 if (sub_ref) {
483 if (strcmp(sub_var->name, set_var->name)) {
484 data->error(E_WARNING, "Inner `set` statement casts on pointers must reference the same variable");
485 return 0;
486 }
487 if (!validate_set_value(data, set->inner[0], sub_ref, ref_list)) {
488 return 0;
489 }
490 }
491 } else if (set->count > 1) {
492 data->error(E_WARNING, "Inner `set` statement casts on pointers may only occur once");
493 return 0;
494 }
495
496 return 1;
497 }
498 static inline decl *locate_impl_decl(decls *decls, return_stmt *ret) {
499 if (decls) {
500 size_t i;
501
502 for (i = 0; i < decls->count; ++i) {
503 if (!strcmp(decls->list[i]->func->var->name, ret->set->vars->vars[0]->name)) {
504 ret->decl = decls->list[i]->func;
505 return decls->list[i];
506 }
507 }
508 }
509
510 return NULL;
511 }
512 static inline int validate_impl_ret_stmt(PSI_Data *data, impl *impl) {
513 return_stmt *ret;
514
515 /* we must have exactly one ret stmt delcaring the native func to call */
516 /* and which type cast to apply */
517 if (impl->stmts->ret.count != 1) {
518 if (impl->stmts->ret.count > 1) {
519 data->error(PSI_WARNING, "Too many `return` statements for implmentation %s;"
520 " found %zu, exactly one is needed",
521 impl->func->name, impl->stmts->ret.count);
522 } else {
523 data->error(PSI_WARNING, "Missing `return` statement for implementation %s",
524 impl->func->name);
525 }
526 return 0;
527 }
528
529 ret = impl->stmts->ret.list[0];
530
531 if (!(impl->decl = locate_impl_decl(data->decls, ret))) {
532 data->error(PSI_WARNING, "Missing declaration for implementation %s",
533 impl->func->name);
534 return 0;
535 }
536
537 if (!validate_set_value(data, ret->set, ret->decl, impl->decl->args)) {
538 return 0;
539 }
540
541 impl->decl->impl = impl;
542
543 return 1;
544 }
545 static inline int validate_impl_let_stmts(PSI_Data *data, impl *impl) {
546 size_t i, j;
547 /* we can have multiple let stmts */
548 /* check that we have a let stmt for every decl arg */
549 if (impl->decl->args) for (i = 0; i < impl->decl->args->count; ++i) {
550 decl_arg *darg = impl->decl->args->args[i];
551 int check = 0;
552
553 for (j = 0; j < impl->stmts->let.count; ++j) {
554 let_stmt *let = impl->stmts->let.list[j];
555
556 if (!strcmp(let->var->name, darg->var->name)) {
557 darg->let = let;
558 check = 1;
559 break;
560 }
561 }
562 if (!check) {
563 data->error(PSI_WARNING, "Missing `let` statement for arg '%s %.*s%s'"
564 " of declaration '%s' for implementation '%s'",
565 darg->type->name, (int) darg->var->pointer_level, "*****",
566 darg->var->name, impl->decl->func->var->name, impl->func->name);
567 return 0;
568 }
569 }
570 /* check that the let_value references a known variable or NULL */
571 for (i = 0; i < impl->stmts->let.count; ++i) {
572 let_stmt *let = impl->stmts->let.list[i];
573 int check = 0;
574
575 if (let->val && let->val->func && let->val->func->alloc) {
576 if (!validate_decl_type(data, let->val->func->alloc->type)) {
577 data->error(PSI_WARNING, "Cannot use '%s' as type for calloc in `let` statement",
578 let->val->func->alloc->type->name);
579 return 0;
580 }
581 }
582 if (let->val && let->val->var) {
583 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
584 impl_arg *iarg = impl->func->args->args[j];
585
586 if (!strcmp(let->val->var->name, iarg->var->name)) {
587 let->arg = iarg;
588 check = 1;
589 break;
590 }
591 }
592 if (!check) {
593 data->error(PSI_WARNING, "Unknown value '$%s' of `let` statement"
594 " for variable '%s' of implementation '%s'",
595 let->val->var->name, let->var->name, impl->func->name);
596 return 0;
597 }
598 }
599 }
600 return 1;
601 }
602 static inline int validate_impl_set_stmts(PSI_Data *data, impl *impl) {
603 size_t i, j, k;
604 /* we can have any count of set stmts; processing out vars */
605 /* check that set stmts reference known variables */
606 for (i = 0; i < impl->stmts->set.count; ++i) {
607 set_stmt *set = impl->stmts->set.list[i];
608 int check = 0;
609
610 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
611 impl_arg *iarg = impl->func->args->args[j];
612
613 if (!strcmp(set->var->name, iarg->var->name)) {
614 set->arg = iarg;
615 check = 1;
616 break;
617 }
618 }
619 if (!check) {
620 data->error(PSI_WARNING, "Unknown variable '$%s' of `set` statement"
621 " of implementation '%s'",
622 set->var->name, impl->func->name);
623 return 0;
624 }
625
626 for (j = 0; j < set->val->vars->count; ++j) {
627 decl_var *set_var = set->val->vars->vars[j];
628
629 check = 0;
630 if (impl->decl->args) for (k = 0; k < impl->decl->args->count; ++k) {
631 decl_arg *set_arg = impl->decl->args->args[k];
632
633 if (!strcmp(set_var->name, set_arg->var->name)) {
634 check = 1;
635 set_var->arg = set_arg;
636 if (!validate_set_value(data, set->val, set_arg, impl->decl->args)) {
637 return 0;
638 }
639 break;
640 }
641 }
642
643 if (!check) {
644 data->error(PSI_WARNING, "Unknown value '%s' of `set` statement"
645 " for variable '$%s' of implementation '%s'",
646 set_var->name, set->arg->var->name, impl->func->name);
647 return 0;
648 }
649 }
650 }
651 return 1;
652 }
653 static inline decl *locate_free_decl(decls *decls, free_call *f) {
654 if (decls) {
655 size_t i;
656
657 for (i = 0; i < decls->count; ++i) {
658 if (!strcmp(decls->list[i]->func->var->name, f->func)) {
659 f->decl = decls->list[i];
660 return decls->list[i];
661 }
662 }
663 }
664
665 return NULL;
666 }
667 static inline int validate_impl_free_stmts(PSI_Data *data, impl *impl) {
668 size_t i, j, k, l;
669 /* we can have any count of free stmts; freeing any out vars */
670 for (i = 0; i < impl->stmts->fre.count; ++i) {
671 free_stmt *fre = impl->stmts->fre.list[i];
672
673 for (j = 0; j < fre->calls->count; ++j) {
674 free_call *free_call = fre->calls->list[j];
675
676 /* first find the decl of the free func */
677 if (!locate_free_decl(data->decls, free_call)) {
678 data->error(PSI_WARNING, "Unknown function '%s' in `free` statement"
679 " of implementation '%s'", free_call->func, impl->func->name);
680 return 0;
681 }
682 if (!impl->decl->args) {
683 data->error(PSI_WARNING, "Declaration '%s' of implementation '%s'"
684 " does not have any arguments to free",
685 impl->decl->func->var->name, impl->func->name);
686 }
687
688 /* now check for known vars */
689 for (l = 0; l < free_call->vars->count; ++l) {
690 int check = 0;
691 decl_var *free_var = free_call->vars->vars[l];
692
693 for (k = 0; k < impl->decl->args->count; ++k) {
694 decl_arg *free_arg = impl->decl->args->args[k];
695
696 if (!strcmp(free_var->name, free_arg->var->name)) {
697 check = 1;
698 free_var->arg = free_arg;
699 break;
700 }
701 }
702
703 if (!check) {
704 data->error(PSI_WARNING, "Unknown variable '%s' of `free` statement"
705 " of implementation '%s'",
706 free_var->name, impl->func->name);
707 return 0;
708 }
709 }
710 }
711 }
712 return 1;
713 }
714 static inline int validate_impl_stmts(PSI_Data *data, impl *impl) {
715 if (!impl->stmts) {
716 data->error(PSI_WARNING, "Missing body for implementation %s!",
717 impl->func->name);
718 return 0;
719 }
720
721 if (!validate_impl_ret_stmt(data, impl)) {
722 return 0;
723 }
724
725 if (!validate_impl_let_stmts(data, impl)) {
726 return 0;
727 }
728 if (!validate_impl_set_stmts(data, impl)) {
729 return 0;
730 }
731 if (!validate_impl_free_stmts(data, impl)) {
732 return 0;
733 }
734
735 return 1;
736 }
737
738 PSI_Context *PSI_ContextInit(PSI_Context *C, PSI_ContextOps *ops, PSI_ContextErrorFunc error)
739 {
740 size_t i;
741 PSI_Data T;
742 struct psi_predef_type *predef_type;
743 struct psi_predef_const *predef_const;
744 struct psi_predef_struct *predef_struct;
745 struct psi_predef_decl *predef_decl;
746
747 if (!C) {
748 C = malloc(sizeof(*C));
749 }
750 memset(C, 0, sizeof(*C));
751
752 C->error = error;
753 C->ops = ops;
754
755 if (ops->init) {
756 ops->init(C);
757 }
758
759 ZEND_ASSERT(ops->call != NULL);
760 ZEND_ASSERT(ops->compile != NULL);
761
762 /* build up predefs in a temporary PSI_Data for validation */
763 memset(&T, 0, sizeof(T));
764 T.error = error;
765
766 for (predef_type = &psi_predef_types[0]; predef_type->type_tag; ++predef_type) {
767 decl_type *type = init_decl_type(predef_type->type_tag, predef_type->type_name);
768 decl_typedef *def = init_decl_typedef(predef_type->alias, type);
769
770 T.defs = add_decl_typedef(T.defs, def);
771 }
772 for (predef_const = &psi_predef_consts[0]; predef_const->type_tag; ++predef_const) {
773 impl_def_val *val = init_impl_def_val(predef_const->val_type_tag, predef_const->val_text);
774 const_type *type = init_const_type(predef_const->type_tag, predef_const->type_name);
775 constant *constant = init_constant(type, predef_const->var_name, val);
776
777 T.consts = add_constant(T.consts, constant);
778 }
779 for (predef_struct = &psi_predef_structs[0]; predef_struct->type_tag; ++predef_struct) {
780 struct psi_predef_struct *member;
781 decl_args *dargs = init_decl_args(NULL);
782 decl_struct *dstruct = init_decl_struct(predef_struct->var_name, dargs);
783
784 dstruct->size = predef_struct->size;
785 for (member = &predef_struct[1]; member->type_tag; ++member) {
786 decl_type *type;
787 decl_var *dvar;
788 decl_arg *darg;
789
790 type = init_decl_type(member->type_tag, member->type_name);
791 dvar = init_decl_var(member->var_name, member->pointer_level, member->array_size);
792 darg = init_decl_arg(type, dvar);
793 darg->layout = init_decl_struct_layout(member->offset, member->size);
794 dargs = add_decl_arg(dargs, darg);
795 }
796
797 T.structs = add_decl_struct(T.structs, dstruct);
798 predef_struct = member;
799 }
800 for (predef_decl = &psi_predef_decls[0]; predef_decl->type_tag; ++predef_decl) {
801 struct psi_predef_decl *farg;
802 decl_type *ftype = init_decl_type(predef_decl->type_tag, predef_decl->type_name);
803 decl_var *fname = init_decl_var(predef_decl->var_name, predef_decl->pointer_level, predef_decl->array_size);
804 decl_arg *func = init_decl_arg(ftype, fname);
805 decl_args *args = init_decl_args(NULL);
806 decl *decl = init_decl(init_decl_abi("default"), func, args);
807
808
809 for (farg = &predef_decl[1]; farg->type_tag; ++farg) {
810 decl_type *arg_type = init_decl_type(farg->type_tag, farg->type_name);
811 decl_var *arg_var = init_decl_var(farg->var_name, farg->pointer_level, farg->array_size);
812 decl_arg *darg = init_decl_arg(arg_type, arg_var);
813 args = add_decl_arg(args, darg);
814 }
815
816 T.decls = add_decl(T.decls, decl);
817 predef_decl = farg;
818 }
819
820 for (i = 0; i < T.defs->count; ++i) {
821 decl_typedef *def = T.defs->list[i];
822
823 if (validate_decl_typedef(&T, def)) {
824 C->defs = add_decl_typedef(C->defs, def);
825 }
826 }
827
828 for (i = 0; i < T.consts->count; ++i) {
829 constant *constant = T.consts->list[i];
830
831 if (validate_constant(&T, constant)) {
832 C->consts = add_constant(C->consts, constant);
833 }
834 }
835
836 for (i = 0; i < T.structs->count; ++i) {
837 decl_struct *dstruct = T.structs->list[i];
838
839 if (validate_decl_struct(&T, dstruct)) {
840 C->structs = add_decl_struct(C->structs, dstruct);
841 }
842 }
843
844 for (i = 0; i < T.decls->count; ++i) {
845 decl *decl = T.decls->list[i];
846
847 if (validate_decl(&T, NULL, decl)) {
848 C->decls = add_decl(C->decls, decl);
849 }
850 }
851
852 C->count = 1;
853 C->data = malloc(sizeof(*C->data));
854 PSI_DataExchange(C->data, &T);
855
856 return C;
857 }
858
859 int PSI_ContextValidate(PSI_Context *C, PSI_Parser *P)
860 {
861 PSI_Data *D;
862 void *dlopened = NULL;
863 size_t count = C->count++;
864
865 C->data = realloc(C->data, C->count * sizeof(*C->data));
866 D = PSI_DataExchange(&C->data[count], PSI_DATA(P));
867
868 if (D->defs) {
869 size_t i;
870
871 for (i = 0; i < D->defs->count; ++i) {
872 if (validate_decl_typedef(PSI_DATA(C), D->defs->list[i])) {
873 C->defs = add_decl_typedef(C->defs, D->defs->list[i]);
874 }
875 }
876 }
877 if (D->structs) {
878 size_t i;
879
880 for (i = 0; i < D->structs->count; ++i) {
881 if (validate_decl_struct(PSI_DATA(C), D->structs->list[i])) {
882 C->structs = add_decl_struct(C->structs, D->structs->list[i]);
883 }
884 }
885 }
886 if (D->consts) {
887 size_t i;
888
889 for (i = 0; i < D->consts->count; ++i) {
890 if (validate_constant(PSI_DATA(C), D->consts->list[i])) {
891 C->consts = add_constant(C->consts, D->consts->list[i]);
892 }
893 }
894 }
895
896 if (!validate_lib(D, &dlopened)) {
897 return 0;
898 }
899
900 add_decl_lib(&C->psi.libs, dlopened);
901
902 if (D->decls) {
903 size_t i;
904
905 for (i = 0; i < D->decls->count; ++i) {
906 if (validate_decl(PSI_DATA(C), dlopened, D->decls->list[i])) {
907 C->decls = add_decl(C->decls, D->decls->list[i]);
908 }
909 }
910 }
911 if (D->impls) {
912 size_t i;
913
914 for (i = 0; i < D->impls->count; ++i) {
915 if (validate_impl_stmts(PSI_DATA(C), D->impls->list[i])) {
916 C->impls = add_impl(C->impls, D->impls->list[i]);
917 }
918 }
919 }
920
921 return 1;
922 }
923
/*
 * scandir() filter: selects directory entries whose name matches "*.psi".
 * The match ignores case where fnmatch() offers FNM_CASEFOLD.
 *
 * Returns 1 for a match, else 0.
 */
static int psi_select_dirent(const struct dirent *entry)
{
#ifndef FNM_CASEFOLD
#define FNM_CASEFOLD 0
#endif
	if (fnmatch("*.psi", entry->d_name, FNM_CASEFOLD) != 0) {
		return 0;
	}
	return 1;
}
931
932 void PSI_ContextBuild(PSI_Context *C, const char *paths)
933 {
934 int i, n, flags = psi_check_env("PSI_DEBUG") ? PSI_PARSER_DEBUG : 0;
935 char *sep = NULL, *cpy = strdup(paths), *ptr = cpy;
936 struct dirent **entries = NULL;
937
938
939 do {
940 sep = strchr(ptr, ':');
941
942 if (sep) {
943 *sep = 0;
944 }
945
946 n = php_scandir(ptr, &entries, psi_select_dirent, alphasort);
947
948 if (n > 0) {
949 for (i = 0; i < n; ++i) {
950 char psi[MAXPATHLEN];
951 PSI_Parser P;
952
953 if (MAXPATHLEN <= slprintf(psi, MAXPATHLEN, "%s/%s", ptr, entries[i]->d_name)) {
954 C->error(PSI_WARNING, "Path to PSI file too long: %s/%s",
955 ptr, entries[i]->d_name);
956 }
957 if (!PSI_ParserInit(&P, psi, C->error, flags)) {
958 C->error(PSI_WARNING, "Failed to init PSI parser (%s): %s",
959 psi, strerror(errno));
960 continue;
961 }
962
963 while (0 < PSI_ParserScan(&P)) {
964 PSI_ParserParse(&P, PSI_TokenAlloc(&P));
965 if (P.num == PSI_T_EOF) {
966 break;
967 }
968 }
969
970 PSI_ParserParse(&P, NULL);
971 PSI_ContextValidate(C, &P);
972 PSI_ParserDtor(&P);
973 }
974 }
975
976 if (entries) {
977 for (i = 0; i < n; ++i) {
978 free(entries[i]);
979 }
980 free(entries);
981 }
982
983 ptr = sep + 1;
984 } while (sep);
985
986
987 if (PSI_ContextCompile(C) && SUCCESS != zend_register_functions(NULL, C->closures, NULL, MODULE_PERSISTENT)) {
988 C->error(PSI_WARNING, "Failed to register functions!");
989 }
990
991 free(cpy);
992
993 }
994
995 zend_function_entry *PSI_ContextCompile(PSI_Context *C)
996 {
997 size_t i;
998
999 if (C->consts) {
1000 zend_constant zc;
1001
1002 zc.flags = CONST_PERSISTENT|CONST_CS;
1003 zc.module_number = EG(current_module)->module_number;
1004
1005 for (i = 0; i < C->consts->count; ++i) {
1006 constant *c = C->consts->list[i];
1007
1008 zc.name = zend_string_init(c->name + (c->name[0] == '\\'), strlen(c->name) - (c->name[0] == '\\'), 1);
1009 ZVAL_NEW_STR(&zc.value, zend_string_init(c->val->text, strlen(c->val->text), 1));
1010
1011 switch (c->type->type) {
1012 case PSI_T_BOOL:
1013 convert_to_boolean(&zc.value);
1014 break;
1015 case PSI_T_INT:
1016 convert_to_long(&zc.value);
1017 break;
1018 case PSI_T_FLOAT:
1019 convert_to_double(&zc.value);
1020 break;
1021 }
1022 zend_register_constant(&zc);
1023 }
1024 }
1025
1026 return C->closures = C->ops->compile(C);
1027 }
1028
1029
1030 void PSI_ContextCall(PSI_Context *C, impl_val *ret_val, decl *decl)
1031 {
1032 C->ops->call(C, ret_val, decl);
1033 }
1034
1035 static inline void dump_decl_type(int fd, decl_type *t) {
1036 const char *pre;
1037
1038 switch (t->type) {
1039 case PSI_T_STRUCT:
1040 pre = "struct ";
1041 break;
1042 default:
1043 pre = "";
1044 }
1045 dprintf(fd, "%s%s", pre, t->name);
1046 }
1047 static inline void dump_decl_var(int fd, decl_var *v) {
1048 dprintf(fd, "%.*s%s", v->pointer_level-!!v->array_size, "**********", v->name);
1049 if (v->array_size) {
1050 dprintf(fd, "[%u]", v->array_size);
1051 }
1052 }
1053 static inline void dump_decl_arg(int fd, decl_arg *a) {
1054 dump_decl_type(fd, a->type);
1055 dprintf(fd, " ");
1056 dump_decl_var(fd, a->var);
1057 }
/* Write `level` tabs of indentation to `fd`; at most nine are available. */
static inline void dump_level(int fd, unsigned level) {
	static const char tabs[] = "\t\t\t\t\t\t\t\t\t";

	dprintf(fd, "%.*s", level, tabs);
}
1061 static inline void dump_impl_set_value(int fd, set_value *set, unsigned level) {
1062 size_t i;
1063
1064 if (level > 1) {
1065 /* only if not directly after `set ...` */
1066 dump_level(fd, level);
1067 }
1068 dprintf(fd, "%s(", set->func->name);
1069
1070 for (i = 0; i < set->vars->count; ++i) {
1071 decl_var *svar = set->vars->vars[i];
1072 if (i) {
1073 dprintf(fd, ", ");
1074 }
1075 dump_decl_var(fd, svar);
1076 }
1077 if (set->inner) {
1078 dprintf(fd, ",\n");
1079 for (i = 0; i < set->count; ++i) {
1080 dump_impl_set_value(fd, set->inner[i], level+1);
1081 }
1082 /* only if inner stmts, i.e. with new lines, were dumped */
1083 dump_level(fd, level);
1084 }
1085 if (level > 1) {
1086 dprintf(fd, "),\n");
1087 } else {
1088 dprintf(fd, ");\n");
1089 }
1090 }
1091 void PSI_ContextDump(PSI_Context *C, int fd)
1092 {
1093 size_t i, j, k, l;
1094
1095 #ifdef HAVE_LIBJIT
1096 if (C->ops == PSI_Libjit()) {
1097 dprintf(fd, "// psi.engine=jit\n");
1098 }
1099 #endif
1100 #ifdef HAVE_LIBFFI
1101 if (C->ops == PSI_Libffi()) {
1102 dprintf(fd, "// psi.engine=ffi\n");
1103 }
1104 #endif
1105 dprintf(fd, "\n");
1106
1107 if (C->defs) {
1108 for (i = 0; i < C->defs->count; ++i) {
1109 decl_typedef *tdef = C->defs->list[i];
1110
1111 dprintf(fd, "typedef ");
1112 dump_decl_type(fd, tdef->type);
1113 dprintf(fd, " %s;\n", tdef->alias);
1114 }
1115 dprintf(fd, "\n");
1116 }
1117
1118 if (C->structs) {
1119 for (i = 0; i < C->structs->count; ++i) {
1120 decl_struct *strct = C->structs->list[i];
1121
1122 dprintf(fd, "struct %s::(%zu) {\n", strct->name, strct->size);
1123 if (strct->args) for (j = 0; j < strct->args->count; ++j) {
1124 decl_arg *sarg = strct->args->args[j];
1125
1126 dprintf(fd, "\t");
1127 dump_decl_arg(fd, sarg);
1128 dprintf(fd, "::(%zu, %zu);\n", sarg->layout->pos, sarg->layout->len);
1129 }
1130 dprintf(fd, "}\n");
1131 }
1132 dprintf(fd, "\n");
1133 }
1134 if (C->consts) {
1135 for (i = 0; i < C->consts->count; ++i) {
1136 constant *cnst = C->consts->list[i];
1137
1138 dprintf(fd, "const %s %s = ", cnst->type->name, cnst->name);
1139 if (cnst->val->type == PSI_T_QUOTED_STRING) {
1140 dprintf(fd, "\"%s\";\n", cnst->val->text);
1141 } else {
1142 dprintf(fd, "%s;\n", cnst->val->text);
1143 }
1144 }
1145 dprintf(fd, "\n");
1146 }
1147 if (C->decls) {
1148 for (i = 0; i < C->decls->count; ++i) {
1149 decl *decl = C->decls->list[i];
1150
1151 dprintf(fd, "%s ", decl->abi->convention);
1152 dump_decl_arg(fd, decl->func);
1153 dprintf(fd, "(");
1154 if (decl->args) for (j = 0; j < decl->args->count; ++j) {
1155 if (j) {
1156 dprintf(fd, ", ");
1157 }
1158 dump_decl_arg(fd, decl->args->args[j]);
1159 }
1160 dprintf(fd, ");\n");
1161 }
1162 dprintf(fd, "\n");
1163 }
1164 if (C->impls) {
1165 for (i = 0; i < C->impls->count; ++i) {
1166 impl *impl = C->impls->list[i];
1167
1168 dprintf(fd, "function %s(", impl->func->name);
1169 if (impl->func->args) for (j = 0; j < impl->func->args->count; ++j) {
1170 impl_arg *iarg = impl->func->args->args[j];
1171
1172 dprintf(fd, "%s%s %s$%s",
1173 j ? ", " : "",
1174 iarg->type->name,
1175 iarg->var->reference ? "&" : "",
1176 iarg->var->name);
1177 if (iarg->def) {
1178 dprintf(fd, " = %s", iarg->def->text);
1179 }
1180 }
1181 dprintf(fd, ") : %s%s {\n",
1182 impl->func->return_reference ? "&":"",
1183 impl->func->return_type->name);
1184 if (impl->stmts) {
1185 for (j = 0; j < impl->stmts->let.count; ++j) {
1186 let_stmt *let = impl->stmts->let.list[j];
1187
1188 dprintf(fd, "\tlet %s", let->var->name);
1189 if (let->val) {
1190 dprintf(fd, " = %s", let->val->is_reference ? "&" : "");
1191 if (let->val->func) {
1192 dprintf(fd, "%s(", let->val->func->name);
1193 if (let->val->func->alloc) {
1194 dprintf(fd, "%zu, ", let->val->func->alloc->n);
1195 dump_decl_type(fd, let->val->func->alloc->type);
1196 } else {
1197 dprintf(fd, "$%s", let->val->var->name);
1198 }
1199 dprintf(fd, ");\n");
1200 } else {
1201 dprintf(fd, "NULL;\n");
1202 }
1203 }
1204 }
1205 for (j = 0; j < impl->stmts->ret.count; ++j) {
1206 return_stmt *ret = impl->stmts->ret.list[j];
1207
1208 dprintf(fd, "\treturn ");
1209 dump_impl_set_value(fd, ret->set, 1);
1210 }
1211 for (j = 0; j < impl->stmts->set.count; ++j) {
1212 set_stmt *set = impl->stmts->set.list[j];
1213
1214 dprintf(fd, "\tset $%s = ", set->var->name);
1215 dump_impl_set_value(fd, set->val, 1);
1216 }
1217 for (j = 0; j < impl->stmts->fre.count; ++j) {
1218 free_stmt *fre = impl->stmts->fre.list[j];
1219
1220 dprintf(fd, "\tfree ");
1221 for (k = 0; k < fre->calls->count; ++k) {
1222 free_call *call = fre->calls->list[k];
1223
1224 if (k) {
1225 dprintf(fd, ", ");
1226 }
1227 dprintf(fd, "%s(", call->func);
1228 for (l = 0; l < call->vars->count; ++l) {
1229 decl_var *fvar = call->vars->vars[l];
1230
1231 dump_decl_var(fd, fvar);
1232 }
1233 dprintf(fd, ");\n");
1234 }
1235 }
1236 }
1237 dprintf(fd, "}\n");
1238 }
1239 dprintf(fd, "\n");
1240 }
1241 }
1242
1243 void PSI_ContextDtor(PSI_Context *C)
1244 {
1245 size_t i;
1246 zend_function_entry *zfe;
1247
1248 if (C->ops->dtor) {
1249 C->ops->dtor(C);
1250 }
1251
1252 free_decl_libs(&C->psi.libs);
1253
1254 if (C->data) {
1255 for (i = 0; i < C->count; ++i) {
1256 PSI_DataDtor(&C->data[i]);
1257 }
1258 free(C->data);
1259 }
1260
1261 if (C->closures) {
1262 for (zfe = C->closures; zfe->fname; ++zfe) {
1263 free((void *) zfe->arg_info);
1264 }
1265 free(C->closures);
1266 }
1267
1268 if (C->consts) {
1269 if (C->consts->list) {
1270 free(C->consts->list);
1271 }
1272 free(C->consts);
1273 }
1274 if (C->defs) {
1275 if (C->defs->list) {
1276 free(C->defs->list);
1277 }
1278 free(C->defs);
1279 }
1280 if (C->structs) {
1281 if (C->structs->list) {
1282 free(C->structs->list);
1283 }
1284 free(C->structs);
1285 }
1286 if (C->decls) {
1287 if (C->decls->list) {
1288 free(C->decls->list);
1289 }
1290 free(C->decls);
1291 }
1292 if (C->impls) {
1293 if (C->impls->list) {
1294 free(C->impls->list);
1295 }
1296 free(C->impls);
1297 }
1298
1299 memset(C, 0, sizeof(*C));
1300 }
1301
1302 void PSI_ContextFree(PSI_Context **C)
1303 {
1304 if (*C) {
1305 PSI_ContextDtor(*C);
1306 free(*C);
1307 *C = NULL;
1308 }
1309 }