X-Git-Url: https://git.m6w6.name/?p=m6w6%2Fext-psi;a=blobdiff_plain;f=src%2Fparser.h;h=5129097dc45d5b14271f4c39ba5ad0b40a0fbbd5;hp=3b4c77faca030b0bef00ce37f9219c0f8ad52880;hb=cfebc76ed7426836f21296cca9a14b422bfa04cf;hpb=3c53642a0adccd4b602d147833da24eb4b73bccc diff --git a/src/parser.h b/src/parser.h index 3b4c77f..5129097 100644 --- a/src/parser.h +++ b/src/parser.h @@ -12,6 +12,7 @@ #define BSIZE 256 +#define PSI_T_POINTER PSI_T_ASTERISK typedef int token_t; /* in php_psi.h */ @@ -20,12 +21,37 @@ size_t psi_t_size(token_t); typedef struct PSI_Token { token_t type; - unsigned line; - size_t size; - char text[1]; + unsigned size, *line; + char *text, *file; + char buf[1]; } PSI_Token; +typedef union impl_val { + char cval; + int8_t i8; + uint8_t u8; + short sval; + int16_t i16; + uint16_t u16; + int ival; + int32_t i32; + uint32_t u32; + long lval; + int64_t i64; + uint64_t u64; + float fval; + double dval; + union { + zend_bool bval; + zend_long lval; + zend_string *str; + } zend; + void *ptr; + uint8_t _dbg[sizeof(void *)]; +} impl_val; + typedef struct decl_type { + PSI_Token *token; char *name; token_t type; struct decl_type *real; @@ -47,11 +73,15 @@ static inline decl_type *real_decl_type(decl_type *type) { } static inline void free_decl_type(decl_type *type) { + if (type->token) { + free(type->token); + } free(type->name); free(type); } typedef struct decl_typedef { + PSI_Token *token; char *alias; decl_type *type; } decl_typedef; @@ -64,6 +94,9 @@ static inline decl_typedef *init_decl_typedef(const char *name, decl_type *type) } static inline void free_decl_typedef(decl_typedef *t) { + if (t->token) { + free(t->token); + } free(t->alias); free_decl_type(t->type); free(t); @@ -94,6 +127,7 @@ static void free_decl_typedefs(decl_typedefs *defs) { } typedef struct decl_var { + PSI_Token *token; char *name; unsigned pointer_level; unsigned array_size; @@ -109,6 +143,9 @@ static inline decl_var *init_decl_var(const char *name, unsigned pl, unsigned as } static inline void free_decl_var(decl_var *var) { + if (var->token) { + free(var->token); + } free(var->name); free(var); } @@ -131,16 +168,23 @@ static inline void free_decl_struct_layout(decl_struct_layout *l) { } typedef struct decl_arg { + PSI_Token *token; decl_type *type; decl_var *var; decl_struct_layout *layout; struct let_stmt *let; + impl_val val; + void *ptr; + void *mem; } decl_arg; static inline decl_arg *init_decl_arg(decl_type *type, decl_var *var) { decl_arg *arg = calloc(1, sizeof(*arg)); + arg->token = var->token; arg->type = type; arg->var = var; + var->arg = arg; + arg->ptr = &arg->val; return arg; } @@ -187,6 +231,7 @@ static inline void free_decl_vars(decl_vars *vars) { typedef struct decl_args { decl_arg **args; size_t count; + unsigned varargs:1; } decl_args; static inline decl_args *init_decl_args(decl_arg *arg) { @@ -216,6 +261,7 @@ static inline void free_decl_args(decl_args *args) { } typedef struct decl_abi { + PSI_Token *token; char *convention; } decl_abi; @@ -226,15 +272,27 @@ static inline decl_abi *init_decl_abi(const char *convention) { } static inline void free_decl_abi(decl_abi *abi) { + if (abi->token) { + free(abi->token); + } free(abi->convention); free(abi); } +typedef struct decl_callinfo { + void *sym; + void *info; + size_t argc; + void **args; + void *rval; +} decl_callinfo; + typedef struct decl { decl_abi *abi; decl_arg *func; decl_args *args; - void *dlptr; + struct impl *impl; + decl_callinfo call; } decl; static inline decl* init_decl(decl_abi *abi, decl_arg *func, decl_args *args) { @@ -279,6 +337,7 @@ static inline void free_decls(decls *decls) { } typedef struct decl_struct { + PSI_Token *token; char *name; decl_args *args; size_t size; @@ -292,6 +351,9 @@ static inline decl_struct *init_decl_struct(const char *name, decl_args *args) { } static inline void free_decl_struct(decl_struct *s) { + if (s->token) { + free(s->token); + } if (s->args) { free_decl_args(s->args); } @@ -323,50 +385,6 @@ static inline void free_decl_structs(decl_structs *ss) { free(ss); } -typedef union impl_val { - char cval; - int8_t i8; - short sval; - int16_t i16; - int ival; - int32_t i32; - long lval; - int64_t i64; - float fval; - double dval; - union { - zend_bool bval; - zend_long lval; - zend_string *str; - } zend; - void *ptr; - uint8_t _dbg[sizeof(void *)]; -} impl_val; - -static inline impl_val *deref_impl_val(impl_val *ret_val, decl_var *var) { - unsigned i; - - if (var->arg->var != var) for (i = 0; i < var->pointer_level; ++i) { - ret_val = *(void **) ret_val; - } - return ret_val; -} - -static inline impl_val *enref_impl_val(void *ptr, decl_var *var) { - impl_val *val, *val_ptr; - unsigned i; - - if (!var->pointer_level) { - return ptr; - } - val = val_ptr = calloc(var->pointer_level, sizeof(void *)); - for (i = 1; i < var->pointer_level; ++i) { - val_ptr->ptr = (void **) val_ptr + 1; - val_ptr = val_ptr->ptr; - } - val_ptr->ptr = ptr; - return val; -} typedef struct impl_type { char *name; token_t type; @@ -386,6 +404,7 @@ static inline void free_impl_type(impl_type *type) { } typedef struct impl_var { + PSI_Token *token; char *name; unsigned reference:1; } impl_var; @@ -398,6 +417,9 @@ static inline impl_var *init_impl_var(const char *name, int is_reference) { } static inline void free_impl_var(impl_var *var) { + if (var->token) { + free(var->token); + } free(var->name); free(var); } @@ -419,6 +441,68 @@ static inline void free_impl_def_val(impl_def_val *def) { free(def); } +typedef struct const_type { + token_t type; + char *name; +} const_type; + +static inline const_type *init_const_type(token_t type, const char *name) { + const_type *ct = calloc(1, sizeof(*ct)); + ct->type = type; + ct->name = strdup(name); + return ct; +} + +static inline void free_const_type(const_type *type) { + free(type->name); + free(type); +} + +typedef struct constant { + const_type *type; + char *name; + impl_def_val *val; +} constant; + +static inline constant *init_constant(const_type *type, const char *name, impl_def_val *val) { + constant *c = calloc(1, sizeof(*c)); + c->type = type; + c->name = strdup(name); + c->val = val; + return c; +} + +static inline void free_constant(constant *constant) { + free_const_type(constant->type); + free(constant->name); + free_impl_def_val(constant->val); + free(constant); +} + +typedef struct constants { + size_t count; + constant **list; +} constants; + +static inline constants *add_constant(constants *constants, constant *constant) { + if (!constants) { + constants = calloc(1, sizeof(*constants)); + } + constants->list = realloc(constants->list, ++constants->count * sizeof(*constants->list)); + constants->list[constants->count-1] = constant; + return constants; +} + +static inline void free_constants(constants *c) { + size_t i; + + for (i = 0; i < c->count; ++i) { + free_constant(c->list[i]); + } + free(c->list); + free(c); +} + typedef struct impl_arg { impl_type *type; impl_var *var; @@ -444,9 +528,18 @@ static inline void free_impl_arg(impl_arg *arg) { free(arg); } +typedef struct impl_vararg { + impl_arg *name; + struct impl_args *args; + token_t *types; + impl_val *values; + void **free_list; +} impl_vararg; + typedef struct impl_args { impl_arg **args; size_t count; + impl_vararg vararg; } impl_args; static inline impl_args *init_impl_args(impl_arg *arg) { @@ -471,11 +564,15 @@ static inline void free_impl_args(impl_args *args) { for (i = 0; i < args->count; ++i) { free_impl_arg(args->args[i]); } + if (args->vararg.name) { + free_impl_arg(args->vararg.name); + } free(args->args); free(args); } typedef struct impl_func { + PSI_Token *token; char *name; impl_args *args; impl_type *return_type; @@ -492,85 +589,177 @@ static inline impl_func *init_impl_func(char *name, impl_args *args, impl_type * } static inline void free_impl_func(impl_func *f) { + if (f->token) { + free(f->token); + } free_impl_type(f->return_type); free_impl_args(f->args); free(f->name); free(f); } +typedef struct num_exp { + PSI_Token *token; + token_t t; + union { + char *numb; + constant *cnst; + decl_var *dvar; + } u; + token_t operator; + int (*calculator)(int t1, impl_val *v1, int t2, impl_val *v2, impl_val *res); + struct num_exp *operand; +} num_exp; + +static inline num_exp *init_num_exp(token_t t, void *num) { + num_exp *exp = calloc(1, sizeof(*exp)); + switch (exp->t = t) { + case PSI_T_NUMBER: + case PSI_T_NSNAME: + exp->u.numb = strdup(num); + break; + case PSI_T_NAME: + exp->u.dvar = num; + break; + EMPTY_SWITCH_DEFAULT_CASE(); + } + return exp; +} + +static inline void free_num_exp(num_exp *exp) { + if (exp->token) { + free(exp->token); + } + switch (exp->t) { + case PSI_T_NUMBER: + free(exp->u.numb); + break; + case PSI_T_NSNAME: + break; + case PSI_T_NAME: + free_decl_var(exp->u.dvar); + break; + EMPTY_SWITCH_DEFAULT_CASE(); + } + if (exp->operand) { + free_num_exp(exp->operand); + } + free(exp); +} + typedef struct let_calloc { - size_t n; - decl_type *type; + num_exp *nmemb; + num_exp *size; } let_calloc; -static inline let_calloc *init_let_calloc(long n, decl_type *type) { +static inline let_calloc *init_let_calloc(num_exp *nmemb, num_exp *size) { let_calloc *alloc = calloc(1, sizeof(*alloc)); - alloc->n = n; - alloc->type = type; + alloc->nmemb = nmemb; + alloc->size = size; return alloc; } static inline void free_let_calloc(let_calloc *alloc) { - free_decl_type(alloc->type); + free_num_exp(alloc->nmemb); + free_num_exp(alloc->size); free(alloc); } typedef struct let_func { token_t type; char *name; - let_calloc *alloc; + impl_var *var; + impl_arg *arg; } let_func; -static inline let_func *init_let_func(token_t type, const char *name, let_calloc *alloc) { +static inline let_func *init_let_func(token_t type, const char *name, impl_var *var) { let_func *func = calloc(1, sizeof(*func)); func->type = type; func->name = strdup(name); - func->alloc = alloc; + func->var = var; return func; } static inline void free_let_func(let_func *func) { - if (func->alloc) { - free_let_calloc(func->alloc); - } + free_impl_var(func->var); free(func->name); free(func); } -typedef struct let_value { - let_func *func; - impl_var *var; - unsigned is_reference:1; -} let_value; - -static inline let_value *init_let_value(let_func *func, impl_var *var, int is_reference) { - let_value *val = calloc(1, sizeof(*val)); - val->is_reference = is_reference; - val->func = func; - val->var = var; - return val; +#define PSI_LET_REFERENCE 0x1; +typedef struct let_val { + enum let_val_kind { + PSI_LET_NULL, + PSI_LET_NUMEXP, + PSI_LET_CALLOC, + PSI_LET_FUNC, + PSI_LET_TMP, + } kind; + union { + num_exp *num; + let_calloc *alloc; + let_func *func; + decl_var *var; + } data; + union { + struct { + unsigned is_reference:1; + } one; + unsigned all; + } flags; +} let_val; + +static inline let_val *init_let_val(enum let_val_kind kind, void *data) { + let_val *let = calloc(1, sizeof(*let)); + switch (let->kind = kind) { + case PSI_LET_NULL: + break; + case PSI_LET_NUMEXP: + let->data.num = data; + break; + case PSI_LET_CALLOC: + let->data.alloc = data; + break; + case PSI_LET_FUNC: + let->data.func = data; + break; + case PSI_LET_TMP: + let->data.var = data; + break; + EMPTY_SWITCH_DEFAULT_CASE(); + } + return let; } -static inline void free_let_value(let_value *val) { - if (val->func) { - free_let_func(val->func); - } - if (val->var) { - free_impl_var(val->var); +static inline void free_let_val(let_val *let) { + switch (let->kind) { + case PSI_LET_NULL: + break; + case PSI_LET_NUMEXP: + free_num_exp(let->data.num); + break; + case PSI_LET_CALLOC: + free_let_calloc(let->data.alloc); + break; + case PSI_LET_FUNC: + free_let_func(let->data.func); + break; + case PSI_LET_TMP: + free_decl_var(let->data.var); + break; + EMPTY_SWITCH_DEFAULT_CASE(); } - free(val); + free(let); } typedef struct let_stmt { decl_var *var; - let_value *val; - impl_arg *arg; - impl_val out; + let_val *val; + void *ptr; - void *mem; } let_stmt; -static inline let_stmt *init_let_stmt(decl_var *var, let_value *val) { +static inline let_stmt *init_let_stmt(decl_var *var, let_val *val) { let_stmt *let = calloc(1, sizeof(*let)); let->var = var; let->val = val; @@ -578,19 +767,23 @@ static inline let_stmt *init_let_stmt(decl_var *var, let_value *val) { } static inline void free_let_stmt(let_stmt *stmt) { - free_decl_var(stmt->var); if (stmt->val) { - free_let_value(stmt->val); + if (stmt->val->kind == PSI_LET_TMP && stmt->var->arg) { + free_decl_arg(stmt->var->arg); + } + free_let_val(stmt->val); } + free_decl_var(stmt->var); free(stmt); } struct set_value; typedef struct set_func { + PSI_Token *token; token_t type; char *name; - void (*handler)(zval *, token_t, impl_val *, struct set_value *set, decl_var *); + void (*handler)(zval *, struct set_value *set, impl_val *ret_val); } set_func; static inline set_func *init_set_func(token_t type, const char *name) { @@ -601,6 +794,9 @@ static inline set_func *init_set_func(token_t type, const char *name) { } static inline void free_set_func(set_func *func) { + if (func->token) { + free(func->token); + } free(func->name); free(func); } @@ -608,6 +804,11 @@ static inline void free_set_func(set_func *func) { typedef struct set_value { set_func *func; decl_vars *vars; + num_exp *num; + struct { + struct set_value *set; + impl_val *val; + } outer; struct set_value **inner; size_t count; } set_value; @@ -621,19 +822,27 @@ static inline set_value *init_set_value(set_func *func, decl_vars *vars) { static inline set_value *add_inner_set_value(set_value *val, set_value *inner) { val->inner = realloc(val->inner, ++val->count * sizeof(*val->inner)); val->inner[val->count-1] = inner; + inner->outer.set = val; return val; } static inline void free_set_value(set_value *val) { - free_set_func(val->func); - free_decl_vars(val->vars); - if (val->inner) { + if (val->func) { + free_set_func(val->func); + } + if (val->vars) { + free_decl_vars(val->vars); + } + if (val->inner && (!val->outer.set || val->outer.set->inner != val->inner)) { size_t i; for (i = 0; i < val->count; ++i) { free_set_value(val->inner[i]); } free(val->inner); } + if (val->num) { + free_num_exp(val->num); + } free(val); } @@ -657,6 +866,7 @@ static inline void free_set_stmt(set_stmt *set) { } typedef struct return_stmt { + PSI_Token *token; set_value *set; decl_arg *decl; } return_stmt; @@ -668,25 +878,80 @@ static inline return_stmt *init_return_stmt(set_value *val) { } static inline void free_return_stmt(return_stmt *ret) { - //free_set_func(ret->func); - //free_decl_var(ret->decl); + if (ret->token) { + free(ret->token); + } free_set_value(ret->set); free(ret); } -typedef struct free_stmt { +typedef struct free_call { + PSI_Token *token; + char *func; decl_vars *vars; + decl *decl; +} free_call; + +static inline free_call *init_free_call(const char *func, decl_vars *vars) { + free_call *f = calloc(1, sizeof(*f)); + f->func = strdup(func); + f->vars = vars; + return f; +} + +static inline void free_free_call(free_call *f) { + if (f->token) { + free(f->token); + } + free(f->func); + free_decl_vars(f->vars); + free(f); +} + +typedef struct free_calls { + free_call **list; + size_t count; +} free_calls; + +static inline free_calls *init_free_calls(free_call *f) { + free_calls *fcs = calloc(1, sizeof(*fcs)); + if (f) { + fcs->count = 1; + fcs->list = calloc(1, sizeof(*fcs->list)); + fcs->list[0] = f; + } + return fcs; +} + +static inline void free_free_calls(free_calls *fcs) { + size_t i; + + for (i = 0; i < fcs->count; ++i) { + free_free_call(fcs->list[i]); + } + free(fcs->list); + free(fcs); +} + +static inline free_calls *add_free_call(free_calls *fcs, free_call *f) { + fcs->list = realloc(fcs->list, ++fcs->count * sizeof(*fcs->list)); + fcs->list[fcs->count-1] = f; + return fcs; +} + +typedef struct free_stmt { + free_calls *calls; } free_stmt; -static inline free_stmt *init_free_stmt(decl_vars *vars) { - free_stmt *free_ = calloc(1, sizeof(*free_)); - free_->vars = vars; - return free_; +static inline free_stmt *init_free_stmt(free_calls *calls) { + free_stmt *f = calloc(1, sizeof(*f)); + f->calls = calls; + return f; } -static inline void free_free_stmt(free_stmt *free_) { - free_decl_vars(free_->vars); - free(free_); +static inline void free_free_stmt(free_stmt *f) { + free_free_calls(f->calls); + free(f); } typedef struct impl_stmt { @@ -839,72 +1104,6 @@ static void free_impls(impls *impls) { free(impls); } -typedef struct const_type { - token_t type; - char *name; -} const_type; - -static inline const_type *init_const_type(token_t type, const char *name) { - const_type *ct = calloc(1, sizeof(*ct)); - ct->type = type; - ct->name = strdup(name); - return ct; -} - -static inline void free_const_type(const_type *type) { - free(type->name); - free(type); -} - -typedef struct constant { - const_type *type; - char *name; - impl_def_val *val; -} constant; - -static inline constant *init_constant(const_type *type, const char *name, impl_def_val *val) { - constant *c = calloc(1, sizeof(*c)); - c->type = type; - c->name = strdup(name); - c->val = val; - return c; -} - -static inline void free_constant(constant *constant) { - free_const_type(constant->type); - free(constant->name); - free_impl_def_val(constant->val); - free(constant); -} - -typedef struct constants { - size_t count; - constant **list; -} constants; - -static inline constants *add_constant(constants *constants, constant *constant) { - if (!constants) { - constants = calloc(1, sizeof(*constants)); - } - constants->list = realloc(constants->list, ++constants->count * sizeof(*constants->list)); - constants->list[constants->count-1] = constant; - return constants; -} - -static inline void free_constants(constants *c) { - size_t i; - - for (i = 0; i < c->count; ++i) { - free_constant(c->list[i]); - } - free(c->list); - free(c); -} - -#define PSI_ERROR 16 -#define PSI_WARNING 32 -typedef void (*psi_error_cb)(int type, const char *msg, ...); - typedef struct decl_file { char *ln; char *fn; @@ -943,6 +1142,63 @@ static inline void add_decl_lib(decl_libs *libs, void *dlopened) { libs->dl[libs->count-1] = dlopened; } +static inline impl_val *deref_impl_val(impl_val *ret_val, decl_var *var) { + unsigned i; + + ZEND_ASSERT(var->arg->var != var); +#if 0 + fprintf(stderr, "deref: %s pl=%u:%u as=%u:%u %p\n", + var->name, var->pointer_level, var->arg->var->pointer_level, + var->array_size, var->arg->var->array_size, ret_val); +#endif + for (i = 0; i < var->pointer_level; ++i) { +#if 0 + fprintf(stderr, "-- %p %p %p\n", ret_val, *(void**)ret_val, ret_val->ptr); +#endif + ret_val = *(void **) ret_val; + } + return ret_val; +} + +static inline impl_val *enref_impl_val(void *ptr, decl_var *var) { + impl_val *val, *val_ptr; + unsigned i; + + ZEND_ASSERT(var->arg->var == var); +#if 0 + fprintf(stderr, "enref: %s pl=%u:%u as=%u:%u\n", + var->name, var->pointer_level, var->arg->var->pointer_level, + var->array_size, var->arg->var->array_size); +#endif + if (!var->pointer_level && real_decl_type(var->arg->type)->type != PSI_T_STRUCT) { + return ptr; + } + + val = val_ptr = calloc(var->pointer_level + 1, sizeof(void *)); + for (i = !var->arg->var->array_size; i < var->pointer_level; ++i) { +#if 0 + fprintf(stderr, "++\n"); +#endif + val_ptr->ptr = (void **) val_ptr + 1; + val_ptr = val_ptr->ptr; + } + val_ptr->ptr = ptr; + return val; +} + +static inline impl_val *struct_member_ref(decl_arg *set_arg, impl_val *struct_ptr, impl_val **to_free) { + void *ptr = (char *) struct_ptr + set_arg->layout->pos; +#if 0 + fprintf(stderr, "struct member %s: %p\n", set_arg->var->name, ptr); +#endif + return ptr; +} + + +#define PSI_ERROR 16 +#define PSI_WARNING 32 +typedef void (*psi_error_cb)(PSI_Token *token, int type, const char *msg, ...); + #define PSI_DATA(D) ((PSI_Data *) (D)) #define PSI_DATA_MEMBERS \ constants *consts; \ @@ -990,41 +1246,63 @@ static inline void PSI_DataDtor(PSI_Data *data) { typedef struct PSI_Parser { PSI_DATA_MEMBERS; FILE *fp; - unsigned flags; - unsigned errors; - void *proc; - size_t line; token_t num; + void *proc; + unsigned flags, errors, line, col; char *cur, *tok, *lim, *eof, *ctx, *mrk, buf[BSIZE]; } PSI_Parser; static inline PSI_Token *PSI_TokenAlloc(PSI_Parser *P) { PSI_Token *T; - size_t token_len; + size_t token_len, fname_len; + token_t token_typ; - if (P->cur <= P->tok) { + if (P->cur < P->tok) { return NULL; } + token_typ = P->num; token_len = P->cur - P->tok; + fname_len = strlen(P->psi.file.fn); - T = calloc(1, sizeof(*T) + token_len); - T->type = P->num; - T->line = P->line; + T = calloc(1, sizeof(*T) + token_len + fname_len + sizeof(unsigned) + 2); + T->type = token_typ; T->size = token_len; - T->text[token_len] = 0; + T->text = &T->buf[0]; + T->file = &T->buf[token_len + 1]; + T->line = (void *) &T->buf[fname_len + token_len + 2]; + memcpy(T->text, P->tok, token_len); + memcpy(T->file, P->psi.file.fn, fname_len); + memcpy(T->line, &P->line, sizeof(unsigned)); return T; } +static inline PSI_Token *PSI_TokenCopy(PSI_Token *src) { + size_t fname_len = strlen(src->file); + size_t strct_len = sizeof(*src) + src->size + fname_len + sizeof(unsigned) + 2; + PSI_Token *ptr = malloc(strct_len); + + memcpy(ptr, src, strct_len); + + ptr->text = &ptr->buf[0]; + ptr->file = &ptr->buf[ptr->size + 1]; + + return ptr; +} + +static inline const char *PSI_TokenLocation(PSI_Token *t) { + return t ? t->file : ":0:0"; +} + #define PSI_PARSER_DEBUG 0x1 PSI_Parser *PSI_ParserInit(PSI_Parser *P, const char *filename, psi_error_cb error, unsigned flags); void PSI_ParserSyntaxError(PSI_Parser *P, const char *fn, size_t ln, const char *msg, ...); size_t PSI_ParserFill(PSI_Parser *P, size_t n); token_t PSI_ParserScan(PSI_Parser *P); -void PSI_ParserParse(PSI_Parser *P, PSI_Token *T); +void PSI_ParserParse(PSI_Parser *P, PSI_Token *src); void PSI_ParserDtor(PSI_Parser *P); void PSI_ParserFree(PSI_Parser **P);