ref: bc3a2a3b871d3126de301b51fd58c452c4ef5ead
dir: /parse/specialize.c/
#include <stdlib.h> #include <stdio.h> #include <stdarg.h> #include <inttypes.h> #include <ctype.h> #include <string.h> #include <assert.h> #include <sys/types.h> #include <sys/stat.h> #include <fcntl.h> #include <unistd.h> #include "util.h" #include "parse.h" static Node *specializenode(Node *g, Tysubst *tsmap); Tysubst *mksubst() { Tysubst *subst; subst = zalloc(sizeof(Tysubst)); substpush(subst); return subst; } void substfree(Tysubst *subst) { size_t i; for (i = 0; i < subst->nsubst; i++) htfree(subst->subst[i]); lfree(&subst->subst, &subst->nsubst); } void substpush(Tysubst *subst) { lappend(&subst->subst, &subst->nsubst, mkht(tyhash, tyeq)); } void substpop(Tysubst *subst) { Htab *ht; ht = lpop(&subst->subst, &subst->nsubst); htfree(ht); } void substput(Tysubst *subst, Type *from, Type *to) { htput(subst->subst[subst->nsubst - 1], from, to); } Type *substget(Tysubst *subst, Type *from) { Type *t; size_t i; t = NULL; for (i = subst->nsubst; i > 0; i--) { t = htget(subst->subst[i-1], from); if (t) break; } return t; } void addtraits(Type *t, Bitset *traits) { size_t b; if (traits) for (b = 0; bsiter(traits, &b); b++) settrait(t, traittab[b]); } /* * Duplicates the type 't', with all bound type * parameters substituted with the substitions * described in 'tsmap' * * Returns a fresh type with all unbound type * parameters (type schemes in most literature) * replaced with type variables that we can unify * against */ Type *tyspecialize(Type *orig, Tysubst *tsmap, Htab *delayed, Htab *trbase) { Type *t, *ret, *tmp, *var, *base; Type **arg; size_t i, narg; t = tysearch(orig); tmp = substget(tsmap, t); if (tmp) return tysearch(tmp); arg = NULL; narg = 0; switch (t->type) { case Typaram: ret = mktyvar(t->loc); addtraits(ret, t->traits); substput(tsmap, t, ret); break; case Tygeneric: var = mktyvar(t->loc); substput(tsmap, t, var); if (orig->type == Tyunres) { substpush(tsmap); for (i = 0; i < orig->narg; i++) substput(tsmap, t->gparam[i], orig->arg[i]); } for (i = 0; i < t->ngparam; i++) lappend(&arg, &narg, tyspecialize(t->gparam[i], tsmap, delayed, trbase)); ret = mktyname(t->loc, t->name, tyspecialize(t->sub[0], tsmap, delayed, trbase)); if (orig->type == Tyunres) substpop(tsmap); ret->arg = arg; ret->narg = narg; ret->traits = bsdup(t->traits); tytab[var->tid] = ret; break; case Tyname: if (!hasparams(t)) return t; var = mktyvar(t->loc); substput(tsmap, t, var); for (i = 0; i < t->narg; i++) lappend(&arg, &narg, tyspecialize(t->arg[i], tsmap, delayed, trbase)); ret = mktyname(t->loc, t->name, tyspecialize(t->sub[0], tsmap, delayed, trbase)); ret->traits = bsdup(t->traits); ret->arg = arg; ret->narg = narg; if (trbase && hthas(trbase, orig) && !hthas(trbase, ret)) { base = htget(trbase, orig); htput(trbase, ret, tyspecialize(base, tsmap, delayed, trbase)); } tytab[var->tid] = ret; break; case Tystruct: ret = tydup(t); substput(tsmap, t, ret); pushstab(NULL); for (i = 0; i < t->nmemb; i++) ret->sdecls[i] = specializenode(t->sdecls[i], tsmap); popstab(); break; case Tyunion: ret = tydup(t); substput(tsmap, t, ret); for (i = 0; i < t->nmemb; i++) { tmp = NULL; if (ret->udecls[i]->etype) tmp = tyspecialize(t->udecls[i]->etype, tsmap, delayed, trbase); ret->udecls[i] = mkucon(t->loc, t->udecls[i]->name, ret, tmp); ret->udecls[i]->utype = ret; ret->udecls[i]->id = i; ret->udecls[i]->synth = 1; } break; case Tyvar: ret = t; if (delayed && hthas(delayed, t)) { tmp = htget(delayed, t); htput(delayed, ret, tyspecialize(tmp, tsmap, delayed, trbase)); } break; default: if (t->nsub > 0) { ret = tydup(t); substput(tsmap, t, ret); for (i = 0; i < t->nsub; i++) ret->sub[i] = tyspecialize(t->sub[i], tsmap, delayed, trbase); } else { ret = t; } break; } return ret; } /* Checks if the type 't' is generic, and if it is * substitutes the types. This is here for efficiency, * so we don't gratuitously duplicate types */ static Type *tysubst(Type *t, Tysubst *tsmap) { if (hasparams(t)) return tyspecialize(t, tsmap, NULL, NULL); else return t; } /* * Fills the substitution map with a mapping from * the type parameter 'from' to it's substititon 'to' */ static void fillsubst(Tysubst *tsmap, Type *to, Type *from) { size_t i; if (from->type == Typaram) { if (debugopt['S']) printf("mapping %s => %s\n", tystr(from), tystr(to)); substput(tsmap, from, to); return; } assert(to->nsub == from->nsub); for (i = 0; i < to->nsub; i++) fillsubst(tsmap, to->sub[i], from->sub[i]); if (to->type == Tyname && to->narg > 0) { for (i = 0; i < to->narg; i++) fillsubst(tsmap, to->arg[i], from->arg[i]); } } /* * Fixes up nodes. This involves fixing up the * declaration identifiers once we specialize */ static void fixup(Node *n) { size_t i; Node *d; Stab *ns; if (!n) return; switch (n->type) { case Nfile: case Nuse: die("Node %s not allowed here\n", nodestr[n->type]); break; case Nexpr: fixup(n->expr.idx); for (i = 0; i < n->expr.nargs; i++) fixup(n->expr.args[i]); if (n->expr.op == Ovar) { ns = curstab(); if (n->expr.args[0]->name.ns) ns = getns(file, n->expr.args[0]->name.ns); if (!ns) fatal(n, "No namespace %s\n", n->expr.args[0]->name.ns); d = getdcl(ns, n->expr.args[0]); if (!d) die("Missing decl %s", namestr(n->expr.args[0])); if (d->decl.isgeneric) d = specializedcl(d, n->expr.type, &n->expr.args[0]); n->expr.did = d->decl.did; } break; case Nlit: switch (n->lit.littype) { case Lfunc: fixup(n->lit.fnval); break; case Lvoid: break; case Lchr: break; case Lint: break; case Lflt: break; case Lstr: break; case Llbl: break; case Lbool: break; } break; case Nifstmt: fixup(n->ifstmt.cond); fixup(n->ifstmt.iftrue); fixup(n->ifstmt.iffalse); break; case Nloopstmt: pushstab(n->loopstmt.scope); fixup(n->loopstmt.init); fixup(n->loopstmt.cond); fixup(n->loopstmt.step); fixup(n->loopstmt.body); popstab(); break; case Niterstmt: pushstab(n->iterstmt.body->block.scope); fixup(n->iterstmt.elt); popstab(); fixup(n->iterstmt.seq); fixup(n->iterstmt.body); break; case Nmatchstmt: fixup(n->matchstmt.val); for (i = 0; i < n->matchstmt.nmatches; i++) fixup(n->matchstmt.matches[i]); break; case Nmatch: /* patterns are evaluated in their block's scope */ pushstab(n->match.block->block.scope); fixup(n->match.pat); popstab(); fixup(n->match.block); break; case Nblock: pushstab(n->block.scope); for (i = 0; i < n->block.nstmts; i++) fixup(n->block.stmts[i]); popstab(); break; case Ndecl: fixup(n->decl.init); break; case Nfunc: pushstab(n->func.scope); fixup(n->func.body); popstab(); break; case Nnone: case Nname: break; case Nimpl: die("trait/impl not implemented"); break; } } /* * Duplicates a node, replacing all things that * need to be specialized to make it concrete * instead of generic, and returns it. */ static Node *specializenode(Node *n, Tysubst *tsmap) { Node *r; size_t i; if (!n) return NULL; r = mknode(n->loc, n->type); switch (n->type) { case Nfile: case Nuse: die("Node %s not allowed here\n", nodestr[n->type]); break; case Nexpr: r->expr.op = n->expr.op; r->expr.type = tysubst(n->expr.type, tsmap); r->expr.isconst = n->expr.isconst; r->expr.nargs = n->expr.nargs; r->expr.idx = specializenode(n->expr.idx, tsmap); r->expr.args = xalloc(n->expr.nargs * sizeof(Node *)); for (i = 0; i < n->expr.nargs; i++) r->expr.args[i] = specializenode(n->expr.args[i], tsmap); break; case Nname: if (n->name.ns) r->name.ns = strdup(n->name.ns); r->name.name = strdup(n->name.name); break; case Nlit: r->lit.littype = n->lit.littype; r->lit.type = tysubst(n->expr.type, tsmap); switch (n->lit.littype) { case Lvoid: break; case Lchr: r->lit.chrval = n->lit.chrval; break; case Lint: r->lit.intval = n->lit.intval; break; case Lflt: r->lit.fltval = n->lit.fltval; break; case Lstr: r->lit.strval = n->lit.strval; break; case Llbl: r->lit.lblval = n->lit.lblval; break; case Lbool: r->lit.boolval = n->lit.boolval; break; case Lfunc: r->lit.fnval = specializenode(n->lit.fnval, tsmap); break; } break; case Nifstmt: r->ifstmt.cond = specializenode(n->ifstmt.cond, tsmap); r->ifstmt.iftrue = specializenode(n->ifstmt.iftrue, tsmap); r->ifstmt.iffalse = specializenode(n->ifstmt.iffalse, tsmap); break; case Nloopstmt: r->loopstmt.scope = mkstab(0); r->loopstmt.scope->super = curstab(); pushstab(r->loopstmt.scope); r->loopstmt.init = specializenode(n->loopstmt.init, tsmap); r->loopstmt.cond = specializenode(n->loopstmt.cond, tsmap); r->loopstmt.step = specializenode(n->loopstmt.step, tsmap); r->loopstmt.body = specializenode(n->loopstmt.body, tsmap); popstab(); break; case Niterstmt: r->iterstmt.elt = specializenode(n->iterstmt.elt, tsmap); r->iterstmt.seq = specializenode(n->iterstmt.seq, tsmap); r->iterstmt.body = specializenode(n->iterstmt.body, tsmap); break; case Nmatchstmt: r->matchstmt.val = specializenode(n->matchstmt.val, tsmap); r->matchstmt.nmatches = n->matchstmt.nmatches; r->matchstmt.matches = xalloc(n->matchstmt.nmatches * sizeof(Node *)); for (i = 0; i < n->matchstmt.nmatches; i++) r->matchstmt.matches[i] = specializenode(n->matchstmt.matches[i], tsmap); break; case Nmatch: r->match.pat = specializenode(n->match.pat, tsmap); r->match.block = specializenode(n->match.block, tsmap); break; case Nblock: r->block.scope = mkstab(0); r->block.scope->super = curstab(); pushstab(r->block.scope); r->block.nstmts = n->block.nstmts; r->block.stmts = xalloc(sizeof(Node *) * n->block.nstmts); for (i = 0; i < n->block.nstmts; i++) r->block.stmts[i] = specializenode(n->block.stmts[i], tsmap); popstab(); break; case Ndecl: r->decl.did = ndecls; /* sym */ r->decl.name = specializenode(n->decl.name, tsmap); r->decl.type = tysubst(n->decl.type, tsmap); /* symflags */ r->decl.isconst = n->decl.isconst; r->decl.isgeneric = n->decl.isgeneric; r->decl.isextern = n->decl.isextern; r->decl.isglobl = n->decl.isglobl; if (curstab()) putdcl(curstab(), r); /* init */ r->decl.init = specializenode(n->decl.init, tsmap); lappend(&decls, &ndecls, r); break; case Nfunc: r->func.scope = mkstab(0); r->func.scope->super = curstab(); pushstab(r->func.scope); r->func.type = tysubst(n->func.type, tsmap); r->func.nargs = n->func.nargs; r->func.args = xalloc(sizeof(Node *) * n->func.nargs); for (i = 0; i < n->func.nargs; i++) r->func.args[i] = specializenode(n->func.args[i], tsmap); r->func.body = specializenode(n->func.body, tsmap); popstab(); break; case Nimpl: die("trait/impl not implemented"); break; case Nnone: die("Nnone should not be seen as node type!"); break; } return r; } Node *genericname(Node *n, Type *t) { char buf[1024]; char *p; char *end; Node *name; if (!n->decl.isgeneric) return n->decl.name; p = buf; end = buf + sizeof buf; p += bprintf(p, end - p, "%s", n->decl.name->name.name); p += bprintf(p, end - p, "$"); p += tyidfmt(p, end - p, t); name = mkname(n->loc, buf); if (n->decl.name->name.ns) setns(name, n->decl.name->name.ns); return name; } /* this doesn't walk through named types, so it can't recurse infinitely. */ int matchquality(Type *pat, Type *to) { int match, q; size_t i; Ucon *puc, *tuc; if (pat->type == Typaram) return 0; else if (pat->type != to->type) return -1; match = 0; switch (pat->type) { case Tystruct: if (pat->nmemb != to->nmemb) return -1; for (i = 0; i < pat->nmemb; i++) { if (!streq(declname(pat->sdecls[i]),declname( to->sdecls[i]))) return -1; q = matchquality(decltype(pat->sdecls[i]), decltype(to->sdecls[i])); if (q < 0) return -1; match += q; } break; case Tyunion: if (pat->nmemb != to->nmemb) return -1; for (i = 0; i < pat->nmemb; i++) { if (!nameeq(pat->udecls[i], to->udecls[i])) return -1; puc = pat->udecls[i]; tuc = to->udecls[i]; if (puc->etype && tuc->etype) { q = matchquality(puc->etype, tuc->etype); if (q < 0) return -1; match += q; } else if (puc->etype != tuc->etype) { return -1; } } break; case Tyname: if (!nameeq(pat->name, to->name)) return -1; if (pat->narg != to->narg) return -1; for (i = 0; i < pat->narg; i++) { q = matchquality(pat->arg[i], to->arg[i]); if (q < 0) return -1; match += q; } break; case Tyarray: /* unsized arrays are ok */ if (pat->asize && to->asize) { if (!!litvaleq(pat->asize->expr.args[0], to->asize->expr.args[0])) return -1; } else if (pat->asize != to->asize) { return -1; } else return matchquality(pat->sub[0], to->sub[0]); break; default: if (pat->nsub != to->nsub) break; if (pat->type == to->type) match = 1; for (i = 0; i < pat->nsub; i++) { q = matchquality(pat->sub[i], to->sub[i]); if (q < 0) return -1; match += q; } break; } return match; } Node *bestimpl(Node *n, Type *to) { Node **gimpl, **ambig, *match; size_t ngimpl, nambig, i; int score; int best; if (hthas(n->decl.impls, to)) return htget(n->decl.impls, to); ambig = NULL; match = NULL; nambig = 0; best = -1; gimpl = n->decl.gimpl; ngimpl = n->decl.ngimpl; for (i = 0; i < ngimpl; i++) { score = matchquality(decltype(gimpl[i]), to); if (score > best) { lfree(&ambig, &nambig); best = score; match = gimpl[i]; } else if (score == best) { lappend(&ambig, &nambig, gimpl[i]); } } if (best < 0) return NULL; else if (nambig > 0) fatal(n, "ambiguous implementation for %s", tystr(to)); return match; } /* * Takes a generic declaration, and creates a specialized * duplicate of it with type 'to'. It also generates * a name for this specialized node, and returns it in '*name'. */ Node *specializedcl(Node *gnode, Type *to, Node **name) { extern int stabstkoff; Tysubst *tsmap; Node *g, *d, *n; Stab *st; assert(gnode->type == Ndecl); assert(gnode->decl.isgeneric); n = genericname(gnode, to); *name = n; if (n->name.ns) st = getns(file, n->name.ns); else st = file->file.globls; if (!st) fatal(n, "Can't find symbol table for %s.%s", n->name.ns, n->name.name); d = getdcl(st, n); if (d) return d; if (gnode->decl.trait) { g = bestimpl(gnode, to); if (!g) fatal(gnode, "no trait implemented for for %s:%s", namestr(gnode->decl.name), tystr(to)); } else { g = gnode; } if (debugopt['S']) printf("depth[%d] specializing [%d]%s => %s\n", stabstkoff, g->loc.line, namestr(g->decl.name), namestr(n)); /* namespaced names need to be looked up in their correct * context. */ if (n->name.ns) pushstab(st); /* specialize */ tsmap = mksubst(); fillsubst(tsmap, to, g->decl.type); d = mkdecl(g->loc, n, tysubst(g->decl.type, tsmap)); d->decl.isconst = g->decl.isconst; d->decl.isextern = g->decl.isextern; d->decl.isglobl = g->decl.isglobl; d->decl.init = specializenode(g->decl.init, tsmap); putdcl(st, d); fixup(d); lappend(&file->file.stmts, &file->file.nstmts, d); if (d->decl.name->name.ns) popstab(); substfree(tsmap); return d; } /* * Not really specialization, but close enough. * * Generate an init function that's the equivalent of * this code: * * const __init__ { * file1$myr$__init__ * file2$myr$__init__ * ... * } */ static Node *initdecl(Node *file, Node *name, Type *tyvoidfn) { Node *dcl; dcl = getdcl(file->file.globls, name); if (!dcl) { dcl = mkdecl(Zloc, name, tyvoidfn); dcl->decl.isconst = 1; dcl->decl.isglobl = 1; dcl->decl.isinit = 1; dcl->decl.isextern = 1; dcl->decl.ishidden = 1; putdcl(file->file.globls, dcl); } return dcl; } static void callinit(Node *block, Node *init, Type *tyvoid, Type *tyvoidfn) { Node *call, *var; var = mkexpr(Zloc, Ovar, init->decl.name, NULL); call = mkexpr(Zloc, Ocall, var, NULL); var->expr.type = tyvoidfn; call->expr.type = tyvoid; var->expr.did = init->decl.did; var->expr.isconst = 1; lappend(&block->block.stmts, &block->block.nstmts, call); } void geninit(Node *file) { Node *name, *decl, *func, *block, *init; Type *tyvoid, *tyvoidfn; size_t i; name = mkname(Zloc, "__init__"); decl = mkdecl(Zloc, name, mktyvar(Zloc)); block = mkblock(Zloc, mkstab(0)); block->block.scope->super = file->file.globls; tyvoid = mktype(Zloc, Tyvoid); tyvoidfn = mktyfunc(Zloc, NULL, 0, tyvoid); for (i = 0; i < file->file.ninit; i++) { init = initdecl(file, file->file.init[i], tyvoidfn); callinit(block, init, tyvoid, tyvoidfn); } if (file->file.localinit) callinit(block, file->file.localinit, tyvoid, tyvoidfn); func = mkfunc(Zloc, NULL, 0, mktype(Zloc, Tyvoid), block); func->expr.type = tyvoidfn; init = mkexpr(Zloc, Olit, func, NULL); init->expr.type = tyvoidfn; decl->decl.init = init; decl->decl.isconst = 1; decl->decl.isglobl = 1; decl->decl.type = tyvoidfn; decl->decl.vis = Vishidden; lappend(&file->file.stmts, &file->file.nstmts, decl); }