ref: ac6c06f906d356b0004ed450558dd890c7057fbf
dir: /parse/specialize.c/
#include <stdlib.h> #include <stdio.h> #include <stdarg.h> #include <inttypes.h> #include <ctype.h> #include <string.h> #include <assert.h> #include <sys/types.h> #include <sys/stat.h> #include <fcntl.h> #include <unistd.h> #include "util.h" #include "parse.h" static Node *specializenode(Node *g, Tysubst *tsmap); static void fillsubst(Tysubst *tsmap, Type *to, Type *from); static void substpush(Tysubst *subst) { lappend(&subst->subst, &subst->nsubst, mkht(tyhash, tyeq)); } static void substpop(Tysubst *subst) { Htab *ht; ht = lpop(&subst->subst, &subst->nsubst); htfree(ht); } void substput(Tysubst *subst, Type *from, Type *to) { htput(subst->subst[subst->nsubst - 1], from, to); } Type * substget(Tysubst *subst, Type *from) { Type *t; size_t i; t = NULL; for (i = subst->nsubst; i > 0; i--) { t = htget(subst->subst[i-1], from); if (t) break; } return t; } Tysubst * mksubst(void) { Tysubst *subst; subst = zalloc(sizeof(Tysubst)); substpush(subst); return subst; } void substfree(Tysubst *subst) { size_t i; for (i = 0; i < subst->nsubst; i++) htfree(subst->subst[i]); lfree(&subst->subst, &subst->nsubst); } /* * Duplicates the type 't', with all bound type * parameters substituted with the substition * described in 'tsmap' * * Returns a fresh type with all unbound type * parameters (type schemes in most literature) * replaced with type variables that we can unify * against */ Type * tyspecialize(Type *orig, Tysubst *tsmap, Htab *delayed, Htab *trbase) { Type *t, *ret, *tmp, *var, *base; Traitspec *ts; size_t i, narg; Type **arg; t = tysearch(orig); tmp = substget(tsmap, t); if (tmp) return tysearch(tmp); arg = NULL; narg = 0; switch (t->type) { case Typaram: ret = mktyvar(t->loc); ret->trneed = bsdup(t->trneed); substput(tsmap, t, ret); for (i = 0; i < t->nspec; i++) { ts = zalloc(sizeof(Traitspec)); ts->trait = t->spec[i]->trait; ts->ntrait = t->spec[i]->ntrait; ts->param = tyspecialize(t->spec[i]->param, tsmap, delayed, trbase); if (t->spec[i]->aux) ts->aux = tyspecialize(t->spec[i]->aux, tsmap, delayed, trbase); lappend(&ret->spec, &ret->nspec, ts); } tmp = htget(seqbase, t); if (tmp) { tmp = tyspecialize(tmp, tsmap, delayed, trbase); htput(trbase, ret, tmp); } break; case Tygeneric: var = mktyvar(t->loc); substput(tsmap, t, var); if (orig->type == Tyunres) { substpush(tsmap); for (i = 0; i < orig->narg; i++) substput(tsmap, t->gparam[i], orig->arg[i]); } for (i = 0; i < t->ngparam; i++) lappend(&arg, &narg, tyspecialize(t->gparam[i], tsmap, delayed, trbase)); ret = mktyname(t->loc, t->name, tyspecialize(t->sub[0], tsmap, delayed, trbase)); if (orig->type == Tyunres) substpop(tsmap); ret->arg = arg; ret->narg = narg; tytab[var->tid] = ret; break; case Tyname: if (!hasparams(t)) return t; var = mktyvar(t->loc); substput(tsmap, t, var); for (i = 0; i < t->narg; i++) lappend(&arg, &narg, tyspecialize(t->arg[i], tsmap, delayed, trbase)); ret = mktyname(t->loc, t->name, tyspecialize(t->sub[0], tsmap, delayed, trbase)); ret->arg = arg; ret->narg = narg; if (trbase && hthas(trbase, orig) && !hthas(trbase, ret)) { base = htget(trbase, orig); htput(trbase, ret, tyspecialize(base, tsmap, delayed, trbase)); } tytab[var->tid] = ret; break; case Tystruct: ret = tydup(t); substput(tsmap, t, ret); pushstab(NULL); for (i = 0; i < t->nmemb; i++) ret->sdecls[i] = specializenode(t->sdecls[i], tsmap); popstab(); break; case Tyunion: ret = tydup(t); substput(tsmap, t, ret); for (i = 0; i < t->nmemb; i++) { tmp = NULL; if (ret->udecls[i]->etype) tmp = tyspecialize(t->udecls[i]->etype, tsmap, delayed, trbase); ret->udecls[i] = mkucon(t->loc, t->udecls[i]->name, ret, tmp); ret->udecls[i]->utype = ret; ret->udecls[i]->id = i; ret->udecls[i]->synth = 1; } break; case Tyvar: ret = t; if (delayed && hthas(delayed, t)) { tmp = htget(delayed, t); htput(delayed, ret, tyspecialize(tmp, tsmap, delayed, trbase)); } break; default: if (t->nsub > 0) { ret = tydup(t); substput(tsmap, t, ret); for (i = 0; i < t->nsub; i++) ret->sub[i] = tyspecialize(t->sub[i], tsmap, delayed, trbase); } else { ret = t; } break; } return ret; } /* Checks if the type 't' is generic, and if it i * substitutes the types. This is here for efficiency, * so we don't gratuitously duplicate types */ static Type * tysubst(Type *t, Tysubst *tsmap) { if (hasparams(t)) return tyspecialize(t, tsmap, NULL, NULL); else return t; } static void substputspec(Tysubst *tsmap, Type *from, Type *to) { size_t ai, aj, bi, bj; for (ai = 0; ai < from->nspec; ai++) { for (aj = 0; aj < from->spec[ai]->ntrait; aj++) { for (bi = 0; bi < to->nspec; bi++) { for (bj = 0; bj < to->spec[bi]->ntrait; bj++) { if (nameeq(from->spec[ai]->trait[aj], to->spec[bi]->trait[bj])) fillsubst(tsmap, to->spec[ai]->aux, from->spec[bi]->aux); } } if (nameeq(from->spec[ai]->trait[aj], traittab[Tciter]->name)) if (to->type == Tyslice || to->type == Tyarray) fillsubst(tsmap, to->sub[0], from->spec[ai]->aux); } } } /* * Fills the substitution map with a mapping from * the type parameter 'from' to it's substititon 'to' */ static void fillsubst(Tysubst *tsmap, Type *to, Type *from) { size_t i; if (from->type == Typaram) { if (debugopt['S']) printf("mapping %s => %s\n", tystr(from), tystr(to)); substput(tsmap, from, to); substputspec(tsmap, from, to); return; } assert(to->nsub == from->nsub); for (i = 0; i < to->nsub; i++) fillsubst(tsmap, to->sub[i], from->sub[i]); if (to->type == Tyname && to->narg > 0) { for (i = 0; i < to->narg; i++) fillsubst(tsmap, to->arg[i], from->arg[i]); } } /* * Fixes up nodes. This involves fixing up the * declaration identifiers once we specialize */ static void fixup(Node *n) { size_t i; Node *d; Stab *ns; if (!n) return; switch (n->type) { case Nfile: case Nuse: die("Node %s not allowed here\n", nodestr[n->type]); break; case Nexpr: fixup(n->expr.idx); for (i = 0; i < n->expr.nargs; i++) fixup(n->expr.args[i]); if (n->expr.op == Ovar) { ns = curstab(); if (n->expr.args[0]->name.ns) ns = getns(n->expr.args[0]->name.ns); if (!ns) fatal(n, "No namespace %s\n", n->expr.args[0]->name.ns); d = getdcl(ns, n->expr.args[0]); if (!d) die("Missing decl %s", namestr(n->expr.args[0])); if (d->decl.isgeneric) d = specializedcl(d, n->expr.param, n->expr.type, &n->expr.args[0]); n->expr.did = d->decl.did; } break; case Nlit: switch (n->lit.littype) { case Lfunc: fixup(n->lit.fnval); break; case Lvoid: break; case Lchr: break; case Lint: break; case Lflt: break; case Lstr: break; case Llbl: break; case Lbool: break; } break; case Nifstmt: fixup(n->ifstmt.cond); fixup(n->ifstmt.iftrue); fixup(n->ifstmt.iffalse); break; case Nloopstmt: pushstab(n->loopstmt.scope); fixup(n->loopstmt.init); fixup(n->loopstmt.cond); fixup(n->loopstmt.step); fixup(n->loopstmt.body); popstab(); break; case Niterstmt: pushstab(n->iterstmt.body->block.scope); fixup(n->iterstmt.elt); popstab(); fixup(n->iterstmt.seq); fixup(n->iterstmt.body); break; case Nmatchstmt: fixup(n->matchstmt.val); for (i = 0; i < n->matchstmt.nmatches; i++) fixup(n->matchstmt.matches[i]); break; case Nmatch: /* patterns are evaluated in their block's scope */ pushstab(n->match.block->block.scope); fixup(n->match.pat); popstab(); fixup(n->match.block); break; case Nblock: pushstab(n->block.scope); for (i = 0; i < n->block.nstmts; i++) fixup(n->block.stmts[i]); popstab(); break; case Ndecl: fixup(n->decl.init); break; case Nfunc: pushstab(n->func.scope); fixup(n->func.body); popstab(); break; case Nnone: case Nname: break; case Nimpl: die("trait/impl not implemented"); break; } } /* * Duplicates a node, replacing all things that * need to be specialized to make it concrete * instead of generic, and returns it. */ static Node * specializenode(Node *n, Tysubst *tsmap) { Node *r; size_t i; if (!n) return NULL; r = mknode(n->loc, n->type); switch (n->type) { case Nfile: case Nuse: die("Node %s not allowed here\n", nodestr[n->type]); break; case Nexpr: r->expr.op = n->expr.op; r->expr.type = tysubst(n->expr.type, tsmap); if (n->expr.param) r->expr.param = tysubst(n->expr.param, tsmap); r->expr.isconst = n->expr.isconst; r->expr.nargs = n->expr.nargs; r->expr.idx = specializenode(n->expr.idx, tsmap); r->expr.args = xalloc(n->expr.nargs * sizeof(Node *)); for (i = 0; i < n->expr.nargs; i++) r->expr.args[i] = specializenode(n->expr.args[i], tsmap); break; case Nname: if (n->name.ns) r->name.ns = strdup(n->name.ns); r->name.name = strdup(n->name.name); break; case Nlit: r->lit.littype = n->lit.littype; r->lit.type = tysubst(n->expr.type, tsmap); switch (n->lit.littype) { case Lvoid: break; case Lchr: r->lit.chrval = n->lit.chrval; break; case Lint: r->lit.intval = n->lit.intval; break; case Lflt: r->lit.fltval = n->lit.fltval; break; case Lstr: r->lit.strval = n->lit.strval; break; case Llbl: r->lit.lblval = n->lit.lblval; break; case Lbool: r->lit.boolval = n->lit.boolval; break; case Lfunc: r->lit.fnval = specializenode(n->lit.fnval, tsmap); break; } break; case Nifstmt: r->ifstmt.cond = specializenode(n->ifstmt.cond, tsmap); r->ifstmt.iftrue = specializenode(n->ifstmt.iftrue, tsmap); r->ifstmt.iffalse = specializenode(n->ifstmt.iffalse, tsmap); break; case Nloopstmt: r->loopstmt.scope = mkstab(0); r->loopstmt.scope->super = curstab(); pushstab(r->loopstmt.scope); r->loopstmt.init = specializenode(n->loopstmt.init, tsmap); r->loopstmt.cond = specializenode(n->loopstmt.cond, tsmap); r->loopstmt.step = specializenode(n->loopstmt.step, tsmap); r->loopstmt.body = specializenode(n->loopstmt.body, tsmap); popstab(); break; case Niterstmt: r->iterstmt.elt = specializenode(n->iterstmt.elt, tsmap); r->iterstmt.seq = specializenode(n->iterstmt.seq, tsmap); r->iterstmt.body = specializenode(n->iterstmt.body, tsmap); break; case Nmatchstmt: r->matchstmt.val = specializenode(n->matchstmt.val, tsmap); r->matchstmt.nmatches = n->matchstmt.nmatches; r->matchstmt.matches = xalloc(n->matchstmt.nmatches * sizeof(Node *)); for (i = 0; i < n->matchstmt.nmatches; i++) r->matchstmt.matches[i] = specializenode(n->matchstmt.matches[i], tsmap); break; case Nmatch: r->match.pat = specializenode(n->match.pat, tsmap); r->match.block = specializenode(n->match.block, tsmap); break; case Nblock: r->block.scope = mkstab(0); r->block.scope->super = curstab(); pushstab(r->block.scope); r->block.nstmts = n->block.nstmts; r->block.stmts = xalloc(sizeof(Node *) * n->block.nstmts); for (i = 0; i < n->block.nstmts; i++) r->block.stmts[i] = specializenode(n->block.stmts[i], tsmap); popstab(); break; case Ndecl: r->decl.did = ndecls; /* sym */ r->decl.name = specializenode(n->decl.name, tsmap); r->decl.type = tysubst(n->decl.type, tsmap); /* symflags */ r->decl.isconst = n->decl.isconst; r->decl.isgeneric = n->decl.isgeneric; r->decl.isextern = n->decl.isextern; r->decl.isglobl = n->decl.isglobl; if (curstab()) putdcl(curstab(), r); /* init */ r->decl.init = specializenode(n->decl.init, tsmap); lappend(&decls, &ndecls, r); break; case Nfunc: r->func.scope = mkstab(1); r->func.scope->super = curstab(); pushstab(r->func.scope); r->func.type = tysubst(n->func.type, tsmap); r->func.nargs = n->func.nargs; r->func.args = xalloc(sizeof(Node *) * n->func.nargs); for (i = 0; i < n->func.nargs; i++) r->func.args[i] = specializenode(n->func.args[i], tsmap); r->func.body = specializenode(n->func.body, tsmap); popstab(); break; case Nimpl: die("trait/impl not implemented"); break; case Nnone: die("Nnone should not be seen as node type!"); break; } return r; } Node * genericname(Node *n, Type *param, Type *t) { char buf[1024]; char *p; char *end; Node *name; if (!n->decl.isgeneric) return n->decl.name; p = buf; end = buf + sizeof buf; p += bprintf(p, end - p, "%s", n->decl.name->name.name); if (param) { p += bprintf(p, end - p, "$"); p += tyidfmt(p, end - p, param); } p += bprintf(p, end - p, "$"); p += tyidfmt(p, end - p, t); name = mkname(n->loc, buf); if (n->decl.name->name.ns) setns(name, n->decl.name->name.ns); return name; } static Node * bestimpl(Node *n, Type *to) { Node **gimpl, **ambig, *match; size_t ngimpl, nambig, i; int score; int best; if (hthas(n->decl.impls, to)) return htget(n->decl.impls, to); ambig = NULL; match = NULL; nambig = 0; best = -1; gimpl = n->decl.gimpl; ngimpl = n->decl.ngimpl; for (i = 0; i < ngimpl; i++) { score = tymatchrank(decltype(gimpl[i]), to); if (score > best) { lfree(&ambig, &nambig); best = score; match = gimpl[i]; } else if (score == best) { lappend(&ambig, &nambig, gimpl[i]); } } if (best < 0) return NULL; else if (nambig > 0) fatal(n, "ambiguous implementation for %s", tystr(to)); return match; } /* * Takes a generic declaration, and creates a specialized * duplicate of it with type 'to'. It also generate * a name for this specialized node, and returns it in '*name'. */ Node * specializedcl(Node *gnode, Type *param, Type *to, Node **name) { Tysubst *tsmap; Node *g, *d, *n; Stab *st; assert(gnode->type == Ndecl); assert(gnode->decl.isgeneric); n = genericname(gnode, param, to); *name = n; if (n->name.ns) st = getns(n->name.ns); else st = file->file.globls; if (!st) fatal(n, "Can't find symbol table for %s.%s", n->name.ns, n->name.name); d = getdcl(st, n); if (d) return d; if (gnode->decl.trait) { g = bestimpl(gnode, to); if (!g) fatal(gnode, "type %s does not implement %s:%s", tystr(param), namestr(gnode->decl.name), tystr(to)); } else { g = gnode; } if (debugopt['S']) printf("specializing [%d]%s => %s\n", g->loc.line, namestr(g->decl.name), namestr(n)); /* namespaced names need to be looked up in their correct * context. */ if (n->name.ns) pushstab(st); /* specialize */ tsmap = mksubst(); fillsubst(tsmap, to, g->decl.type); d = mkdecl(g->loc, n, tysubst(g->decl.type, tsmap)); d->decl.isconst = g->decl.isconst; d->decl.isextern = g->decl.isextern; d->decl.isglobl = g->decl.isglobl; d->decl.init = specializenode(g->decl.init, tsmap); putdcl(st, d); fixup(d); lappend(&file->file.stmts, &file->file.nstmts, d); if (d->decl.name->name.ns) popstab(); substfree(tsmap); return d; } /* * Not really specialization, but close enough. * * Generate an init function that's the equivalent of * this code: * * const __init__ { * file1$myr$__init__ * file2$myr$__init__ * ... * } */ static Node * initdecl(Node *file, Node *name, Type *tyvoidfn) { Node *dcl; dcl = getdcl(file->file.globls, name); if (!dcl) { dcl = mkdecl(Zloc, name, tyvoidfn); dcl->decl.isconst = 1; dcl->decl.isglobl = 1; dcl->decl.isinit = 1; dcl->decl.isextern = 1; dcl->decl.ishidden = 1; putdcl(file->file.globls, dcl); } return dcl; } static void callinit(Node *block, Node *init, Type *tyvoid, Type *tyvoidfn) { Node *call, *var; var = mkexpr(Zloc, Ovar, init->decl.name, NULL); call = mkexpr(Zloc, Ocall, var, NULL); var->expr.type = tyvoidfn; call->expr.type = tyvoid; var->expr.did = init->decl.did; var->expr.isconst = 1; lappend(&block->block.stmts, &block->block.nstmts, call); } void geninit(void) { Node *name, *decl, *func, *block, *init; Type *tyvoid, *tyvoidfn; size_t i; name = mkname(Zloc, "__init__"); decl = mkdecl(Zloc, name, mktyvar(Zloc)); block = mkblock(Zloc, mkstab(0)); block->block.scope->super = file->file.globls; tyvoid = mktype(Zloc, Tyvoid); tyvoidfn = mktyfunc(Zloc, NULL, 0, tyvoid); for (i = 0; i < file->file.ninit; i++) { init = initdecl(file, file->file.init[i], tyvoidfn); callinit(block, init, tyvoid, tyvoidfn); } if (file->file.localinit) callinit(block, file->file.localinit, tyvoid, tyvoidfn); func = mkfunc(Zloc, NULL, 0, mktype(Zloc, Tyvoid), block); func->expr.type = tyvoidfn; init = mkexpr(Zloc, Olit, func, NULL); init->expr.type = tyvoidfn; decl->decl.init = init; decl->decl.isconst = 1; decl->decl.isglobl = 1; decl->decl.type = tyvoidfn; decl->decl.vis = Vishidden; lappend(&file->file.stmts, &file->file.nstmts, decl); }