// Copyright 2009 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #include #include #include "gg.h" /* * generate: * res = n; * simplifies and calls gmove. */ void cgen(Node *n, Node *res) { Node *nl, *nr, *r; Node n1, n2; int a, f; Prog *p1, *p2, *p3; Addr addr; if(debug['g']) { dump("\ncgen-n", n); dump("cgen-res", res); } if(n == N || n->type == T) goto ret; if(res == N || res->type == T) fatal("cgen: res nil"); while(n->op == OCONVNOP) n = n->left; switch(n->op) { case OSLICE: case OSLICEARR: case OSLICESTR: case OSLICE3: case OSLICE3ARR: if (res->op != ONAME || !res->addable) { tempname(&n1, n->type); cgen_slice(n, &n1); cgen(&n1, res); } else cgen_slice(n, res); goto ret; case OEFACE: if (res->op != ONAME || !res->addable) { tempname(&n1, n->type); cgen_eface(n, &n1); cgen(&n1, res); } else cgen_eface(n, res); goto ret; } if(n->ullman >= UINF) { if(n->op == OINDREG) fatal("cgen: this is going to misscompile"); if(res->ullman >= UINF) { tempname(&n1, n->type); cgen(n, &n1); cgen(&n1, res); goto ret; } } if(isfat(n->type)) { if(n->type->width < 0) fatal("forgot to compute width for %T", n->type); sgen(n, res, n->type->width); goto ret; } if(!res->addable) { if(n->ullman > res->ullman) { regalloc(&n1, n->type, res); cgen(n, &n1); if(n1.ullman > res->ullman) { dump("n1", &n1); dump("res", res); fatal("loop in cgen"); } cgen(&n1, res); regfree(&n1); goto ret; } if(res->ullman >= UINF) goto gen; if(complexop(n, res)) { complexgen(n, res); goto ret; } f = 1; // gen thru register switch(n->op) { case OLITERAL: if(smallintconst(n)) f = 0; break; case OREGISTER: f = 0; break; } if(!iscomplex[n->type->etype]) { a = optoas(OAS, res->type); if(sudoaddable(a, res, &addr)) { if(f) { regalloc(&n2, res->type, N); cgen(n, &n2); p1 = gins(a, &n2, N); regfree(&n2); } else p1 = gins(a, n, N); p1->to = addr; if(debug['g']) print("%P [ignore previous line]\n", p1); sudoclean(); goto ret; } } gen: igen(res, &n1, N); cgen(n, &n1); regfree(&n1); goto ret; } // update addressability for string, slice // can't do in walk because n->left->addable // changes if n->left is an escaping local variable. switch(n->op) { case OSPTR: case OLEN: if(isslice(n->left->type) || istype(n->left->type, TSTRING)) n->addable = n->left->addable; break; case OCAP: if(isslice(n->left->type)) n->addable = n->left->addable; break; case OITAB: n->addable = n->left->addable; break; } if(complexop(n, res)) { complexgen(n, res); goto ret; } if(n->addable) { gmove(n, res); goto ret; } nl = n->left; nr = n->right; if(nl != N && nl->ullman >= UINF) if(nr != N && nr->ullman >= UINF) { tempname(&n1, nl->type); cgen(nl, &n1); n2 = *n; n2.left = &n1; cgen(&n2, res); goto ret; } if(!iscomplex[n->type->etype]) { a = optoas(OAS, n->type); if(sudoaddable(a, n, &addr)) { if(res->op == OREGISTER) { p1 = gins(a, N, res); p1->from = addr; } else { regalloc(&n2, n->type, N); p1 = gins(a, N, &n2); p1->from = addr; gins(a, &n2, res); regfree(&n2); } sudoclean(); goto ret; } } switch(n->op) { default: dump("cgen", n); fatal("cgen: unknown op %+hN", n); break; // these call bgen to get a bool value case OOROR: case OANDAND: case OEQ: case ONE: case OLT: case OLE: case OGE: case OGT: case ONOT: p1 = gbranch(AJMP, T, 0); p2 = pc; gmove(nodbool(1), res); p3 = gbranch(AJMP, T, 0); patch(p1, pc); bgen(n, 1, 0, p2); gmove(nodbool(0), res); patch(p3, pc); goto ret; case OPLUS: cgen(nl, res); goto ret; // unary case OCOM: a = optoas(OXOR, nl->type); regalloc(&n1, nl->type, N); cgen(nl, &n1); nodconst(&n2, nl->type, -1); gins(a, &n2, &n1); gmove(&n1, res); regfree(&n1); goto ret; case OMINUS: if(isfloat[nl->type->etype]) { nr = nodintconst(-1); convlit(&nr, n->type); a = optoas(OMUL, nl->type); goto sbop; } a = optoas(n->op, nl->type); goto uop; // symmetric binary case OAND: case OOR: case OXOR: case OADD: case OMUL: a = optoas(n->op, nl->type); if(a == AIMULB) { cgen_bmul(n->op, nl, nr, res); break; } goto sbop; // asymmetric binary case OSUB: a = optoas(n->op, nl->type); goto abop; case OHMUL: cgen_hmul(nl, nr, res); break; case OCONV: if(n->type->width > nl->type->width) { // If loading from memory, do conversion during load, // so as to avoid use of 8-bit register in, say, int(*byteptr). switch(nl->op) { case ODOT: case ODOTPTR: case OINDEX: case OIND: case ONAME: igen(nl, &n1, res); regalloc(&n2, n->type, res); gmove(&n1, &n2); gmove(&n2, res); regfree(&n2); regfree(&n1); goto ret; } } regalloc(&n1, nl->type, res); regalloc(&n2, n->type, &n1); cgen(nl, &n1); // if we do the conversion n1 -> n2 here // reusing the register, then gmove won't // have to allocate its own register. gmove(&n1, &n2); gmove(&n2, res); regfree(&n2); regfree(&n1); break; case ODOT: case ODOTPTR: case OINDEX: case OIND: case ONAME: // PHEAP or PPARAMREF var igen(n, &n1, res); gmove(&n1, res); regfree(&n1); break; case OITAB: // interface table is first word of interface value igen(nl, &n1, res); n1.type = n->type; gmove(&n1, res); regfree(&n1); break; case OSPTR: // pointer is the first word of string or slice. if(isconst(nl, CTSTR)) { regalloc(&n1, types[tptr], res); p1 = gins(ALEAQ, N, &n1); datastring(nl->val.u.sval->s, nl->val.u.sval->len, &p1->from); gmove(&n1, res); regfree(&n1); break; } igen(nl, &n1, res); n1.type = n->type; gmove(&n1, res); regfree(&n1); break; case OLEN: if(istype(nl->type, TMAP) || istype(nl->type, TCHAN)) { // map and chan have len in the first int-sized word. // a zero pointer means zero length regalloc(&n1, types[tptr], res); cgen(nl, &n1); nodconst(&n2, types[tptr], 0); gins(optoas(OCMP, types[tptr]), &n1, &n2); p1 = gbranch(optoas(OEQ, types[tptr]), T, 0); n2 = n1; n2.op = OINDREG; n2.type = types[simtype[TINT]]; gmove(&n2, &n1); patch(p1, pc); gmove(&n1, res); regfree(&n1); break; } if(istype(nl->type, TSTRING) || isslice(nl->type)) { // both slice and string have len one pointer into the struct. // a zero pointer means zero length igen(nl, &n1, res); n1.type = types[simtype[TUINT]]; n1.xoffset += Array_nel; gmove(&n1, res); regfree(&n1); break; } fatal("cgen: OLEN: unknown type %lT", nl->type); break; case OCAP: if(istype(nl->type, TCHAN)) { // chan has cap in the second int-sized word. // a zero pointer means zero length regalloc(&n1, types[tptr], res); cgen(nl, &n1); nodconst(&n2, types[tptr], 0); gins(optoas(OCMP, types[tptr]), &n1, &n2); p1 = gbranch(optoas(OEQ, types[tptr]), T, 0); n2 = n1; n2.op = OINDREG; n2.xoffset = widthint; n2.type = types[simtype[TINT]]; gmove(&n2, &n1); patch(p1, pc); gmove(&n1, res); regfree(&n1); break; } if(isslice(nl->type)) { igen(nl, &n1, res); n1.type = types[simtype[TUINT]]; n1.xoffset += Array_cap; gmove(&n1, res); regfree(&n1); break; } fatal("cgen: OCAP: unknown type %lT", nl->type); break; case OADDR: if(n->bounded) // let race detector avoid nil checks disable_checknil++; agen(nl, res); if(n->bounded) disable_checknil--; break; case OCALLMETH: cgen_callmeth(n, 0); cgen_callret(n, res); break; case OCALLINTER: cgen_callinter(n, res, 0); cgen_callret(n, res); break; case OCALLFUNC: cgen_call(n, 0); cgen_callret(n, res); break; case OMOD: case ODIV: if(isfloat[n->type->etype]) { a = optoas(n->op, nl->type); goto abop; } if(nl->ullman >= nr->ullman) { regalloc(&n1, nl->type, res); cgen(nl, &n1); cgen_div(n->op, &n1, nr, res); regfree(&n1); } else { if(!smallintconst(nr)) { regalloc(&n2, nr->type, res); cgen(nr, &n2); } else { n2 = *nr; } cgen_div(n->op, nl, &n2, res); if(n2.op != OLITERAL) regfree(&n2); } break; case OLSH: case ORSH: case OLROT: cgen_shift(n->op, n->bounded, nl, nr, res); break; } goto ret; sbop: // symmetric binary /* * put simplest on right - we'll generate into left * and then adjust it using the computation of right. * constants and variables have the same ullman * count, so look for constants specially. * * an integer constant we can use as an immediate * is simpler than a variable - we can use the immediate * in the adjustment instruction directly - so it goes * on the right. * * other constants, like big integers or floating point * constants, require a mov into a register, so those * might as well go on the left, so we can reuse that * register for the computation. */ if(nl->ullman < nr->ullman || (nl->ullman == nr->ullman && (smallintconst(nl) || (nr->op == OLITERAL && !smallintconst(nr))))) { r = nl; nl = nr; nr = r; } abop: // asymmetric binary if(nl->ullman >= nr->ullman) { regalloc(&n1, nl->type, res); cgen(nl, &n1); /* * This generates smaller code - it avoids a MOV - but it's * easily 10% slower due to not being able to * optimize/manipulate the move. * To see, run: go test -bench . crypto/md5 * with and without. * if(sudoaddable(a, nr, &addr)) { p1 = gins(a, N, &n1); p1->from = addr; gmove(&n1, res); sudoclean(); regfree(&n1); goto ret; } * */ if(smallintconst(nr)) n2 = *nr; else { regalloc(&n2, nr->type, N); cgen(nr, &n2); } } else { if(smallintconst(nr)) n2 = *nr; else { regalloc(&n2, nr->type, res); cgen(nr, &n2); } regalloc(&n1, nl->type, N); cgen(nl, &n1); } gins(a, &n2, &n1); gmove(&n1, res); regfree(&n1); if(n2.op != OLITERAL) regfree(&n2); goto ret; uop: // unary regalloc(&n1, nl->type, res); cgen(nl, &n1); gins(a, N, &n1); gmove(&n1, res); regfree(&n1); goto ret; ret: ; } /* * allocate a register (reusing res if possible) and generate * a = n * The caller must call regfree(a). */ void cgenr(Node *n, Node *a, Node *res) { Node n1; if(debug['g']) dump("cgenr-n", n); if(isfat(n->type)) fatal("cgenr on fat node"); if(n->addable) { regalloc(a, n->type, res); gmove(n, a); return; } switch(n->op) { case ONAME: case ODOT: case ODOTPTR: case OINDEX: case OCALLFUNC: case OCALLMETH: case OCALLINTER: igen(n, &n1, res); regalloc(a, types[tptr], &n1); gmove(&n1, a); regfree(&n1); break; default: regalloc(a, n->type, res); cgen(n, a); break; } } /* * allocate a register (reusing res if possible) and generate * a = &n * The caller must call regfree(a). * The generated code checks that the result is not nil. */ void agenr(Node *n, Node *a, Node *res) { Node *nl, *nr; Node n1, n2, n3, n5, tmp, tmp2, nlen; Prog *p1; Type *t; uint64 w; uint64 v; int freelen; if(debug['g']) { dump("\nagenr-n", n); } nl = n->left; nr = n->right; switch(n->op) { case ODOT: case ODOTPTR: case OCALLFUNC: case OCALLMETH: case OCALLINTER: igen(n, &n1, res); regalloc(a, types[tptr], &n1); agen(&n1, a); regfree(&n1); break; case OIND: cgenr(n->left, a, res); cgen_checknil(a); break; case OINDEX: freelen = 0; w = n->type->width; // Generate the non-addressable child first. if(nr->addable) goto irad; if(nl->addable) { cgenr(nr, &n1, N); if(!isconst(nl, CTSTR)) { if(isfixedarray(nl->type)) { agenr(nl, &n3, res); } else { igen(nl, &nlen, res); freelen = 1; nlen.type = types[tptr]; nlen.xoffset += Array_array; regalloc(&n3, types[tptr], res); gmove(&nlen, &n3); nlen.type = types[simtype[TUINT]]; nlen.xoffset += Array_nel-Array_array; } } goto index; } tempname(&tmp, nr->type); cgen(nr, &tmp); nr = &tmp; irad: if(!isconst(nl, CTSTR)) { if(isfixedarray(nl->type)) { agenr(nl, &n3, res); } else { if(!nl->addable) { // igen will need an addressable node. tempname(&tmp2, nl->type); cgen(nl, &tmp2); nl = &tmp2; } igen(nl, &nlen, res); freelen = 1; nlen.type = types[tptr]; nlen.xoffset += Array_array; regalloc(&n3, types[tptr], res); gmove(&nlen, &n3); nlen.type = types[simtype[TUINT]]; nlen.xoffset += Array_nel-Array_array; } } if(!isconst(nr, CTINT)) { cgenr(nr, &n1, N); } goto index; index: // &a is in &n3 (allocated in res) // i is in &n1 (if not constant) // len(a) is in nlen (if needed) // w is width // constant index if(isconst(nr, CTINT)) { if(isconst(nl, CTSTR)) fatal("constant string constant index"); // front end should handle v = mpgetfix(nr->val.u.xval); if(isslice(nl->type) || nl->type->etype == TSTRING) { if(!debug['B'] && !n->bounded) { nodconst(&n2, types[simtype[TUINT]], v); if(smallintconst(nr)) { gins(optoas(OCMP, types[simtype[TUINT]]), &nlen, &n2); } else { regalloc(&tmp, types[simtype[TUINT]], N); gmove(&n2, &tmp); gins(optoas(OCMP, types[simtype[TUINT]]), &nlen, &tmp); regfree(&tmp); } p1 = gbranch(optoas(OGT, types[simtype[TUINT]]), T, +1); ginscall(panicindex, -1); patch(p1, pc); } regfree(&nlen); } if (v*w != 0) ginscon(optoas(OADD, types[tptr]), v*w, &n3); *a = n3; break; } // type of the index t = types[TUINT64]; if(issigned[n1.type->etype]) t = types[TINT64]; regalloc(&n2, t, &n1); // i gmove(&n1, &n2); regfree(&n1); if(!debug['B'] && !n->bounded) { // check bounds t = types[simtype[TUINT]]; if(is64(nr->type)) t = types[TUINT64]; if(isconst(nl, CTSTR)) { nodconst(&nlen, t, nl->val.u.sval->len); } else if(isslice(nl->type) || nl->type->etype == TSTRING) { if(is64(nr->type)) { regalloc(&n5, t, N); gmove(&nlen, &n5); regfree(&nlen); nlen = n5; } } else { nodconst(&nlen, t, nl->type->bound); if(!smallintconst(&nlen)) { regalloc(&n5, t, N); gmove(&nlen, &n5); nlen = n5; freelen = 1; } } gins(optoas(OCMP, t), &n2, &nlen); p1 = gbranch(optoas(OLT, t), T, +1); ginscall(panicindex, -1); patch(p1, pc); } if(isconst(nl, CTSTR)) { regalloc(&n3, types[tptr], res); p1 = gins(ALEAQ, N, &n3); datastring(nl->val.u.sval->s, nl->val.u.sval->len, &p1->from); if(flag_largemodel) { gins(AADDQ, &n2, &n3); } else { p1->from.scale = 1; p1->from.index = n2.val.u.reg; } goto indexdone; } if(w == 0) { // nothing to do } else if(w == 1 || w == 2 || w == 4 || w == 8) { p1 = gins(ALEAQ, &n2, &n3); p1->from.scale = w; p1->from.index = p1->from.type; p1->from.type = p1->to.type + D_INDIR; } else { ginscon(optoas(OMUL, t), w, &n2); gins(optoas(OADD, types[tptr]), &n2, &n3); } indexdone: *a = n3; regfree(&n2); if(freelen) regfree(&nlen); break; default: regalloc(a, types[tptr], res); agen(n, a); break; } } /* * generate: * res = &n; * The generated code checks that the result is not nil. */ void agen(Node *n, Node *res) { Node *nl, *nr; Node n1, n2; if(debug['g']) { dump("\nagen-res", res); dump("agen-r", n); } if(n == N || n->type == T) return; while(n->op == OCONVNOP) n = n->left; if(isconst(n, CTNIL) && n->type->width > widthptr) { // Use of a nil interface or nil slice. // Create a temporary we can take the address of and read. // The generated code is just going to panic, so it need not // be terribly efficient. See issue 3670. tempname(&n1, n->type); clearfat(&n1); regalloc(&n2, types[tptr], res); gins(ALEAQ, &n1, &n2); gmove(&n2, res); regfree(&n2); goto ret; } if(n->addable) { regalloc(&n1, types[tptr], res); gins(ALEAQ, n, &n1); gmove(&n1, res); regfree(&n1); goto ret; } nl = n->left; nr = n->right; USED(nr); switch(n->op) { default: fatal("agen: unknown op %+hN", n); break; case OCALLMETH: cgen_callmeth(n, 0); cgen_aret(n, res); break; case OCALLINTER: cgen_callinter(n, res, 0); cgen_aret(n, res); break; case OCALLFUNC: cgen_call(n, 0); cgen_aret(n, res); break; case OSLICE: case OSLICEARR: case OSLICESTR: case OSLICE3: case OSLICE3ARR: tempname(&n1, n->type); cgen_slice(n, &n1); agen(&n1, res); break; case OEFACE: tempname(&n1, n->type); cgen_eface(n, &n1); agen(&n1, res); break; case OINDEX: agenr(n, &n1, res); gmove(&n1, res); regfree(&n1); break; case ONAME: // should only get here with names in this func. if(n->funcdepth > 0 && n->funcdepth != funcdepth) { dump("bad agen", n); fatal("agen: bad ONAME funcdepth %d != %d", n->funcdepth, funcdepth); } // should only get here for heap vars or paramref if(!(n->class & PHEAP) && n->class != PPARAMREF) { dump("bad agen", n); fatal("agen: bad ONAME class %#x", n->class); } cgen(n->heapaddr, res); if(n->xoffset != 0) ginscon(optoas(OADD, types[tptr]), n->xoffset, res); break; case OIND: cgen(nl, res); cgen_checknil(res); break; case ODOT: agen(nl, res); if(n->xoffset != 0) ginscon(optoas(OADD, types[tptr]), n->xoffset, res); break; case ODOTPTR: cgen(nl, res); cgen_checknil(res); if(n->xoffset != 0) ginscon(optoas(OADD, types[tptr]), n->xoffset, res); break; } ret: ; } /* * generate: * newreg = &n; * res = newreg * * on exit, a has been changed to be *newreg. * caller must regfree(a). * The generated code checks that the result is not *nil. */ void igen(Node *n, Node *a, Node *res) { Type *fp; Iter flist; Node n1; if(debug['g']) { dump("\nigen-n", n); } switch(n->op) { case ONAME: if((n->class&PHEAP) || n->class == PPARAMREF) break; *a = *n; return; case OINDREG: // Increase the refcount of the register so that igen's caller // has to call regfree. if(n->val.u.reg != D_SP) reg[n->val.u.reg]++; *a = *n; return; case ODOT: igen(n->left, a, res); a->xoffset += n->xoffset; a->type = n->type; fixlargeoffset(a); return; case ODOTPTR: cgenr(n->left, a, res); cgen_checknil(a); a->op = OINDREG; a->xoffset += n->xoffset; a->type = n->type; fixlargeoffset(a); return; case OCALLFUNC: case OCALLMETH: case OCALLINTER: switch(n->op) { case OCALLFUNC: cgen_call(n, 0); break; case OCALLMETH: cgen_callmeth(n, 0); break; case OCALLINTER: cgen_callinter(n, N, 0); break; } fp = structfirst(&flist, getoutarg(n->left->type)); memset(a, 0, sizeof *a); a->op = OINDREG; a->val.u.reg = D_SP; a->addable = 1; a->xoffset = fp->width; a->type = n->type; return; case OINDEX: // Index of fixed-size array by constant can // put the offset in the addressing. // Could do the same for slice except that we need // to use the real index for the bounds checking. if(isfixedarray(n->left->type) || (isptr[n->left->type->etype] && isfixedarray(n->left->left->type))) if(isconst(n->right, CTINT)) { // Compute &a. if(!isptr[n->left->type->etype]) igen(n->left, a, res); else { igen(n->left, &n1, res); cgen_checknil(&n1); regalloc(a, types[tptr], res); gmove(&n1, a); regfree(&n1); a->op = OINDREG; } // Compute &a[i] as &a + i*width. a->type = n->type; a->xoffset += mpgetfix(n->right->val.u.xval)*n->type->width; fixlargeoffset(a); return; } break; } agenr(n, a, res); a->op = OINDREG; a->type = n->type; } /* * generate: * if(n == true) goto to; */ void bgen(Node *n, int true, int likely, Prog *to) { int et, a; Node *nl, *nr, *l, *r; Node n1, n2, tmp; NodeList *ll; Prog *p1, *p2; if(debug['g']) { dump("\nbgen", n); } if(n == N) n = nodbool(1); if(n->ninit != nil) genlist(n->ninit); if(n->type == T) { convlit(&n, types[TBOOL]); if(n->type == T) goto ret; } et = n->type->etype; if(et != TBOOL) { yyerror("cgen: bad type %T for %O", n->type, n->op); patch(gins(AEND, N, N), to); goto ret; } nr = N; switch(n->op) { default: def: regalloc(&n1, n->type, N); cgen(n, &n1); nodconst(&n2, n->type, 0); gins(optoas(OCMP, n->type), &n1, &n2); a = AJNE; if(!true) a = AJEQ; patch(gbranch(a, n->type, likely), to); regfree(&n1); goto ret; case OLITERAL: // need to ask if it is bool? if(!true == !n->val.u.bval) patch(gbranch(AJMP, T, likely), to); goto ret; case ONAME: if(n->addable == 0) goto def; nodconst(&n1, n->type, 0); gins(optoas(OCMP, n->type), n, &n1); a = AJNE; if(!true) a = AJEQ; patch(gbranch(a, n->type, likely), to); goto ret; case OANDAND: if(!true) goto caseor; caseand: p1 = gbranch(AJMP, T, 0); p2 = gbranch(AJMP, T, 0); patch(p1, pc); bgen(n->left, !true, -likely, p2); bgen(n->right, !true, -likely, p2); p1 = gbranch(AJMP, T, 0); patch(p1, to); patch(p2, pc); goto ret; case OOROR: if(!true) goto caseand; caseor: bgen(n->left, true, likely, to); bgen(n->right, true, likely, to); goto ret; case OEQ: case ONE: case OLT: case OGT: case OLE: case OGE: nr = n->right; if(nr == N || nr->type == T) goto ret; case ONOT: // unary nl = n->left; if(nl == N || nl->type == T) goto ret; break; } switch(n->op) { case ONOT: bgen(nl, !true, likely, to); goto ret; case OEQ: case ONE: case OLT: case OGT: case OLE: case OGE: a = n->op; if(!true) { if(isfloat[nr->type->etype]) { // brcom is not valid on floats when NaN is involved. p1 = gbranch(AJMP, T, 0); p2 = gbranch(AJMP, T, 0); patch(p1, pc); ll = n->ninit; // avoid re-genning ninit n->ninit = nil; bgen(n, 1, -likely, p2); n->ninit = ll; patch(gbranch(AJMP, T, 0), to); patch(p2, pc); goto ret; } a = brcom(a); true = !true; } // make simplest on right if(nl->op == OLITERAL || (nl->ullman < nr->ullman && nl->ullman < UINF)) { a = brrev(a); r = nl; nl = nr; nr = r; } if(isslice(nl->type)) { // front end should only leave cmp to literal nil if((a != OEQ && a != ONE) || nr->op != OLITERAL) { yyerror("illegal slice comparison"); break; } a = optoas(a, types[tptr]); igen(nl, &n1, N); n1.xoffset += Array_array; n1.type = types[tptr]; nodconst(&tmp, types[tptr], 0); gins(optoas(OCMP, types[tptr]), &n1, &tmp); patch(gbranch(a, types[tptr], likely), to); regfree(&n1); break; } if(isinter(nl->type)) { // front end should only leave cmp to literal nil if((a != OEQ && a != ONE) || nr->op != OLITERAL) { yyerror("illegal interface comparison"); break; } a = optoas(a, types[tptr]); igen(nl, &n1, N); n1.type = types[tptr]; nodconst(&tmp, types[tptr], 0); gins(optoas(OCMP, types[tptr]), &n1, &tmp); patch(gbranch(a, types[tptr], likely), to); regfree(&n1); break; } if(iscomplex[nl->type->etype]) { complexbool(a, nl, nr, true, likely, to); break; } if(nr->ullman >= UINF) { regalloc(&n1, nl->type, N); cgen(nl, &n1); tempname(&tmp, nl->type); gmove(&n1, &tmp); regfree(&n1); regalloc(&n2, nr->type, N); cgen(nr, &n2); regalloc(&n1, nl->type, N); cgen(&tmp, &n1); goto cmp; } regalloc(&n1, nl->type, N); cgen(nl, &n1); if(smallintconst(nr)) { gins(optoas(OCMP, nr->type), &n1, nr); patch(gbranch(optoas(a, nr->type), nr->type, likely), to); regfree(&n1); break; } regalloc(&n2, nr->type, N); cgen(nr, &n2); cmp: // only < and <= work right with NaN; reverse if needed l = &n1; r = &n2; if(isfloat[nl->type->etype] && (a == OGT || a == OGE)) { l = &n2; r = &n1; a = brrev(a); } gins(optoas(OCMP, nr->type), l, r); if(isfloat[nr->type->etype] && (n->op == OEQ || n->op == ONE)) { if(n->op == OEQ) { // neither NE nor P p1 = gbranch(AJNE, T, -likely); p2 = gbranch(AJPS, T, -likely); patch(gbranch(AJMP, T, 0), to); patch(p1, pc); patch(p2, pc); } else { // either NE or P patch(gbranch(AJNE, T, likely), to); patch(gbranch(AJPS, T, likely), to); } } else patch(gbranch(optoas(a, nr->type), nr->type, likely), to); regfree(&n1); regfree(&n2); break; } goto ret; ret: ; } /* * n is on stack, either local variable * or return value from function call. * return n's offset from SP. */ int64 stkof(Node *n) { Type *t; Iter flist; int64 off; switch(n->op) { case OINDREG: return n->xoffset; case ODOT: t = n->left->type; if(isptr[t->etype]) break; off = stkof(n->left); if(off == -1000 || off == 1000) return off; return off + n->xoffset; case OINDEX: t = n->left->type; if(!isfixedarray(t)) break; off = stkof(n->left); if(off == -1000 || off == 1000) return off; if(isconst(n->right, CTINT)) return off + t->type->width * mpgetfix(n->right->val.u.xval); return 1000; case OCALLMETH: case OCALLINTER: case OCALLFUNC: t = n->left->type; if(isptr[t->etype]) t = t->type; t = structfirst(&flist, getoutarg(t)); if(t != T) return t->width; break; } // botch - probably failing to recognize address // arithmetic on the above. eg INDEX and DOT return -1000; } /* * block copy: * memmove(&ns, &n, w); */ void sgen(Node *n, Node *ns, int64 w) { Node nodl, nodr, nodsi, noddi, cx, oldcx, tmp; vlong c, q, odst, osrc; if(debug['g']) { print("\nsgen w=%lld\n", w); dump("r", n); dump("res", ns); } if(n->ullman >= UINF && ns->ullman >= UINF) fatal("sgen UINF"); if(w < 0) fatal("sgen copy %lld", w); // Avoid taking the address for simple enough types. if(componentgen(n, ns)) return; if(w == 0) { // evaluate side effects only regalloc(&nodr, types[tptr], N); agen(ns, &nodr); agen(n, &nodr); regfree(&nodr); return; } // offset on the stack osrc = stkof(n); odst = stkof(ns); if(osrc != -1000 && odst != -1000 && (osrc == 1000 || odst == 1000)) { // osrc and odst both on stack, and at least one is in // an unknown position. Could generate code to test // for forward/backward copy, but instead just copy // to a temporary location first. tempname(&tmp, n->type); sgen(n, &tmp, w); sgen(&tmp, ns, w); return; } if(n->ullman >= ns->ullman) { agenr(n, &nodr, N); agenr(ns, &nodl, N); } else { agenr(ns, &nodl, N); agenr(n, &nodr, N); } nodreg(&noddi, types[tptr], D_DI); nodreg(&nodsi, types[tptr], D_SI); gmove(&nodl, &noddi); gmove(&nodr, &nodsi); regfree(&nodl); regfree(&nodr); c = w % 8; // bytes q = w / 8; // quads savex(D_CX, &cx, &oldcx, N, types[TINT64]); // if we are copying forward on the stack and // the src and dst overlap, then reverse direction if(osrc < odst && odst < osrc+w) { // reverse direction gins(ASTD, N, N); // set direction flag if(c > 0) { gconreg(AADDQ, w-1, D_SI); gconreg(AADDQ, w-1, D_DI); gconreg(AMOVQ, c, D_CX); gins(AREP, N, N); // repeat gins(AMOVSB, N, N); // MOVB *(SI)-,*(DI)- } if(q > 0) { if(c > 0) { gconreg(AADDQ, -7, D_SI); gconreg(AADDQ, -7, D_DI); } else { gconreg(AADDQ, w-8, D_SI); gconreg(AADDQ, w-8, D_DI); } gconreg(AMOVQ, q, D_CX); gins(AREP, N, N); // repeat gins(AMOVSQ, N, N); // MOVQ *(SI)-,*(DI)- } // we leave with the flag clear gins(ACLD, N, N); } else { // normal direction if(q >= 4) { gconreg(AMOVQ, q, D_CX); gins(AREP, N, N); // repeat gins(AMOVSQ, N, N); // MOVQ *(SI)+,*(DI)+ } else while(q > 0) { gins(AMOVSQ, N, N); // MOVQ *(SI)+,*(DI)+ q--; } if(c >= 4) { gins(AMOVSL, N, N); // MOVL *(SI)+,*(DI)+ c -= 4; } while(c > 0) { gins(AMOVSB, N, N); // MOVB *(SI)+,*(DI)+ c--; } } restx(&cx, &oldcx); } static int cadable(Node *n) { if(!n->addable) { // dont know how it happens, // but it does return 0; } switch(n->op) { case ONAME: return 1; } return 0; } /* * copy a composite value by moving its individual components. * Slices, strings and interfaces are supported. * Small structs or arrays with elements of basic type are * also supported. * nr is N when assigning a zero value. * return 1 if can do, 0 if can't. */ int componentgen(Node *nr, Node *nl) { Node nodl, nodr; Type *t; int freel, freer; vlong fldcount; vlong loffset, roffset; freel = 0; freer = 0; switch(nl->type->etype) { default: goto no; case TARRAY: t = nl->type; // Slices are ok. if(isslice(t)) break; // Small arrays are ok. if(t->bound > 0 && t->bound <= 3 && !isfat(t->type)) break; goto no; case TSTRUCT: // Small structs with non-fat types are ok. // Zero-sized structs are treated separately elsewhere. fldcount = 0; for(t=nl->type->type; t; t=t->down) { if(isfat(t->type)) goto no; if(t->etype != TFIELD) fatal("componentgen: not a TFIELD: %lT", t); fldcount++; } if(fldcount == 0 || fldcount > 3) goto no; break; case TSTRING: case TINTER: break; } nodl = *nl; if(!cadable(nl)) { if(nr == N || !cadable(nr)) goto no; igen(nl, &nodl, N); freel = 1; } if(nr != N) { nodr = *nr; if(!cadable(nr)) { igen(nr, &nodr, N); freer = 1; } } switch(nl->type->etype) { case TARRAY: // componentgen for arrays. t = nl->type; if(!isslice(t)) { nodl.type = t->type; nodr.type = nodl.type; for(fldcount=0; fldcount < t->bound; fldcount++) { if(nr == N) clearslim(&nodl); else gmove(&nodr, &nodl); nodl.xoffset += t->type->width; nodr.xoffset += t->type->width; } goto yes; } // componentgen for slices. nodl.xoffset += Array_array; nodl.type = ptrto(nl->type->type); if(nr != N) { nodr.xoffset += Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); nodl.xoffset += Array_nel-Array_array; nodl.type = types[simtype[TUINT]]; if(nr != N) { nodr.xoffset += Array_nel-Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); nodl.xoffset += Array_cap-Array_nel; nodl.type = types[simtype[TUINT]]; if(nr != N) { nodr.xoffset += Array_cap-Array_nel; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); goto yes; case TSTRING: nodl.xoffset += Array_array; nodl.type = ptrto(types[TUINT8]); if(nr != N) { nodr.xoffset += Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); nodl.xoffset += Array_nel-Array_array; nodl.type = types[simtype[TUINT]]; if(nr != N) { nodr.xoffset += Array_nel-Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); goto yes; case TINTER: nodl.xoffset += Array_array; nodl.type = ptrto(types[TUINT8]); if(nr != N) { nodr.xoffset += Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); nodl.xoffset += Array_nel-Array_array; nodl.type = ptrto(types[TUINT8]); if(nr != N) { nodr.xoffset += Array_nel-Array_array; nodr.type = nodl.type; } else nodconst(&nodr, nodl.type, 0); gmove(&nodr, &nodl); goto yes; case TSTRUCT: loffset = nodl.xoffset; roffset = nodr.xoffset; // funarg structs may not begin at offset zero. if(nl->type->etype == TSTRUCT && nl->type->funarg && nl->type->type) loffset -= nl->type->type->width; if(nr != N && nr->type->etype == TSTRUCT && nr->type->funarg && nr->type->type) roffset -= nr->type->type->width; for(t=nl->type->type; t; t=t->down) { nodl.xoffset = loffset + t->width; nodl.type = t->type; if(nr == N) clearslim(&nodl); else { nodr.xoffset = roffset + t->width; nodr.type = nodl.type; gmove(&nodr, &nodl); } } goto yes; } no: if(freer) regfree(&nodr); if(freel) regfree(&nodl); return 0; yes: if(freer) regfree(&nodr); if(freel) regfree(&nodl); return 1; }