| 1 | #include "all.h" | 
|---|
| 2 |  | 
|---|
| 3 |  | 
|---|
| 4 | #define CMP(X) \ | 
|---|
| 5 | X(Ciule,      "be") \ | 
|---|
| 6 | X(Ciult,      "b")  \ | 
|---|
| 7 | X(Cisle,      "le") \ | 
|---|
| 8 | X(Cislt,      "l")  \ | 
|---|
| 9 | X(Cisgt,      "g")  \ | 
|---|
| 10 | X(Cisge,      "ge") \ | 
|---|
| 11 | X(Ciugt,      "a")  \ | 
|---|
| 12 | X(Ciuge,      "ae") \ | 
|---|
| 13 | X(Cieq,       "z")  \ | 
|---|
| 14 | X(Cine,       "nz") \ | 
|---|
| 15 | X(NCmpI+Cfle, "be") \ | 
|---|
| 16 | X(NCmpI+Cflt, "b")  \ | 
|---|
| 17 | X(NCmpI+Cfgt, "a")  \ | 
|---|
| 18 | X(NCmpI+Cfge, "ae") \ | 
|---|
| 19 | X(NCmpI+Cfeq, "z")  \ | 
|---|
| 20 | X(NCmpI+Cfne, "nz") \ | 
|---|
| 21 | X(NCmpI+Cfo,  "np") \ | 
|---|
| 22 | X(NCmpI+Cfuo, "p") | 
|---|
| 23 |  | 
|---|
| 24 | enum { | 
|---|
| 25 | SLong = 0, | 
|---|
| 26 | SWord = 1, | 
|---|
| 27 | SShort = 2, | 
|---|
| 28 | SByte = 3, | 
|---|
| 29 |  | 
|---|
| 30 | Ki = -1, /* matches Kw and Kl */ | 
|---|
| 31 | Ka = -2, /* matches all classes */ | 
|---|
| 32 | }; | 
|---|
| 33 |  | 
|---|
| 34 | /* Instruction format strings: | 
|---|
| 35 | * | 
|---|
| 36 | * if the format string starts with -, the instruction | 
|---|
| 37 | * is assumed to be 3-address and is put in 2-address | 
|---|
| 38 | * mode using an extra mov if necessary | 
|---|
| 39 | * | 
|---|
| 40 | * if the format string starts with +, the same as the | 
|---|
| 41 | * above applies, but commutativity is also assumed | 
|---|
| 42 | * | 
|---|
| 43 | * %k  is used to set the class of the instruction, | 
|---|
| 44 | *     it'll expand to "l", "q", "ss", "sd", depending | 
|---|
| 45 | *     on the instruction class | 
|---|
| 46 | * %0  designates the first argument | 
|---|
| 47 | * %1  designates the second argument | 
|---|
| 48 | * %=  designates the result | 
|---|
| 49 | * | 
|---|
| 50 | * if %k is not used, a prefix to 0, 1, or = must be | 
|---|
| 51 | * added, it can be: | 
|---|
| 52 | *   M - memory reference | 
|---|
| 53 | *   L - long  (64 bits) | 
|---|
| 54 | *   W - word  (32 bits) | 
|---|
| 55 | *   H - short (16 bits) | 
|---|
| 56 | *   B - byte  (8 bits) | 
|---|
| 57 | *   S - single precision float | 
|---|
| 58 | *   D - double precision float | 
|---|
| 59 | */ | 
|---|
| 60 | static struct { | 
|---|
| 61 | short op; | 
|---|
| 62 | short cls; | 
|---|
| 63 | char *asm; | 
|---|
| 64 | } omap[] = { | 
|---|
| 65 | { Oadd,    Ka, "+add%k %1, %="}, | 
|---|
| 66 | { Osub,    Ka, "-sub%k %1, %="}, | 
|---|
| 67 | { Oand,    Ki, "+and%k %1, %="}, | 
|---|
| 68 | { Oor,     Ki, "+or%k %1, %="}, | 
|---|
| 69 | { Oxor,    Ki, "+xor%k %1, %="}, | 
|---|
| 70 | { Osar,    Ki, "-sar%k %B1, %="}, | 
|---|
| 71 | { Oshr,    Ki, "-shr%k %B1, %="}, | 
|---|
| 72 | { Oshl,    Ki, "-shl%k %B1, %="}, | 
|---|
| 73 | { Omul,    Ki, "+imul%k %1, %="}, | 
|---|
| 74 | { Omul,    Ks, "+mulss %1, %="}, | 
|---|
| 75 | { Omul,    Kd, "+mulsd %1, %="}, | 
|---|
| 76 | { Odiv,    Ka, "-div%k %1, %="}, | 
|---|
| 77 | { Ostorel, Ka, "movq %L0, %M1"}, | 
|---|
| 78 | { Ostorew, Ka, "movl %W0, %M1"}, | 
|---|
| 79 | { Ostoreh, Ka, "movw %H0, %M1"}, | 
|---|
| 80 | { Ostoreb, Ka, "movb %B0, %M1"}, | 
|---|
| 81 | { Ostores, Ka, "movss %S0, %M1"}, | 
|---|
| 82 | { Ostored, Ka, "movsd %D0, %M1"}, | 
|---|
| 83 | { Oload,   Ka, "mov%k %M0, %="}, | 
|---|
| 84 | { Oloadsw, Kl, "movslq %M0, %L="}, | 
|---|
| 85 | { Oloadsw, Kw, "movl %M0, %W="}, | 
|---|
| 86 | { Oloaduw, Ki, "movl %M0, %W="}, | 
|---|
| 87 | { Oloadsh, Ki, "movsw%k %M0, %="}, | 
|---|
| 88 | { Oloaduh, Ki, "movzw%k %M0, %="}, | 
|---|
| 89 | { Oloadsb, Ki, "movsb%k %M0, %="}, | 
|---|
| 90 | { Oloadub, Ki, "movzb%k %M0, %="}, | 
|---|
| 91 | { Oextsw,  Kl, "movslq %W0, %L="}, | 
|---|
| 92 | { Oextuw,  Kl, "movl %W0, %W="}, | 
|---|
| 93 | { Oextsh,  Ki, "movsw%k %H0, %="}, | 
|---|
| 94 | { Oextuh,  Ki, "movzw%k %H0, %="}, | 
|---|
| 95 | { Oextsb,  Ki, "movsb%k %B0, %="}, | 
|---|
| 96 | { Oextub,  Ki, "movzb%k %B0, %="}, | 
|---|
| 97 |  | 
|---|
| 98 | { Oexts,   Kd, "cvtss2sd %0, %="}, | 
|---|
| 99 | { Otruncd, Ks, "cvtsd2ss %0, %="}, | 
|---|
| 100 | { Ostosi,  Ki, "cvttss2si%k %0, %="}, | 
|---|
| 101 | { Odtosi,  Ki, "cvttsd2si%k %0, %="}, | 
|---|
| 102 | { Oswtof,  Ka, "cvtsi2%k %W0, %="}, | 
|---|
| 103 | { Osltof,  Ka, "cvtsi2%k %L0, %="}, | 
|---|
| 104 | { Ocast,   Ki, "movq %D0, %L="}, | 
|---|
| 105 | { Ocast,   Ka, "movq %L0, %D="}, | 
|---|
| 106 |  | 
|---|
| 107 | { Oaddr,   Ki, "lea%k %M0, %="}, | 
|---|
| 108 | { Oswap,   Ki, "xchg%k %0, %1"}, | 
|---|
| 109 | { Osign,   Kl, "cqto"}, | 
|---|
| 110 | { Osign,   Kw, "cltd"}, | 
|---|
| 111 | { Oxdiv,   Ki, "div%k %0"}, | 
|---|
| 112 | { Oxidiv,  Ki, "idiv%k %0"}, | 
|---|
| 113 | { Oxcmp,   Ks, "ucomiss %S0, %S1"}, | 
|---|
| 114 | { Oxcmp,   Kd, "ucomisd %D0, %D1"}, | 
|---|
| 115 | { Oxcmp,   Ki, "cmp%k %0, %1"}, | 
|---|
| 116 | { Oxtest,  Ki, "test%k %0, %1"}, | 
|---|
| 117 | #define X(c, s) \ | 
|---|
| 118 | { Oflag+c, Ki, "set" s " %B=\n\tmovzb%k %B=, %=" }, | 
|---|
| 119 | CMP(X) | 
|---|
| 120 | #undef X | 
|---|
| 121 | { NOp, 0, 0 } | 
|---|
| 122 | }; | 
|---|
| 123 |  | 
|---|
| 124 | static char *rname[][4] = { | 
|---|
| 125 | [RAX] = { "rax", "eax", "ax", "al"}, | 
|---|
| 126 | [RBX] = { "rbx", "ebx", "bx", "bl"}, | 
|---|
| 127 | [RCX] = { "rcx", "ecx", "cx", "cl"}, | 
|---|
| 128 | [RDX] = { "rdx", "edx", "dx", "dl"}, | 
|---|
| 129 | [RSI] = { "rsi", "esi", "si", "sil"}, | 
|---|
| 130 | [RDI] = { "rdi", "edi", "di", "dil"}, | 
|---|
| 131 | [RBP] = { "rbp", "ebp", "bp", "bpl"}, | 
|---|
| 132 | [RSP] = { "rsp", "esp", "sp", "spl"}, | 
|---|
| 133 | [R8 ] = { "r8", "r8d", "r8w", "r8b"}, | 
|---|
| 134 | [R9 ] = { "r9", "r9d", "r9w", "r9b"}, | 
|---|
| 135 | [R10] = { "r10", "r10d", "r10w", "r10b"}, | 
|---|
| 136 | [R11] = { "r11", "r11d", "r11w", "r11b"}, | 
|---|
| 137 | [R12] = { "r12", "r12d", "r12w", "r12b"}, | 
|---|
| 138 | [R13] = { "r13", "r13d", "r13w", "r13b"}, | 
|---|
| 139 | [R14] = { "r14", "r14d", "r14w", "r14b"}, | 
|---|
| 140 | [R15] = { "r15", "r15d", "r15w", "r15b"}, | 
|---|
| 141 | }; | 
|---|
| 142 |  | 
|---|
| 143 |  | 
|---|
| 144 | static int | 
|---|
| 145 | slot(int s, Fn *fn) | 
|---|
| 146 | { | 
|---|
| 147 | struct { int i:29; } x; | 
|---|
| 148 |  | 
|---|
| 149 | /* sign extend s using a bitfield */ | 
|---|
| 150 | x.i = s; | 
|---|
| 151 | assert(x.i <= fn->slot); | 
|---|
| 152 | /* specific to NAlign == 3 */ | 
|---|
| 153 | if (x.i < 0) | 
|---|
| 154 | return -4 * x.i; | 
|---|
| 155 | else if (fn->vararg) | 
|---|
| 156 | return -176 + -4 * (fn->slot - x.i); | 
|---|
| 157 | else | 
|---|
| 158 | return -4 * (fn->slot - x.i); | 
|---|
| 159 | } | 
|---|
| 160 |  | 
|---|
| 161 | static void | 
|---|
| 162 | emitcon(Con *con, FILE *f) | 
|---|
| 163 | { | 
|---|
| 164 | char *p, *l; | 
|---|
| 165 |  | 
|---|
| 166 | switch (con->type) { | 
|---|
| 167 | case CAddr: | 
|---|
| 168 | l = str(con->label); | 
|---|
| 169 | p = con->local ? gasloc : l[0] == '"' ? "": gassym; | 
|---|
| 170 | fprintf(f, "%s%s", p, l); | 
|---|
| 171 | if (con->bits.i) | 
|---|
| 172 | fprintf(f, "%+"PRId64, con->bits.i); | 
|---|
| 173 | break; | 
|---|
| 174 | case CBits: | 
|---|
| 175 | fprintf(f, "%"PRId64, con->bits.i); | 
|---|
| 176 | break; | 
|---|
| 177 | default: | 
|---|
| 178 | die( "unreachable"); | 
|---|
| 179 | } | 
|---|
| 180 | } | 
|---|
| 181 |  | 
|---|
| 182 | static char * | 
|---|
| 183 | regtoa(int reg, int sz) | 
|---|
| 184 | { | 
|---|
| 185 | static char buf[6]; | 
|---|
| 186 |  | 
|---|
| 187 | assert(reg <= XMM15); | 
|---|
| 188 | if (reg >= XMM0) { | 
|---|
| 189 | sprintf(buf, "xmm%d", reg-XMM0); | 
|---|
| 190 | return buf; | 
|---|
| 191 | } else | 
|---|
| 192 | return rname[reg][sz]; | 
|---|
| 193 | } | 
|---|
| 194 |  | 
|---|
| 195 | static Ref | 
|---|
| 196 | getarg(char c, Ins *i) | 
|---|
| 197 | { | 
|---|
| 198 | switch (c) { | 
|---|
| 199 | case '0': | 
|---|
| 200 | return i->arg[0]; | 
|---|
| 201 | case '1': | 
|---|
| 202 | return i->arg[1]; | 
|---|
| 203 | case '=': | 
|---|
| 204 | return i->to; | 
|---|
| 205 | default: | 
|---|
| 206 | die( "invalid arg letter %c", c); | 
|---|
| 207 | } | 
|---|
| 208 | } | 
|---|
| 209 |  | 
|---|
| 210 | static void emitins(Ins, Fn *, FILE *); | 
|---|
| 211 |  | 
|---|
| 212 | static void | 
|---|
| 213 | emitcopy(Ref r1, Ref r2, int k, Fn *fn, FILE *f) | 
|---|
| 214 | { | 
|---|
| 215 | Ins icp; | 
|---|
| 216 |  | 
|---|
| 217 | icp.op = Ocopy; | 
|---|
| 218 | icp.arg[0] = r2; | 
|---|
| 219 | icp.to = r1; | 
|---|
| 220 | icp.cls = k; | 
|---|
| 221 | emitins(icp, fn, f); | 
|---|
| 222 | } | 
|---|
| 223 |  | 
|---|
| 224 | static void | 
|---|
| 225 | emitf(char *s, Ins *i, Fn *fn, FILE *f) | 
|---|
| 226 | { | 
|---|
| 227 | static char clstoa[][3] = { "l", "q", "ss", "sd"}; | 
|---|
| 228 | char c; | 
|---|
| 229 | int sz; | 
|---|
| 230 | Ref ref; | 
|---|
| 231 | Mem *m; | 
|---|
| 232 | Con off; | 
|---|
| 233 |  | 
|---|
| 234 | switch (*s) { | 
|---|
| 235 | case '+': | 
|---|
| 236 | if (req(i->arg[1], i->to)) { | 
|---|
| 237 | ref = i->arg[0]; | 
|---|
| 238 | i->arg[0] = i->arg[1]; | 
|---|
| 239 | i->arg[1] = ref; | 
|---|
| 240 | } | 
|---|
| 241 | /* fall through */ | 
|---|
| 242 | case '-': | 
|---|
| 243 | assert((!req(i->arg[1], i->to) || req(i->arg[0], i->to)) && | 
|---|
| 244 | "cannot convert to 2-address"); | 
|---|
| 245 | emitcopy(i->to, i->arg[0], i->cls, fn, f); | 
|---|
| 246 | s++; | 
|---|
| 247 | break; | 
|---|
| 248 | } | 
|---|
| 249 |  | 
|---|
| 250 | fputc('\t', f); | 
|---|
| 251 | Next: | 
|---|
| 252 | while ((c = *s++) != '%') | 
|---|
| 253 | if (!c) { | 
|---|
| 254 | fputc('\n', f); | 
|---|
| 255 | return; | 
|---|
| 256 | } else | 
|---|
| 257 | fputc(c, f); | 
|---|
| 258 | switch ((c = *s++)) { | 
|---|
| 259 | case '%': | 
|---|
| 260 | fputc('%', f); | 
|---|
| 261 | break; | 
|---|
| 262 | case 'k': | 
|---|
| 263 | fputs(clstoa[i->cls], f); | 
|---|
| 264 | break; | 
|---|
| 265 | case '0': | 
|---|
| 266 | case '1': | 
|---|
| 267 | case '=': | 
|---|
| 268 | sz = KWIDE(i->cls) ? SLong : SWord; | 
|---|
| 269 | s--; | 
|---|
| 270 | goto Ref; | 
|---|
| 271 | case 'D': | 
|---|
| 272 | case 'S': | 
|---|
| 273 | sz = SLong; /* does not matter for floats */ | 
|---|
| 274 | Ref: | 
|---|
| 275 | c = *s++; | 
|---|
| 276 | ref = getarg(c, i); | 
|---|
| 277 | switch (rtype(ref)) { | 
|---|
| 278 | case RTmp: | 
|---|
| 279 | assert(isreg(ref)); | 
|---|
| 280 | fprintf(f, "%%%s", regtoa(ref.val, sz)); | 
|---|
| 281 | break; | 
|---|
| 282 | case RSlot: | 
|---|
| 283 | fprintf(f, "%d(%%rbp)", slot(ref.val, fn)); | 
|---|
| 284 | break; | 
|---|
| 285 | case RMem: | 
|---|
| 286 | Mem: | 
|---|
| 287 | m = &fn->mem[ref.val]; | 
|---|
| 288 | if (rtype(m->base) == RSlot) { | 
|---|
| 289 | off.type = CBits; | 
|---|
| 290 | off.bits.i = slot(m->base.val, fn); | 
|---|
| 291 | addcon(&m->offset, &off); | 
|---|
| 292 | m->base = TMP(RBP); | 
|---|
| 293 | } | 
|---|
| 294 | if (m->offset.type != CUndef) | 
|---|
| 295 | emitcon(&m->offset, f); | 
|---|
| 296 | fputc('(', f); | 
|---|
| 297 | if (!req(m->base, R)) | 
|---|
| 298 | fprintf(f, "%%%s", regtoa(m->base.val, SLong)); | 
|---|
| 299 | else if (m->offset.type == CAddr) | 
|---|
| 300 | fprintf(f, "%%rip"); | 
|---|
| 301 | if (!req(m->index, R)) | 
|---|
| 302 | fprintf(f, ", %%%s, %d", | 
|---|
| 303 | regtoa(m->index.val, SLong), | 
|---|
| 304 | m->scale | 
|---|
| 305 | ); | 
|---|
| 306 | fputc(')', f); | 
|---|
| 307 | break; | 
|---|
| 308 | case RCon: | 
|---|
| 309 | fputc('$', f); | 
|---|
| 310 | emitcon(&fn->con[ref.val], f); | 
|---|
| 311 | break; | 
|---|
| 312 | default: | 
|---|
| 313 | die( "unreachable"); | 
|---|
| 314 | } | 
|---|
| 315 | break; | 
|---|
| 316 | case 'L': | 
|---|
| 317 | sz = SLong; | 
|---|
| 318 | goto Ref; | 
|---|
| 319 | case 'W': | 
|---|
| 320 | sz = SWord; | 
|---|
| 321 | goto Ref; | 
|---|
| 322 | case 'H': | 
|---|
| 323 | sz = SShort; | 
|---|
| 324 | goto Ref; | 
|---|
| 325 | case 'B': | 
|---|
| 326 | sz = SByte; | 
|---|
| 327 | goto Ref; | 
|---|
| 328 | case 'M': | 
|---|
| 329 | c = *s++; | 
|---|
| 330 | ref = getarg(c, i); | 
|---|
| 331 | switch (rtype(ref)) { | 
|---|
| 332 | case RMem: | 
|---|
| 333 | goto Mem; | 
|---|
| 334 | case RSlot: | 
|---|
| 335 | fprintf(f, "%d(%%rbp)", slot(ref.val, fn)); | 
|---|
| 336 | break; | 
|---|
| 337 | case RCon: | 
|---|
| 338 | off = fn->con[ref.val]; | 
|---|
| 339 | emitcon(&off, f); | 
|---|
| 340 | if (off.type == CAddr) | 
|---|
| 341 | fprintf(f, "(%%rip)"); | 
|---|
| 342 | break; | 
|---|
| 343 | case RTmp: | 
|---|
| 344 | assert(isreg(ref)); | 
|---|
| 345 | fprintf(f, "(%%%s)", regtoa(ref.val, SLong)); | 
|---|
| 346 | break; | 
|---|
| 347 | default: | 
|---|
| 348 | die( "unreachable"); | 
|---|
| 349 | } | 
|---|
| 350 | break; | 
|---|
| 351 | default: | 
|---|
| 352 | die( "invalid format specifier %%%c", c); | 
|---|
| 353 | } | 
|---|
| 354 | goto Next; | 
|---|
| 355 | } | 
|---|
| 356 |  | 
|---|
| 357 | static void *negmask[4] = { | 
|---|
| 358 | [Ks] = (uint32_t[4]){ 0x80000000 }, | 
|---|
| 359 | [Kd] = (uint64_t[2]){ 0x8000000000000000 }, | 
|---|
| 360 | }; | 
|---|
| 361 |  | 
|---|
| 362 | static void | 
|---|
| 363 | emitins(Ins i, Fn *fn, FILE *f) | 
|---|
| 364 | { | 
|---|
| 365 | Ref r; | 
|---|
| 366 | int64_t val; | 
|---|
| 367 | int o, t0; | 
|---|
| 368 | Ins ineg; | 
|---|
| 369 |  | 
|---|
| 370 | switch (i.op) { | 
|---|
| 371 | default: | 
|---|
| 372 | Table: | 
|---|
| 373 | /* most instructions are just pulled out of | 
|---|
| 374 | * the table omap[], some special cases are | 
|---|
| 375 | * detailed below */ | 
|---|
| 376 | for (o=0;; o++) { | 
|---|
| 377 | /* this linear search should really be a binary | 
|---|
| 378 | * search */ | 
|---|
| 379 | if (omap[o].op == NOp) | 
|---|
| 380 | die( "no match for %s(%c)", | 
|---|
| 381 | optab[i.op].name, "wlsd"[i.cls]); | 
|---|
| 382 | if (omap[o].op == i.op) | 
|---|
| 383 | if (omap[o].cls == i.cls | 
|---|
| 384 | || (omap[o].cls == Ki && KBASE(i.cls) == 0) | 
|---|
| 385 | || (omap[o].cls == Ka)) | 
|---|
| 386 | break; | 
|---|
| 387 | } | 
|---|
| 388 | emitf(omap[o].asm, &i, fn, f); | 
|---|
| 389 | break; | 
|---|
| 390 | case Onop: | 
|---|
| 391 | /* just do nothing for nops, they are inserted | 
|---|
| 392 | * by some passes */ | 
|---|
| 393 | break; | 
|---|
| 394 | case Omul: | 
|---|
| 395 | /* here, we try to use the 3-addresss form | 
|---|
| 396 | * of multiplication when possible */ | 
|---|
| 397 | if (rtype(i.arg[1]) == RCon) { | 
|---|
| 398 | r = i.arg[0]; | 
|---|
| 399 | i.arg[0] = i.arg[1]; | 
|---|
| 400 | i.arg[1] = r; | 
|---|
| 401 | } | 
|---|
| 402 | if (KBASE(i.cls) == 0 /* only available for ints */ | 
|---|
| 403 | && rtype(i.arg[0]) == RCon | 
|---|
| 404 | && rtype(i.arg[1]) == RTmp) { | 
|---|
| 405 | emitf( "imul%k %0, %1, %=", &i, fn, f); | 
|---|
| 406 | break; | 
|---|
| 407 | } | 
|---|
| 408 | goto Table; | 
|---|
| 409 | case Osub: | 
|---|
| 410 | /* we have to use the negation trick to handle | 
|---|
| 411 | * some 3-address subtractions */ | 
|---|
| 412 | if (req(i.to, i.arg[1]) && !req(i.arg[0], i.to)) { | 
|---|
| 413 | ineg = (Ins){Oneg, i.cls, i.to, {i.to}}; | 
|---|
| 414 | emitins(ineg, fn, f); | 
|---|
| 415 | emitf( "add%k %0, %=", &i, fn, f); | 
|---|
| 416 | break; | 
|---|
| 417 | } | 
|---|
| 418 | goto Table; | 
|---|
| 419 | case Oneg: | 
|---|
| 420 | if (!req(i.to, i.arg[0])) | 
|---|
| 421 | emitf( "mov%k %0, %=", &i, fn, f); | 
|---|
| 422 | if (KBASE(i.cls) == 0) | 
|---|
| 423 | emitf( "neg%k %=", &i, fn, f); | 
|---|
| 424 | else | 
|---|
| 425 | fprintf(f, | 
|---|
| 426 | "\txorp%c %sfp%d(%%rip), %%%s\n", | 
|---|
| 427 | "xxsd"[i.cls], | 
|---|
| 428 | gasloc, | 
|---|
| 429 | gasstash(negmask[i.cls], 16), | 
|---|
| 430 | regtoa(i.to.val, SLong) | 
|---|
| 431 | ); | 
|---|
| 432 | break; | 
|---|
| 433 | case Odiv: | 
|---|
| 434 | /* use xmm15 to adjust the instruction when the | 
|---|
| 435 | * conversion to 2-address in emitf() would fail */ | 
|---|
| 436 | if (req(i.to, i.arg[1])) { | 
|---|
| 437 | i.arg[1] = TMP(XMM0+15); | 
|---|
| 438 | emitf( "mov%k %=, %1", &i, fn, f); | 
|---|
| 439 | emitf( "mov%k %0, %=", &i, fn, f); | 
|---|
| 440 | i.arg[0] = i.to; | 
|---|
| 441 | } | 
|---|
| 442 | goto Table; | 
|---|
| 443 | case Ocopy: | 
|---|
| 444 | /* copies are used for many things; see my note | 
|---|
| 445 | * to understand how to load big constants: | 
|---|
| 446 | * https://c9x.me/notes/2015-09-19.html */ | 
|---|
| 447 | assert(rtype(i.to) != RMem); | 
|---|
| 448 | if (req(i.to, R) || req(i.arg[0], R)) | 
|---|
| 449 | break; | 
|---|
| 450 | if (req(i.to, i.arg[0])) | 
|---|
| 451 | break; | 
|---|
| 452 | t0 = rtype(i.arg[0]); | 
|---|
| 453 | if (i.cls == Kl | 
|---|
| 454 | && t0 == RCon | 
|---|
| 455 | && fn->con[i.arg[0].val].type == CBits) { | 
|---|
| 456 | val = fn->con[i.arg[0].val].bits.i; | 
|---|
| 457 | if (isreg(i.to)) | 
|---|
| 458 | if (val >= 0 && val <= UINT32_MAX) { | 
|---|
| 459 | emitf( "movl %W0, %W=", &i, fn, f); | 
|---|
| 460 | break; | 
|---|
| 461 | } | 
|---|
| 462 | if (rtype(i.to) == RSlot) | 
|---|
| 463 | if (val < INT32_MIN || val > INT32_MAX) { | 
|---|
| 464 | emitf( "movl %0, %=", &i, fn, f); | 
|---|
| 465 | emitf( "movl %0>>32, 4+%=", &i, fn, f); | 
|---|
| 466 | break; | 
|---|
| 467 | } | 
|---|
| 468 | } | 
|---|
| 469 | if (isreg(i.to) | 
|---|
| 470 | && t0 == RCon | 
|---|
| 471 | && fn->con[i.arg[0].val].type == CAddr) { | 
|---|
| 472 | emitf( "lea%k %M0, %=", &i, fn, f); | 
|---|
| 473 | break; | 
|---|
| 474 | } | 
|---|
| 475 | if (rtype(i.to) == RSlot | 
|---|
| 476 | && (t0 == RSlot || t0 == RMem)) { | 
|---|
| 477 | i.cls = KWIDE(i.cls) ? Kd : Ks; | 
|---|
| 478 | i.arg[1] = TMP(XMM0+15); | 
|---|
| 479 | emitf( "mov%k %0, %1", &i, fn, f); | 
|---|
| 480 | emitf( "mov%k %1, %=", &i, fn, f); | 
|---|
| 481 | break; | 
|---|
| 482 | } | 
|---|
| 483 | /* conveniently, the assembler knows if it | 
|---|
| 484 | * should use movabsq when reading movq */ | 
|---|
| 485 | emitf( "mov%k %0, %=", &i, fn, f); | 
|---|
| 486 | break; | 
|---|
| 487 | case Ocall: | 
|---|
| 488 | /* calls simply have a weird syntax in AT&T | 
|---|
| 489 | * assembly... */ | 
|---|
| 490 | switch (rtype(i.arg[0])) { | 
|---|
| 491 | case RCon: | 
|---|
| 492 | fprintf(f, "\tcallq "); | 
|---|
| 493 | emitcon(&fn->con[i.arg[0].val], f); | 
|---|
| 494 | fprintf(f, "\n"); | 
|---|
| 495 | break; | 
|---|
| 496 | case RTmp: | 
|---|
| 497 | emitf( "callq *%L0", &i, fn, f); | 
|---|
| 498 | break; | 
|---|
| 499 | default: | 
|---|
| 500 | die( "invalid call argument"); | 
|---|
| 501 | } | 
|---|
| 502 | break; | 
|---|
| 503 | case Osalloc: | 
|---|
| 504 | /* there is no good reason why this is here | 
|---|
| 505 | * maybe we should split Osalloc in 2 different | 
|---|
| 506 | * instructions depending on the result | 
|---|
| 507 | */ | 
|---|
| 508 | emitf( "subq %L0, %%rsp", &i, fn, f); | 
|---|
| 509 | if (!req(i.to, R)) | 
|---|
| 510 | emitcopy(i.to, TMP(RSP), Kl, fn, f); | 
|---|
| 511 | break; | 
|---|
| 512 | case Oswap: | 
|---|
| 513 | if (KBASE(i.cls) == 0) | 
|---|
| 514 | goto Table; | 
|---|
| 515 | /* for floats, there is no swap instruction | 
|---|
| 516 | * so we use xmm15 as a temporary | 
|---|
| 517 | */ | 
|---|
| 518 | emitcopy(TMP(XMM0+15), i.arg[0], i.cls, fn, f); | 
|---|
| 519 | emitcopy(i.arg[0], i.arg[1], i.cls, fn, f); | 
|---|
| 520 | emitcopy(i.arg[1], TMP(XMM0+15), i.cls, fn, f); | 
|---|
| 521 | break; | 
|---|
| 522 | } | 
|---|
| 523 | } | 
|---|
| 524 |  | 
|---|
| 525 | static uint64_t | 
|---|
| 526 | framesz(Fn *fn) | 
|---|
| 527 | { | 
|---|
| 528 | uint64_t i, o, f; | 
|---|
| 529 |  | 
|---|
| 530 | /* specific to NAlign == 3 */ | 
|---|
| 531 | for (i=0, o=0; i<NCLR; i++) | 
|---|
| 532 | o ^= 1 & (fn->reg >> amd64_sysv_rclob[i]); | 
|---|
| 533 | f = fn->slot; | 
|---|
| 534 | f = (f + 3) & -4; | 
|---|
| 535 | return 4*f + 8*o + 176*fn->vararg; | 
|---|
| 536 | } | 
|---|
| 537 |  | 
|---|
| 538 | void | 
|---|
| 539 | amd64_emitfn(Fn *fn, FILE *f) | 
|---|
| 540 | { | 
|---|
| 541 | static char *ctoa[] = { | 
|---|
| 542 | #define X(c, s) [c] = s, | 
|---|
| 543 | CMP(X) | 
|---|
| 544 | #undef X | 
|---|
| 545 | }; | 
|---|
| 546 | static int id0; | 
|---|
| 547 | Blk *b, *s; | 
|---|
| 548 | Ins *i, itmp; | 
|---|
| 549 | int *r, c, o, n, lbl; | 
|---|
| 550 | uint64_t fs; | 
|---|
| 551 |  | 
|---|
| 552 | gasemitlnk(fn->name, &fn->lnk, ".text", f); | 
|---|
| 553 | fputs( "\tpushq %rbp\n\tmovq %rsp, %rbp\n", f); | 
|---|
| 554 | fs = framesz(fn); | 
|---|
| 555 | if (fs) | 
|---|
| 556 | fprintf(f, "\tsubq $%"PRIu64 ", %%rsp\n", fs); | 
|---|
| 557 | if (fn->vararg) { | 
|---|
| 558 | o = -176; | 
|---|
| 559 | for (r=amd64_sysv_rsave; r<&amd64_sysv_rsave[6]; r++, o+=8) | 
|---|
| 560 | fprintf(f, "\tmovq %%%s, %d(%%rbp)\n", rname[*r][0], o); | 
|---|
| 561 | for (n=0; n<8; ++n, o+=16) | 
|---|
| 562 | fprintf(f, "\tmovaps %%xmm%d, %d(%%rbp)\n", n, o); | 
|---|
| 563 | } | 
|---|
| 564 | for (r=amd64_sysv_rclob; r<&amd64_sysv_rclob[NCLR]; r++) | 
|---|
| 565 | if (fn->reg & BIT(*r)) { | 
|---|
| 566 | itmp.arg[0] = TMP(*r); | 
|---|
| 567 | emitf( "pushq %L0", &itmp, fn, f); | 
|---|
| 568 | fs += 8; | 
|---|
| 569 | } | 
|---|
| 570 |  | 
|---|
| 571 | for (lbl=0, b=fn->start; b; b=b->link) { | 
|---|
| 572 | if (lbl || b->npred > 1) | 
|---|
| 573 | fprintf(f, "%sbb%d:\n", gasloc, id0+b->id); | 
|---|
| 574 | for (i=b->ins; i!=&b->ins[b->nins]; i++) | 
|---|
| 575 | emitins(*i, fn, f); | 
|---|
| 576 | lbl = 1; | 
|---|
| 577 | switch (b->jmp.type) { | 
|---|
| 578 | case Jret0: | 
|---|
| 579 | if (fn->dynalloc) | 
|---|
| 580 | fprintf(f, | 
|---|
| 581 | "\tmovq %%rbp, %%rsp\n" | 
|---|
| 582 | "\tsubq $%"PRIu64 ", %%rsp\n", | 
|---|
| 583 | fs | 
|---|
| 584 | ); | 
|---|
| 585 | for (r=&amd64_sysv_rclob[NCLR]; r>amd64_sysv_rclob;) | 
|---|
| 586 | if (fn->reg & BIT(*--r)) { | 
|---|
| 587 | itmp.arg[0] = TMP(*r); | 
|---|
| 588 | emitf( "popq %L0", &itmp, fn, f); | 
|---|
| 589 | } | 
|---|
| 590 | fprintf(f, | 
|---|
| 591 | "\tleave\n" | 
|---|
| 592 | "\tret\n" | 
|---|
| 593 | ); | 
|---|
| 594 | break; | 
|---|
| 595 | case Jjmp: | 
|---|
| 596 | Jmp: | 
|---|
| 597 | if (b->s1 != b->link) | 
|---|
| 598 | fprintf(f, "\tjmp %sbb%d\n", | 
|---|
| 599 | gasloc, id0+b->s1->id); | 
|---|
| 600 | else | 
|---|
| 601 | lbl = 0; | 
|---|
| 602 | break; | 
|---|
| 603 | default: | 
|---|
| 604 | c = b->jmp.type - Jjf; | 
|---|
| 605 | if (0 <= c && c <= NCmp) { | 
|---|
| 606 | if (b->link == b->s2) { | 
|---|
| 607 | s = b->s1; | 
|---|
| 608 | b->s1 = b->s2; | 
|---|
| 609 | b->s2 = s; | 
|---|
| 610 | } else | 
|---|
| 611 | c = cmpneg(c); | 
|---|
| 612 | fprintf(f, "\tj%s %sbb%d\n", ctoa[c], | 
|---|
| 613 | gasloc, id0+b->s2->id); | 
|---|
| 614 | goto Jmp; | 
|---|
| 615 | } | 
|---|
| 616 | die( "unhandled jump %d", b->jmp.type); | 
|---|
| 617 | } | 
|---|
| 618 | } | 
|---|
| 619 | id0 += fn->nblk; | 
|---|
| 620 | } | 
|---|
| 621 |  | 
|---|