github.com/mdempsky/go@v0.0.0-20151201204031-5dd372bd1e70/src/cmd/compile/internal/ppc64/gsubr.go (about) 1 // Derived from Inferno utils/6c/txt.c 2 // http://code.google.com/p/inferno-os/source/browse/utils/6c/txt.c 3 // 4 // Copyright © 1994-1999 Lucent Technologies Inc. All rights reserved. 5 // Portions Copyright © 1995-1997 C H Forsyth (forsyth@terzarima.net) 6 // Portions Copyright © 1997-1999 Vita Nuova Limited 7 // Portions Copyright © 2000-2007 Vita Nuova Holdings Limited (www.vitanuova.com) 8 // Portions Copyright © 2004,2006 Bruce Ellis 9 // Portions Copyright © 2005-2007 C H Forsyth (forsyth@terzarima.net) 10 // Revisions Copyright © 2000-2007 Lucent Technologies Inc. and others 11 // Portions Copyright © 2009 The Go Authors. All rights reserved. 12 // 13 // Permission is hereby granted, free of charge, to any person obtaining a copy 14 // of this software and associated documentation files (the "Software"), to deal 15 // in the Software without restriction, including without limitation the rights 16 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 17 // copies of the Software, and to permit persons to whom the Software is 18 // furnished to do so, subject to the following conditions: 19 // 20 // The above copyright notice and this permission notice shall be included in 21 // all copies or substantial portions of the Software. 22 // 23 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 24 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 25 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 26 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 27 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 28 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 29 // THE SOFTWARE. 30 31 package ppc64 32 33 import ( 34 "cmd/compile/internal/big" 35 "cmd/compile/internal/gc" 36 "cmd/internal/obj" 37 "cmd/internal/obj/ppc64" 38 "fmt" 39 ) 40 41 var resvd = []int{ 42 ppc64.REGZERO, 43 ppc64.REGSP, // reserved for SP 44 // We need to preserve the C ABI TLS pointer because sigtramp 45 // may happen during C code and needs to access the g. C 46 // clobbers REGG, so if Go were to clobber REGTLS, sigtramp 47 // won't know which convention to use. By preserving REGTLS, 48 // we can just retrieve g from TLS when we aren't sure. 49 ppc64.REGTLS, 50 51 // TODO(austin): Consolidate REGTLS and REGG? 52 ppc64.REGG, 53 ppc64.REGTMP, // REGTMP 54 ppc64.FREGCVI, 55 ppc64.FREGZERO, 56 ppc64.FREGHALF, 57 ppc64.FREGONE, 58 ppc64.FREGTWO, 59 } 60 61 /* 62 * generate 63 * as $c, n 64 */ 65 func ginscon(as int, c int64, n2 *gc.Node) { 66 var n1 gc.Node 67 68 gc.Nodconst(&n1, gc.Types[gc.TINT64], c) 69 70 if as != ppc64.AMOVD && (c < -ppc64.BIG || c > ppc64.BIG) || n2.Op != gc.OREGISTER || as == ppc64.AMULLD { 71 // cannot have more than 16-bit of immediate in ADD, etc. 72 // instead, MOV into register first. 73 var ntmp gc.Node 74 gc.Regalloc(&ntmp, gc.Types[gc.TINT64], nil) 75 76 rawgins(ppc64.AMOVD, &n1, &ntmp) 77 rawgins(as, &ntmp, n2) 78 gc.Regfree(&ntmp) 79 return 80 } 81 82 rawgins(as, &n1, n2) 83 } 84 85 /* 86 * generate 87 * as n, $c (CMP/CMPU) 88 */ 89 func ginscon2(as int, n2 *gc.Node, c int64) { 90 var n1 gc.Node 91 92 gc.Nodconst(&n1, gc.Types[gc.TINT64], c) 93 94 switch as { 95 default: 96 gc.Fatalf("ginscon2") 97 98 case ppc64.ACMP: 99 if -ppc64.BIG <= c && c <= ppc64.BIG { 100 rawgins(as, n2, &n1) 101 return 102 } 103 104 case ppc64.ACMPU: 105 if 0 <= c && c <= 2*ppc64.BIG { 106 rawgins(as, n2, &n1) 107 return 108 } 109 } 110 111 // MOV n1 into register first 112 var ntmp gc.Node 113 gc.Regalloc(&ntmp, gc.Types[gc.TINT64], nil) 114 115 rawgins(ppc64.AMOVD, &n1, &ntmp) 116 rawgins(as, n2, &ntmp) 117 gc.Regfree(&ntmp) 118 } 119 120 func ginscmp(op gc.Op, t *gc.Type, n1, n2 *gc.Node, likely int) *obj.Prog { 121 if gc.Isint[t.Etype] && n1.Op == gc.OLITERAL && n2.Op != gc.OLITERAL { 122 // Reverse comparison to place constant last. 123 op = gc.Brrev(op) 124 n1, n2 = n2, n1 125 } 126 127 var r1, r2, g1, g2 gc.Node 128 gc.Regalloc(&r1, t, n1) 129 gc.Regalloc(&g1, n1.Type, &r1) 130 gc.Cgen(n1, &g1) 131 gmove(&g1, &r1) 132 if gc.Isint[t.Etype] && gc.Isconst(n2, gc.CTINT) { 133 ginscon2(optoas(gc.OCMP, t), &r1, n2.Int()) 134 } else { 135 gc.Regalloc(&r2, t, n2) 136 gc.Regalloc(&g2, n1.Type, &r2) 137 gc.Cgen(n2, &g2) 138 gmove(&g2, &r2) 139 rawgins(optoas(gc.OCMP, t), &r1, &r2) 140 gc.Regfree(&g2) 141 gc.Regfree(&r2) 142 } 143 gc.Regfree(&g1) 144 gc.Regfree(&r1) 145 return gc.Gbranch(optoas(op, t), nil, likely) 146 } 147 148 // set up nodes representing 2^63 149 var ( 150 bigi gc.Node 151 bigf gc.Node 152 bignodes_did bool 153 ) 154 155 func bignodes() { 156 if bignodes_did { 157 return 158 } 159 bignodes_did = true 160 161 var i big.Int 162 i.SetInt64(1) 163 i.Lsh(&i, 63) 164 165 gc.Nodconst(&bigi, gc.Types[gc.TUINT64], 0) 166 bigi.SetBigInt(&i) 167 168 bigi.Convconst(&bigf, gc.Types[gc.TFLOAT64]) 169 } 170 171 /* 172 * generate move: 173 * t = f 174 * hard part is conversions. 175 */ 176 func gmove(f *gc.Node, t *gc.Node) { 177 if gc.Debug['M'] != 0 { 178 fmt.Printf("gmove %v -> %v\n", gc.Nconv(f, obj.FmtLong), gc.Nconv(t, obj.FmtLong)) 179 } 180 181 ft := int(gc.Simsimtype(f.Type)) 182 tt := int(gc.Simsimtype(t.Type)) 183 cvt := (*gc.Type)(t.Type) 184 185 if gc.Iscomplex[ft] || gc.Iscomplex[tt] { 186 gc.Complexmove(f, t) 187 return 188 } 189 190 // cannot have two memory operands 191 var r2 gc.Node 192 var r1 gc.Node 193 var a int 194 if gc.Ismem(f) && gc.Ismem(t) { 195 goto hard 196 } 197 198 // convert constant to desired type 199 if f.Op == gc.OLITERAL { 200 var con gc.Node 201 switch tt { 202 default: 203 f.Convconst(&con, t.Type) 204 205 case gc.TINT32, 206 gc.TINT16, 207 gc.TINT8: 208 var con gc.Node 209 f.Convconst(&con, gc.Types[gc.TINT64]) 210 var r1 gc.Node 211 gc.Regalloc(&r1, con.Type, t) 212 gins(ppc64.AMOVD, &con, &r1) 213 gmove(&r1, t) 214 gc.Regfree(&r1) 215 return 216 217 case gc.TUINT32, 218 gc.TUINT16, 219 gc.TUINT8: 220 var con gc.Node 221 f.Convconst(&con, gc.Types[gc.TUINT64]) 222 var r1 gc.Node 223 gc.Regalloc(&r1, con.Type, t) 224 gins(ppc64.AMOVD, &con, &r1) 225 gmove(&r1, t) 226 gc.Regfree(&r1) 227 return 228 } 229 230 f = &con 231 ft = tt // so big switch will choose a simple mov 232 233 // constants can't move directly to memory. 234 if gc.Ismem(t) { 235 goto hard 236 } 237 } 238 239 // float constants come from memory. 240 //if(isfloat[tt]) 241 // goto hard; 242 243 // 64-bit immediates are also from memory. 244 //if(isint[tt]) 245 // goto hard; 246 //// 64-bit immediates are really 32-bit sign-extended 247 //// unless moving into a register. 248 //if(isint[tt]) { 249 // if(mpcmpfixfix(con.val.u.xval, minintval[TINT32]) < 0) 250 // goto hard; 251 // if(mpcmpfixfix(con.val.u.xval, maxintval[TINT32]) > 0) 252 // goto hard; 253 //} 254 255 // value -> value copy, only one memory operand. 256 // figure out the instruction to use. 257 // break out of switch for one-instruction gins. 258 // goto rdst for "destination must be register". 259 // goto hard for "convert to cvt type first". 260 // otherwise handle and return. 261 262 switch uint32(ft)<<16 | uint32(tt) { 263 default: 264 gc.Fatalf("gmove %v -> %v", gc.Tconv(f.Type, obj.FmtLong), gc.Tconv(t.Type, obj.FmtLong)) 265 266 /* 267 * integer copy and truncate 268 */ 269 case gc.TINT8<<16 | gc.TINT8, // same size 270 gc.TUINT8<<16 | gc.TINT8, 271 gc.TINT16<<16 | gc.TINT8, 272 // truncate 273 gc.TUINT16<<16 | gc.TINT8, 274 gc.TINT32<<16 | gc.TINT8, 275 gc.TUINT32<<16 | gc.TINT8, 276 gc.TINT64<<16 | gc.TINT8, 277 gc.TUINT64<<16 | gc.TINT8: 278 a = ppc64.AMOVB 279 280 case gc.TINT8<<16 | gc.TUINT8, // same size 281 gc.TUINT8<<16 | gc.TUINT8, 282 gc.TINT16<<16 | gc.TUINT8, 283 // truncate 284 gc.TUINT16<<16 | gc.TUINT8, 285 gc.TINT32<<16 | gc.TUINT8, 286 gc.TUINT32<<16 | gc.TUINT8, 287 gc.TINT64<<16 | gc.TUINT8, 288 gc.TUINT64<<16 | gc.TUINT8: 289 a = ppc64.AMOVBZ 290 291 case gc.TINT16<<16 | gc.TINT16, // same size 292 gc.TUINT16<<16 | gc.TINT16, 293 gc.TINT32<<16 | gc.TINT16, 294 // truncate 295 gc.TUINT32<<16 | gc.TINT16, 296 gc.TINT64<<16 | gc.TINT16, 297 gc.TUINT64<<16 | gc.TINT16: 298 a = ppc64.AMOVH 299 300 case gc.TINT16<<16 | gc.TUINT16, // same size 301 gc.TUINT16<<16 | gc.TUINT16, 302 gc.TINT32<<16 | gc.TUINT16, 303 // truncate 304 gc.TUINT32<<16 | gc.TUINT16, 305 gc.TINT64<<16 | gc.TUINT16, 306 gc.TUINT64<<16 | gc.TUINT16: 307 a = ppc64.AMOVHZ 308 309 case gc.TINT32<<16 | gc.TINT32, // same size 310 gc.TUINT32<<16 | gc.TINT32, 311 gc.TINT64<<16 | gc.TINT32, 312 // truncate 313 gc.TUINT64<<16 | gc.TINT32: 314 a = ppc64.AMOVW 315 316 case gc.TINT32<<16 | gc.TUINT32, // same size 317 gc.TUINT32<<16 | gc.TUINT32, 318 gc.TINT64<<16 | gc.TUINT32, 319 gc.TUINT64<<16 | gc.TUINT32: 320 a = ppc64.AMOVWZ 321 322 case gc.TINT64<<16 | gc.TINT64, // same size 323 gc.TINT64<<16 | gc.TUINT64, 324 gc.TUINT64<<16 | gc.TINT64, 325 gc.TUINT64<<16 | gc.TUINT64: 326 a = ppc64.AMOVD 327 328 /* 329 * integer up-conversions 330 */ 331 case gc.TINT8<<16 | gc.TINT16, // sign extend int8 332 gc.TINT8<<16 | gc.TUINT16, 333 gc.TINT8<<16 | gc.TINT32, 334 gc.TINT8<<16 | gc.TUINT32, 335 gc.TINT8<<16 | gc.TINT64, 336 gc.TINT8<<16 | gc.TUINT64: 337 a = ppc64.AMOVB 338 339 goto rdst 340 341 case gc.TUINT8<<16 | gc.TINT16, // zero extend uint8 342 gc.TUINT8<<16 | gc.TUINT16, 343 gc.TUINT8<<16 | gc.TINT32, 344 gc.TUINT8<<16 | gc.TUINT32, 345 gc.TUINT8<<16 | gc.TINT64, 346 gc.TUINT8<<16 | gc.TUINT64: 347 a = ppc64.AMOVBZ 348 349 goto rdst 350 351 case gc.TINT16<<16 | gc.TINT32, // sign extend int16 352 gc.TINT16<<16 | gc.TUINT32, 353 gc.TINT16<<16 | gc.TINT64, 354 gc.TINT16<<16 | gc.TUINT64: 355 a = ppc64.AMOVH 356 357 goto rdst 358 359 case gc.TUINT16<<16 | gc.TINT32, // zero extend uint16 360 gc.TUINT16<<16 | gc.TUINT32, 361 gc.TUINT16<<16 | gc.TINT64, 362 gc.TUINT16<<16 | gc.TUINT64: 363 a = ppc64.AMOVHZ 364 365 goto rdst 366 367 case gc.TINT32<<16 | gc.TINT64, // sign extend int32 368 gc.TINT32<<16 | gc.TUINT64: 369 a = ppc64.AMOVW 370 371 goto rdst 372 373 case gc.TUINT32<<16 | gc.TINT64, // zero extend uint32 374 gc.TUINT32<<16 | gc.TUINT64: 375 a = ppc64.AMOVWZ 376 377 goto rdst 378 379 //warn("gmove: convert float to int not implemented: %N -> %N\n", f, t); 380 //return; 381 // algorithm is: 382 // if small enough, use native float64 -> int64 conversion. 383 // otherwise, subtract 2^63, convert, and add it back. 384 /* 385 * float to integer 386 */ 387 case gc.TFLOAT32<<16 | gc.TINT32, 388 gc.TFLOAT64<<16 | gc.TINT32, 389 gc.TFLOAT32<<16 | gc.TINT64, 390 gc.TFLOAT64<<16 | gc.TINT64, 391 gc.TFLOAT32<<16 | gc.TINT16, 392 gc.TFLOAT32<<16 | gc.TINT8, 393 gc.TFLOAT32<<16 | gc.TUINT16, 394 gc.TFLOAT32<<16 | gc.TUINT8, 395 gc.TFLOAT64<<16 | gc.TINT16, 396 gc.TFLOAT64<<16 | gc.TINT8, 397 gc.TFLOAT64<<16 | gc.TUINT16, 398 gc.TFLOAT64<<16 | gc.TUINT8, 399 gc.TFLOAT32<<16 | gc.TUINT32, 400 gc.TFLOAT64<<16 | gc.TUINT32, 401 gc.TFLOAT32<<16 | gc.TUINT64, 402 gc.TFLOAT64<<16 | gc.TUINT64: 403 bignodes() 404 405 var r1 gc.Node 406 gc.Regalloc(&r1, gc.Types[ft], f) 407 gmove(f, &r1) 408 if tt == gc.TUINT64 { 409 gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], nil) 410 gmove(&bigf, &r2) 411 gins(ppc64.AFCMPU, &r1, &r2) 412 p1 := (*obj.Prog)(gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TFLOAT64]), nil, +1)) 413 gins(ppc64.AFSUB, &r2, &r1) 414 gc.Patch(p1, gc.Pc) 415 gc.Regfree(&r2) 416 } 417 418 gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], nil) 419 var r3 gc.Node 420 gc.Regalloc(&r3, gc.Types[gc.TINT64], t) 421 gins(ppc64.AFCTIDZ, &r1, &r2) 422 p1 := (*obj.Prog)(gins(ppc64.AFMOVD, &r2, nil)) 423 p1.To.Type = obj.TYPE_MEM 424 p1.To.Reg = ppc64.REGSP 425 p1.To.Offset = -8 426 p1 = gins(ppc64.AMOVD, nil, &r3) 427 p1.From.Type = obj.TYPE_MEM 428 p1.From.Reg = ppc64.REGSP 429 p1.From.Offset = -8 430 gc.Regfree(&r2) 431 gc.Regfree(&r1) 432 if tt == gc.TUINT64 { 433 p1 := (*obj.Prog)(gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TFLOAT64]), nil, +1)) // use CR0 here again 434 gc.Nodreg(&r1, gc.Types[gc.TINT64], ppc64.REGTMP) 435 gins(ppc64.AMOVD, &bigi, &r1) 436 gins(ppc64.AADD, &r1, &r3) 437 gc.Patch(p1, gc.Pc) 438 } 439 440 gmove(&r3, t) 441 gc.Regfree(&r3) 442 return 443 444 //warn("gmove: convert int to float not implemented: %N -> %N\n", f, t); 445 //return; 446 // algorithm is: 447 // if small enough, use native int64 -> uint64 conversion. 448 // otherwise, halve (rounding to odd?), convert, and double. 449 /* 450 * integer to float 451 */ 452 case gc.TINT32<<16 | gc.TFLOAT32, 453 gc.TINT32<<16 | gc.TFLOAT64, 454 gc.TINT64<<16 | gc.TFLOAT32, 455 gc.TINT64<<16 | gc.TFLOAT64, 456 gc.TINT16<<16 | gc.TFLOAT32, 457 gc.TINT16<<16 | gc.TFLOAT64, 458 gc.TINT8<<16 | gc.TFLOAT32, 459 gc.TINT8<<16 | gc.TFLOAT64, 460 gc.TUINT16<<16 | gc.TFLOAT32, 461 gc.TUINT16<<16 | gc.TFLOAT64, 462 gc.TUINT8<<16 | gc.TFLOAT32, 463 gc.TUINT8<<16 | gc.TFLOAT64, 464 gc.TUINT32<<16 | gc.TFLOAT32, 465 gc.TUINT32<<16 | gc.TFLOAT64, 466 gc.TUINT64<<16 | gc.TFLOAT32, 467 gc.TUINT64<<16 | gc.TFLOAT64: 468 bignodes() 469 470 var r1 gc.Node 471 gc.Regalloc(&r1, gc.Types[gc.TINT64], nil) 472 gmove(f, &r1) 473 if ft == gc.TUINT64 { 474 gc.Nodreg(&r2, gc.Types[gc.TUINT64], ppc64.REGTMP) 475 gmove(&bigi, &r2) 476 gins(ppc64.ACMPU, &r1, &r2) 477 p1 := (*obj.Prog)(gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TUINT64]), nil, +1)) 478 p2 := (*obj.Prog)(gins(ppc64.ASRD, nil, &r1)) 479 p2.From.Type = obj.TYPE_CONST 480 p2.From.Offset = 1 481 gc.Patch(p1, gc.Pc) 482 } 483 484 gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], t) 485 p1 := (*obj.Prog)(gins(ppc64.AMOVD, &r1, nil)) 486 p1.To.Type = obj.TYPE_MEM 487 p1.To.Reg = ppc64.REGSP 488 p1.To.Offset = -8 489 p1 = gins(ppc64.AFMOVD, nil, &r2) 490 p1.From.Type = obj.TYPE_MEM 491 p1.From.Reg = ppc64.REGSP 492 p1.From.Offset = -8 493 gins(ppc64.AFCFID, &r2, &r2) 494 gc.Regfree(&r1) 495 if ft == gc.TUINT64 { 496 p1 := (*obj.Prog)(gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TUINT64]), nil, +1)) // use CR0 here again 497 gc.Nodreg(&r1, gc.Types[gc.TFLOAT64], ppc64.FREGTWO) 498 gins(ppc64.AFMUL, &r1, &r2) 499 gc.Patch(p1, gc.Pc) 500 } 501 502 gmove(&r2, t) 503 gc.Regfree(&r2) 504 return 505 506 /* 507 * float to float 508 */ 509 case gc.TFLOAT32<<16 | gc.TFLOAT32: 510 a = ppc64.AFMOVS 511 512 case gc.TFLOAT64<<16 | gc.TFLOAT64: 513 a = ppc64.AFMOVD 514 515 case gc.TFLOAT32<<16 | gc.TFLOAT64: 516 a = ppc64.AFMOVS 517 goto rdst 518 519 case gc.TFLOAT64<<16 | gc.TFLOAT32: 520 a = ppc64.AFRSP 521 goto rdst 522 } 523 524 gins(a, f, t) 525 return 526 527 // requires register destination 528 rdst: 529 { 530 gc.Regalloc(&r1, t.Type, t) 531 532 gins(a, f, &r1) 533 gmove(&r1, t) 534 gc.Regfree(&r1) 535 return 536 } 537 538 // requires register intermediate 539 hard: 540 gc.Regalloc(&r1, cvt, t) 541 542 gmove(f, &r1) 543 gmove(&r1, t) 544 gc.Regfree(&r1) 545 return 546 } 547 548 // gins is called by the front end. 549 // It synthesizes some multiple-instruction sequences 550 // so the front end can stay simpler. 551 func gins(as int, f, t *gc.Node) *obj.Prog { 552 if as >= obj.A_ARCHSPECIFIC { 553 if x, ok := f.IntLiteral(); ok { 554 ginscon(as, x, t) 555 return nil // caller must not use 556 } 557 } 558 if as == ppc64.ACMP || as == ppc64.ACMPU { 559 if x, ok := t.IntLiteral(); ok { 560 ginscon2(as, f, x) 561 return nil // caller must not use 562 } 563 } 564 return rawgins(as, f, t) 565 } 566 567 /* 568 * generate one instruction: 569 * as f, t 570 */ 571 func rawgins(as int, f *gc.Node, t *gc.Node) *obj.Prog { 572 // TODO(austin): Add self-move test like in 6g (but be careful 573 // of truncation moves) 574 575 p := gc.Prog(as) 576 gc.Naddr(&p.From, f) 577 gc.Naddr(&p.To, t) 578 579 switch as { 580 case obj.ACALL: 581 if p.To.Type == obj.TYPE_REG && p.To.Reg != ppc64.REG_CTR { 582 // Allow front end to emit CALL REG, and rewrite into MOV REG, CTR; CALL CTR. 583 if gc.Ctxt.Flag_shared != 0 { 584 // Make sure function pointer is in R12 as well when 585 // compiling Go into PIC. 586 // TODO(mwhudson): it would obviously be better to 587 // change the register allocation to put the value in 588 // R12 already, but I don't know how to do that. 589 q := gc.Prog(as) 590 q.As = ppc64.AMOVD 591 q.From = p.To 592 q.To.Type = obj.TYPE_REG 593 q.To.Reg = ppc64.REG_R12 594 } 595 pp := gc.Prog(as) 596 pp.From = p.From 597 pp.To.Type = obj.TYPE_REG 598 pp.To.Reg = ppc64.REG_CTR 599 600 p.As = ppc64.AMOVD 601 p.From = p.To 602 p.To.Type = obj.TYPE_REG 603 p.To.Reg = ppc64.REG_CTR 604 605 if gc.Ctxt.Flag_shared != 0 { 606 // When compiling Go into PIC, the function we just 607 // called via pointer might have been implemented in 608 // a separate module and so overwritten the TOC 609 // pointer in R2; reload it. 610 q := gc.Prog(ppc64.AMOVD) 611 q.From.Type = obj.TYPE_MEM 612 q.From.Offset = 24 613 q.From.Reg = ppc64.REGSP 614 q.To.Type = obj.TYPE_REG 615 q.To.Reg = ppc64.REG_R2 616 } 617 618 if gc.Debug['g'] != 0 { 619 fmt.Printf("%v\n", p) 620 fmt.Printf("%v\n", pp) 621 } 622 623 return pp 624 } 625 626 // Bad things the front end has done to us. Crash to find call stack. 627 case ppc64.AAND, ppc64.AMULLD: 628 if p.From.Type == obj.TYPE_CONST { 629 gc.Debug['h'] = 1 630 gc.Fatalf("bad inst: %v", p) 631 } 632 case ppc64.ACMP, ppc64.ACMPU: 633 if p.From.Type == obj.TYPE_MEM || p.To.Type == obj.TYPE_MEM { 634 gc.Debug['h'] = 1 635 gc.Fatalf("bad inst: %v", p) 636 } 637 } 638 639 if gc.Debug['g'] != 0 { 640 fmt.Printf("%v\n", p) 641 } 642 643 w := int32(0) 644 switch as { 645 case ppc64.AMOVB, 646 ppc64.AMOVBU, 647 ppc64.AMOVBZ, 648 ppc64.AMOVBZU: 649 w = 1 650 651 case ppc64.AMOVH, 652 ppc64.AMOVHU, 653 ppc64.AMOVHZ, 654 ppc64.AMOVHZU: 655 w = 2 656 657 case ppc64.AMOVW, 658 ppc64.AMOVWU, 659 ppc64.AMOVWZ, 660 ppc64.AMOVWZU: 661 w = 4 662 663 case ppc64.AMOVD, 664 ppc64.AMOVDU: 665 if p.From.Type == obj.TYPE_CONST || p.From.Type == obj.TYPE_ADDR { 666 break 667 } 668 w = 8 669 } 670 671 if w != 0 && ((f != nil && p.From.Width < int64(w)) || (t != nil && p.To.Type != obj.TYPE_REG && p.To.Width > int64(w))) { 672 gc.Dump("f", f) 673 gc.Dump("t", t) 674 gc.Fatalf("bad width: %v (%d, %d)\n", p, p.From.Width, p.To.Width) 675 } 676 677 return p 678 } 679 680 /* 681 * return Axxx for Oxxx on type t. 682 */ 683 func optoas(op gc.Op, t *gc.Type) int { 684 if t == nil { 685 gc.Fatalf("optoas: t is nil") 686 } 687 688 // avoid constant conversions in switches below 689 const ( 690 OMINUS_ = uint32(gc.OMINUS) << 16 691 OLSH_ = uint32(gc.OLSH) << 16 692 ORSH_ = uint32(gc.ORSH) << 16 693 OADD_ = uint32(gc.OADD) << 16 694 OSUB_ = uint32(gc.OSUB) << 16 695 OMUL_ = uint32(gc.OMUL) << 16 696 ODIV_ = uint32(gc.ODIV) << 16 697 OOR_ = uint32(gc.OOR) << 16 698 OAND_ = uint32(gc.OAND) << 16 699 OXOR_ = uint32(gc.OXOR) << 16 700 OEQ_ = uint32(gc.OEQ) << 16 701 ONE_ = uint32(gc.ONE) << 16 702 OLT_ = uint32(gc.OLT) << 16 703 OLE_ = uint32(gc.OLE) << 16 704 OGE_ = uint32(gc.OGE) << 16 705 OGT_ = uint32(gc.OGT) << 16 706 OCMP_ = uint32(gc.OCMP) << 16 707 OAS_ = uint32(gc.OAS) << 16 708 OHMUL_ = uint32(gc.OHMUL) << 16 709 ) 710 711 a := int(obj.AXXX) 712 switch uint32(op)<<16 | uint32(gc.Simtype[t.Etype]) { 713 default: 714 gc.Fatalf("optoas: no entry for op=%v type=%v", gc.Oconv(int(op), 0), t) 715 716 case OEQ_ | gc.TBOOL, 717 OEQ_ | gc.TINT8, 718 OEQ_ | gc.TUINT8, 719 OEQ_ | gc.TINT16, 720 OEQ_ | gc.TUINT16, 721 OEQ_ | gc.TINT32, 722 OEQ_ | gc.TUINT32, 723 OEQ_ | gc.TINT64, 724 OEQ_ | gc.TUINT64, 725 OEQ_ | gc.TPTR32, 726 OEQ_ | gc.TPTR64, 727 OEQ_ | gc.TFLOAT32, 728 OEQ_ | gc.TFLOAT64: 729 a = ppc64.ABEQ 730 731 case ONE_ | gc.TBOOL, 732 ONE_ | gc.TINT8, 733 ONE_ | gc.TUINT8, 734 ONE_ | gc.TINT16, 735 ONE_ | gc.TUINT16, 736 ONE_ | gc.TINT32, 737 ONE_ | gc.TUINT32, 738 ONE_ | gc.TINT64, 739 ONE_ | gc.TUINT64, 740 ONE_ | gc.TPTR32, 741 ONE_ | gc.TPTR64, 742 ONE_ | gc.TFLOAT32, 743 ONE_ | gc.TFLOAT64: 744 a = ppc64.ABNE 745 746 case OLT_ | gc.TINT8, // ACMP 747 OLT_ | gc.TINT16, 748 OLT_ | gc.TINT32, 749 OLT_ | gc.TINT64, 750 OLT_ | gc.TUINT8, 751 // ACMPU 752 OLT_ | gc.TUINT16, 753 OLT_ | gc.TUINT32, 754 OLT_ | gc.TUINT64, 755 OLT_ | gc.TFLOAT32, 756 // AFCMPU 757 OLT_ | gc.TFLOAT64: 758 a = ppc64.ABLT 759 760 case OLE_ | gc.TINT8, // ACMP 761 OLE_ | gc.TINT16, 762 OLE_ | gc.TINT32, 763 OLE_ | gc.TINT64, 764 OLE_ | gc.TUINT8, 765 // ACMPU 766 OLE_ | gc.TUINT16, 767 OLE_ | gc.TUINT32, 768 OLE_ | gc.TUINT64: 769 // No OLE for floats, because it mishandles NaN. 770 // Front end must reverse comparison or use OLT and OEQ together. 771 a = ppc64.ABLE 772 773 case OGT_ | gc.TINT8, 774 OGT_ | gc.TINT16, 775 OGT_ | gc.TINT32, 776 OGT_ | gc.TINT64, 777 OGT_ | gc.TUINT8, 778 OGT_ | gc.TUINT16, 779 OGT_ | gc.TUINT32, 780 OGT_ | gc.TUINT64, 781 OGT_ | gc.TFLOAT32, 782 OGT_ | gc.TFLOAT64: 783 a = ppc64.ABGT 784 785 case OGE_ | gc.TINT8, 786 OGE_ | gc.TINT16, 787 OGE_ | gc.TINT32, 788 OGE_ | gc.TINT64, 789 OGE_ | gc.TUINT8, 790 OGE_ | gc.TUINT16, 791 OGE_ | gc.TUINT32, 792 OGE_ | gc.TUINT64: 793 // No OGE for floats, because it mishandles NaN. 794 // Front end must reverse comparison or use OLT and OEQ together. 795 a = ppc64.ABGE 796 797 case OCMP_ | gc.TBOOL, 798 OCMP_ | gc.TINT8, 799 OCMP_ | gc.TINT16, 800 OCMP_ | gc.TINT32, 801 OCMP_ | gc.TPTR32, 802 OCMP_ | gc.TINT64: 803 a = ppc64.ACMP 804 805 case OCMP_ | gc.TUINT8, 806 OCMP_ | gc.TUINT16, 807 OCMP_ | gc.TUINT32, 808 OCMP_ | gc.TUINT64, 809 OCMP_ | gc.TPTR64: 810 a = ppc64.ACMPU 811 812 case OCMP_ | gc.TFLOAT32, 813 OCMP_ | gc.TFLOAT64: 814 a = ppc64.AFCMPU 815 816 case OAS_ | gc.TBOOL, 817 OAS_ | gc.TINT8: 818 a = ppc64.AMOVB 819 820 case OAS_ | gc.TUINT8: 821 a = ppc64.AMOVBZ 822 823 case OAS_ | gc.TINT16: 824 a = ppc64.AMOVH 825 826 case OAS_ | gc.TUINT16: 827 a = ppc64.AMOVHZ 828 829 case OAS_ | gc.TINT32: 830 a = ppc64.AMOVW 831 832 case OAS_ | gc.TUINT32, 833 OAS_ | gc.TPTR32: 834 a = ppc64.AMOVWZ 835 836 case OAS_ | gc.TINT64, 837 OAS_ | gc.TUINT64, 838 OAS_ | gc.TPTR64: 839 a = ppc64.AMOVD 840 841 case OAS_ | gc.TFLOAT32: 842 a = ppc64.AFMOVS 843 844 case OAS_ | gc.TFLOAT64: 845 a = ppc64.AFMOVD 846 847 case OADD_ | gc.TINT8, 848 OADD_ | gc.TUINT8, 849 OADD_ | gc.TINT16, 850 OADD_ | gc.TUINT16, 851 OADD_ | gc.TINT32, 852 OADD_ | gc.TUINT32, 853 OADD_ | gc.TPTR32, 854 OADD_ | gc.TINT64, 855 OADD_ | gc.TUINT64, 856 OADD_ | gc.TPTR64: 857 a = ppc64.AADD 858 859 case OADD_ | gc.TFLOAT32: 860 a = ppc64.AFADDS 861 862 case OADD_ | gc.TFLOAT64: 863 a = ppc64.AFADD 864 865 case OSUB_ | gc.TINT8, 866 OSUB_ | gc.TUINT8, 867 OSUB_ | gc.TINT16, 868 OSUB_ | gc.TUINT16, 869 OSUB_ | gc.TINT32, 870 OSUB_ | gc.TUINT32, 871 OSUB_ | gc.TPTR32, 872 OSUB_ | gc.TINT64, 873 OSUB_ | gc.TUINT64, 874 OSUB_ | gc.TPTR64: 875 a = ppc64.ASUB 876 877 case OSUB_ | gc.TFLOAT32: 878 a = ppc64.AFSUBS 879 880 case OSUB_ | gc.TFLOAT64: 881 a = ppc64.AFSUB 882 883 case OMINUS_ | gc.TINT8, 884 OMINUS_ | gc.TUINT8, 885 OMINUS_ | gc.TINT16, 886 OMINUS_ | gc.TUINT16, 887 OMINUS_ | gc.TINT32, 888 OMINUS_ | gc.TUINT32, 889 OMINUS_ | gc.TPTR32, 890 OMINUS_ | gc.TINT64, 891 OMINUS_ | gc.TUINT64, 892 OMINUS_ | gc.TPTR64: 893 a = ppc64.ANEG 894 895 case OAND_ | gc.TINT8, 896 OAND_ | gc.TUINT8, 897 OAND_ | gc.TINT16, 898 OAND_ | gc.TUINT16, 899 OAND_ | gc.TINT32, 900 OAND_ | gc.TUINT32, 901 OAND_ | gc.TPTR32, 902 OAND_ | gc.TINT64, 903 OAND_ | gc.TUINT64, 904 OAND_ | gc.TPTR64: 905 a = ppc64.AAND 906 907 case OOR_ | gc.TINT8, 908 OOR_ | gc.TUINT8, 909 OOR_ | gc.TINT16, 910 OOR_ | gc.TUINT16, 911 OOR_ | gc.TINT32, 912 OOR_ | gc.TUINT32, 913 OOR_ | gc.TPTR32, 914 OOR_ | gc.TINT64, 915 OOR_ | gc.TUINT64, 916 OOR_ | gc.TPTR64: 917 a = ppc64.AOR 918 919 case OXOR_ | gc.TINT8, 920 OXOR_ | gc.TUINT8, 921 OXOR_ | gc.TINT16, 922 OXOR_ | gc.TUINT16, 923 OXOR_ | gc.TINT32, 924 OXOR_ | gc.TUINT32, 925 OXOR_ | gc.TPTR32, 926 OXOR_ | gc.TINT64, 927 OXOR_ | gc.TUINT64, 928 OXOR_ | gc.TPTR64: 929 a = ppc64.AXOR 930 931 // TODO(minux): handle rotates 932 //case CASE(OLROT, TINT8): 933 //case CASE(OLROT, TUINT8): 934 //case CASE(OLROT, TINT16): 935 //case CASE(OLROT, TUINT16): 936 //case CASE(OLROT, TINT32): 937 //case CASE(OLROT, TUINT32): 938 //case CASE(OLROT, TPTR32): 939 //case CASE(OLROT, TINT64): 940 //case CASE(OLROT, TUINT64): 941 //case CASE(OLROT, TPTR64): 942 // a = 0//???; RLDC? 943 // break; 944 945 case OLSH_ | gc.TINT8, 946 OLSH_ | gc.TUINT8, 947 OLSH_ | gc.TINT16, 948 OLSH_ | gc.TUINT16, 949 OLSH_ | gc.TINT32, 950 OLSH_ | gc.TUINT32, 951 OLSH_ | gc.TPTR32, 952 OLSH_ | gc.TINT64, 953 OLSH_ | gc.TUINT64, 954 OLSH_ | gc.TPTR64: 955 a = ppc64.ASLD 956 957 case ORSH_ | gc.TUINT8, 958 ORSH_ | gc.TUINT16, 959 ORSH_ | gc.TUINT32, 960 ORSH_ | gc.TPTR32, 961 ORSH_ | gc.TUINT64, 962 ORSH_ | gc.TPTR64: 963 a = ppc64.ASRD 964 965 case ORSH_ | gc.TINT8, 966 ORSH_ | gc.TINT16, 967 ORSH_ | gc.TINT32, 968 ORSH_ | gc.TINT64: 969 a = ppc64.ASRAD 970 971 // TODO(minux): handle rotates 972 //case CASE(ORROTC, TINT8): 973 //case CASE(ORROTC, TUINT8): 974 //case CASE(ORROTC, TINT16): 975 //case CASE(ORROTC, TUINT16): 976 //case CASE(ORROTC, TINT32): 977 //case CASE(ORROTC, TUINT32): 978 //case CASE(ORROTC, TINT64): 979 //case CASE(ORROTC, TUINT64): 980 // a = 0//??? RLDC?? 981 // break; 982 983 case OHMUL_ | gc.TINT64: 984 a = ppc64.AMULHD 985 986 case OHMUL_ | gc.TUINT64, 987 OHMUL_ | gc.TPTR64: 988 a = ppc64.AMULHDU 989 990 case OMUL_ | gc.TINT8, 991 OMUL_ | gc.TINT16, 992 OMUL_ | gc.TINT32, 993 OMUL_ | gc.TINT64: 994 a = ppc64.AMULLD 995 996 case OMUL_ | gc.TUINT8, 997 OMUL_ | gc.TUINT16, 998 OMUL_ | gc.TUINT32, 999 OMUL_ | gc.TPTR32, 1000 // don't use word multiply, the high 32-bit are undefined. 1001 OMUL_ | gc.TUINT64, 1002 OMUL_ | gc.TPTR64: 1003 // for 64-bit multiplies, signedness doesn't matter. 1004 a = ppc64.AMULLD 1005 1006 case OMUL_ | gc.TFLOAT32: 1007 a = ppc64.AFMULS 1008 1009 case OMUL_ | gc.TFLOAT64: 1010 a = ppc64.AFMUL 1011 1012 case ODIV_ | gc.TINT8, 1013 ODIV_ | gc.TINT16, 1014 ODIV_ | gc.TINT32, 1015 ODIV_ | gc.TINT64: 1016 a = ppc64.ADIVD 1017 1018 case ODIV_ | gc.TUINT8, 1019 ODIV_ | gc.TUINT16, 1020 ODIV_ | gc.TUINT32, 1021 ODIV_ | gc.TPTR32, 1022 ODIV_ | gc.TUINT64, 1023 ODIV_ | gc.TPTR64: 1024 a = ppc64.ADIVDU 1025 1026 case ODIV_ | gc.TFLOAT32: 1027 a = ppc64.AFDIVS 1028 1029 case ODIV_ | gc.TFLOAT64: 1030 a = ppc64.AFDIV 1031 } 1032 1033 return a 1034 } 1035 1036 const ( 1037 ODynam = 1 << 0 1038 OAddable = 1 << 1 1039 ) 1040 1041 func xgen(n *gc.Node, a *gc.Node, o int) bool { 1042 // TODO(minux) 1043 1044 return -1 != 0 /*TypeKind(100016)*/ 1045 } 1046 1047 func sudoclean() { 1048 return 1049 } 1050 1051 /* 1052 * generate code to compute address of n, 1053 * a reference to a (perhaps nested) field inside 1054 * an array or struct. 1055 * return 0 on failure, 1 on success. 1056 * on success, leaves usable address in a. 1057 * 1058 * caller is responsible for calling sudoclean 1059 * after successful sudoaddable, 1060 * to release the register used for a. 1061 */ 1062 func sudoaddable(as int, n *gc.Node, a *obj.Addr) bool { 1063 // TODO(minux) 1064 1065 *a = obj.Addr{} 1066 return false 1067 }