github.com/mh-cbon/go@v0.0.0-20160603070303-9e112a3fe4c0/src/cmd/compile/internal/ppc64/gsubr.go (about)

     1  // Derived from Inferno utils/6c/txt.c
     2  // http://code.google.com/p/inferno-os/source/browse/utils/6c/txt.c
     3  //
     4  //	Copyright © 1994-1999 Lucent Technologies Inc.  All rights reserved.
     5  //	Portions Copyright © 1995-1997 C H Forsyth (forsyth@terzarima.net)
     6  //	Portions Copyright © 1997-1999 Vita Nuova Limited
     7  //	Portions Copyright © 2000-2007 Vita Nuova Holdings Limited (www.vitanuova.com)
     8  //	Portions Copyright © 2004,2006 Bruce Ellis
     9  //	Portions Copyright © 2005-2007 C H Forsyth (forsyth@terzarima.net)
    10  //	Revisions Copyright © 2000-2007 Lucent Technologies Inc. and others
    11  //	Portions Copyright © 2009 The Go Authors. All rights reserved.
    12  //
    13  // Permission is hereby granted, free of charge, to any person obtaining a copy
    14  // of this software and associated documentation files (the "Software"), to deal
    15  // in the Software without restriction, including without limitation the rights
    16  // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    17  // copies of the Software, and to permit persons to whom the Software is
    18  // furnished to do so, subject to the following conditions:
    19  //
    20  // The above copyright notice and this permission notice shall be included in
    21  // all copies or substantial portions of the Software.
    22  //
    23  // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    24  // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    25  // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
    26  // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    27  // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    28  // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
    29  // THE SOFTWARE.
    30  
    31  package ppc64
    32  
    33  import (
    34  	"cmd/compile/internal/big"
    35  	"cmd/compile/internal/gc"
    36  	"cmd/internal/obj"
    37  	"cmd/internal/obj/ppc64"
    38  	"fmt"
    39  )
    40  
// resvd lists the ppc64 registers this back end treats as reserved.
// NOTE(review): the consumer of this list is outside this file; presumably
// the register allocator never hands these registers out — confirm.
var resvd = []int{
	ppc64.REGZERO,
	ppc64.REGSP, // reserved for SP
	// We need to preserve the C ABI TLS pointer because sigtramp
	// may happen during C code and needs to access the g. C
	// clobbers REGG, so if Go were to clobber REGTLS, sigtramp
	// won't know which convention to use. By preserving REGTLS,
	// we can just retrieve g from TLS when we aren't sure.
	ppc64.REGTLS,

	// TODO(austin): Consolidate REGTLS and REGG?
	ppc64.REGG,
	ppc64.REGTMP, // scratch register; gmove uses it directly
	ppc64.FREGCVI,
	ppc64.FREGZERO,
	ppc64.FREGHALF,
	ppc64.FREGONE,
	ppc64.FREGTWO,
}
    60  
    61  /*
    62   * generate
    63   *	as $c, n
    64   */
    65  func ginscon(as obj.As, c int64, n2 *gc.Node) {
    66  	var n1 gc.Node
    67  
    68  	gc.Nodconst(&n1, gc.Types[gc.TINT64], c)
    69  
    70  	if as != ppc64.AMOVD && (c < -ppc64.BIG || c > ppc64.BIG) || n2.Op != gc.OREGISTER || as == ppc64.AMULLD {
    71  		// cannot have more than 16-bit of immediate in ADD, etc.
    72  		// instead, MOV into register first.
    73  		var ntmp gc.Node
    74  		gc.Regalloc(&ntmp, gc.Types[gc.TINT64], nil)
    75  
    76  		rawgins(ppc64.AMOVD, &n1, &ntmp)
    77  		rawgins(as, &ntmp, n2)
    78  		gc.Regfree(&ntmp)
    79  		return
    80  	}
    81  
    82  	rawgins(as, &n1, n2)
    83  }
    84  
    85  /*
    86   * generate
    87   *	as n, $c (CMP/CMPU)
    88   */
    89  func ginscon2(as obj.As, n2 *gc.Node, c int64) {
    90  	var n1 gc.Node
    91  
    92  	gc.Nodconst(&n1, gc.Types[gc.TINT64], c)
    93  
    94  	switch as {
    95  	default:
    96  		gc.Fatalf("ginscon2")
    97  
    98  	case ppc64.ACMP:
    99  		if -ppc64.BIG <= c && c <= ppc64.BIG {
   100  			rawgins(as, n2, &n1)
   101  			return
   102  		}
   103  
   104  	case ppc64.ACMPU:
   105  		if 0 <= c && c <= 2*ppc64.BIG {
   106  			rawgins(as, n2, &n1)
   107  			return
   108  		}
   109  	}
   110  
   111  	// MOV n1 into register first
   112  	var ntmp gc.Node
   113  	gc.Regalloc(&ntmp, gc.Types[gc.TINT64], nil)
   114  
   115  	rawgins(ppc64.AMOVD, &n1, &ntmp)
   116  	rawgins(as, n2, &ntmp)
   117  	gc.Regfree(&ntmp)
   118  }
   119  
   120  func ginscmp(op gc.Op, t *gc.Type, n1, n2 *gc.Node, likely int) *obj.Prog {
   121  	if t.IsInteger() && n1.Op == gc.OLITERAL && n2.Op != gc.OLITERAL {
   122  		// Reverse comparison to place constant last.
   123  		op = gc.Brrev(op)
   124  		n1, n2 = n2, n1
   125  	}
   126  
   127  	var r1, r2, g1, g2 gc.Node
   128  	gc.Regalloc(&r1, t, n1)
   129  	gc.Regalloc(&g1, n1.Type, &r1)
   130  	gc.Cgen(n1, &g1)
   131  	gmove(&g1, &r1)
   132  	if t.IsInteger() && gc.Isconst(n2, gc.CTINT) {
   133  		ginscon2(optoas(gc.OCMP, t), &r1, n2.Int64())
   134  	} else {
   135  		gc.Regalloc(&r2, t, n2)
   136  		gc.Regalloc(&g2, n1.Type, &r2)
   137  		gc.Cgen(n2, &g2)
   138  		gmove(&g2, &r2)
   139  		rawgins(optoas(gc.OCMP, t), &r1, &r2)
   140  		gc.Regfree(&g2)
   141  		gc.Regfree(&r2)
   142  	}
   143  	gc.Regfree(&g1)
   144  	gc.Regfree(&r1)
   145  	return gc.Gbranch(optoas(op, t), nil, likely)
   146  }
   147  
   148  // set up nodes representing 2^63
   149  var (
   150  	bigi         gc.Node
   151  	bigf         gc.Node
   152  	bignodes_did bool
   153  )
   154  
   155  func bignodes() {
   156  	if bignodes_did {
   157  		return
   158  	}
   159  	bignodes_did = true
   160  
   161  	var i big.Int
   162  	i.SetInt64(1)
   163  	i.Lsh(&i, 63)
   164  
   165  	gc.Nodconst(&bigi, gc.Types[gc.TUINT64], 0)
   166  	bigi.SetBigInt(&i)
   167  
   168  	bigi.Convconst(&bigf, gc.Types[gc.TFLOAT64])
   169  }
   170  
// gmove generates code for the move
//	t = f
// The hard part is conversions: the instruction sequence is chosen from
// the simplified types of f and t.
//
// Outline:
//   - complex operands are delegated to gc.Complexmove;
//   - a memory-to-memory move goes through a register (label hard);
//   - a literal source is converted to the destination type first; for
//     destinations of 32 bits or fewer it is loaded into a 64-bit register
//     and then moved from there;
//   - otherwise the switch on ft<<16|tt either picks a single instruction
//     (break out of the switch), requires a register destination
//     (goto rdst), or emits a multi-instruction conversion and returns.
//
// gmove calls itself recursively to finish moves out of temporaries.
func gmove(f *gc.Node, t *gc.Node) {
	// Debug['M'] enables a trace of every move.
	if gc.Debug['M'] != 0 {
		fmt.Printf("gmove %v -> %v\n", gc.Nconv(f, gc.FmtLong), gc.Nconv(t, gc.FmtLong))
	}

	ft := int(gc.Simsimtype(f.Type))
	tt := int(gc.Simsimtype(t.Type))
	cvt := t.Type // type of the intermediate register used at label hard

	if gc.Iscomplex[ft] || gc.Iscomplex[tt] {
		gc.Complexmove(f, t)
		return
	}

	// cannot have two memory operands
	// (r1, r2 and a are declared before the first goto so that no jump
	// skips over a variable declaration.)
	var r2 gc.Node
	var r1 gc.Node
	var a obj.As
	if gc.Ismem(f) && gc.Ismem(t) {
		goto hard
	}

	// convert constant to desired type
	if f.Op == gc.OLITERAL {
		var con gc.Node
		switch tt {
		default:
			f.Convconst(&con, t.Type)

		// Signed destinations of 32 bits or fewer: widen the constant to
		// int64, load it into a register with MOVD, then let the recursive
		// gmove narrow it into t. (con and r1 here shadow the outer ones.)
		case gc.TINT32,
			gc.TINT16,
			gc.TINT8:
			var con gc.Node
			f.Convconst(&con, gc.Types[gc.TINT64])
			var r1 gc.Node
			gc.Regalloc(&r1, con.Type, t)
			gins(ppc64.AMOVD, &con, &r1)
			gmove(&r1, t)
			gc.Regfree(&r1)
			return

		// Unsigned destinations of 32 bits or fewer: same, via uint64.
		case gc.TUINT32,
			gc.TUINT16,
			gc.TUINT8:
			var con gc.Node
			f.Convconst(&con, gc.Types[gc.TUINT64])
			var r1 gc.Node
			gc.Regalloc(&r1, con.Type, t)
			gins(ppc64.AMOVD, &con, &r1)
			gmove(&r1, t)
			gc.Regfree(&r1)
			return
		}

		f = &con
		ft = tt // so big switch will choose a simple mov

		// constants can't move directly to memory.
		if gc.Ismem(t) {
			goto hard
		}
	}

	// The checks below are disabled (C-syntax leftovers kept for reference).

	// float constants come from memory.
	//if(isfloat[tt])
	//	goto hard;

	// 64-bit immediates are also from memory.
	//if(isint[tt])
	//	goto hard;
	//// 64-bit immediates are really 32-bit sign-extended
	//// unless moving into a register.
	//if(isint[tt]) {
	//	if(mpcmpfixfix(con.val.u.xval, minintval[TINT32]) < 0)
	//		goto hard;
	//	if(mpcmpfixfix(con.val.u.xval, maxintval[TINT32]) > 0)
	//		goto hard;
	//}

	// value -> value copy, only one memory operand.
	// figure out the instruction to use.
	// break out of switch for one-instruction gins.
	// goto rdst for "destination must be register".
	// goto hard for "convert to cvt type first".
	// otherwise handle and return.

	switch uint32(ft)<<16 | uint32(tt) {
	default:
		gc.Fatalf("gmove %v -> %v", gc.Tconv(f.Type, gc.FmtLong), gc.Tconv(t.Type, gc.FmtLong))

		/*
		 * integer copy and truncate
		 */
	case gc.TINT8<<16 | gc.TINT8, // same size
		gc.TUINT8<<16 | gc.TINT8,
		// truncate
		gc.TINT16<<16 | gc.TINT8,
		gc.TUINT16<<16 | gc.TINT8,
		gc.TINT32<<16 | gc.TINT8,
		gc.TUINT32<<16 | gc.TINT8,
		gc.TINT64<<16 | gc.TINT8,
		gc.TUINT64<<16 | gc.TINT8:
		a = ppc64.AMOVB

	case gc.TINT8<<16 | gc.TUINT8, // same size
		gc.TUINT8<<16 | gc.TUINT8,
		// truncate
		gc.TINT16<<16 | gc.TUINT8,
		gc.TUINT16<<16 | gc.TUINT8,
		gc.TINT32<<16 | gc.TUINT8,
		gc.TUINT32<<16 | gc.TUINT8,
		gc.TINT64<<16 | gc.TUINT8,
		gc.TUINT64<<16 | gc.TUINT8:
		a = ppc64.AMOVBZ

	case gc.TINT16<<16 | gc.TINT16, // same size
		gc.TUINT16<<16 | gc.TINT16,
		// truncate
		gc.TINT32<<16 | gc.TINT16,
		gc.TUINT32<<16 | gc.TINT16,
		gc.TINT64<<16 | gc.TINT16,
		gc.TUINT64<<16 | gc.TINT16:
		a = ppc64.AMOVH

	case gc.TINT16<<16 | gc.TUINT16, // same size
		gc.TUINT16<<16 | gc.TUINT16,
		// truncate
		gc.TINT32<<16 | gc.TUINT16,
		gc.TUINT32<<16 | gc.TUINT16,
		gc.TINT64<<16 | gc.TUINT16,
		gc.TUINT64<<16 | gc.TUINT16:
		a = ppc64.AMOVHZ

	case gc.TINT32<<16 | gc.TINT32, // same size
		gc.TUINT32<<16 | gc.TINT32,
		// truncate
		gc.TINT64<<16 | gc.TINT32,
		gc.TUINT64<<16 | gc.TINT32:
		a = ppc64.AMOVW

	case gc.TINT32<<16 | gc.TUINT32, // same size
		gc.TUINT32<<16 | gc.TUINT32,
		// truncate
		gc.TINT64<<16 | gc.TUINT32,
		gc.TUINT64<<16 | gc.TUINT32:
		a = ppc64.AMOVWZ

	case gc.TINT64<<16 | gc.TINT64, // same size
		gc.TINT64<<16 | gc.TUINT64,
		gc.TUINT64<<16 | gc.TINT64,
		gc.TUINT64<<16 | gc.TUINT64:
		a = ppc64.AMOVD

		/*
		 * integer up-conversions
		 */
	case gc.TINT8<<16 | gc.TINT16, // sign extend int8
		gc.TINT8<<16 | gc.TUINT16,
		gc.TINT8<<16 | gc.TINT32,
		gc.TINT8<<16 | gc.TUINT32,
		gc.TINT8<<16 | gc.TINT64,
		gc.TINT8<<16 | gc.TUINT64:
		a = ppc64.AMOVB

		goto rdst

	case gc.TUINT8<<16 | gc.TINT16, // zero extend uint8
		gc.TUINT8<<16 | gc.TUINT16,
		gc.TUINT8<<16 | gc.TINT32,
		gc.TUINT8<<16 | gc.TUINT32,
		gc.TUINT8<<16 | gc.TINT64,
		gc.TUINT8<<16 | gc.TUINT64:
		a = ppc64.AMOVBZ

		goto rdst

	case gc.TINT16<<16 | gc.TINT32, // sign extend int16
		gc.TINT16<<16 | gc.TUINT32,
		gc.TINT16<<16 | gc.TINT64,
		gc.TINT16<<16 | gc.TUINT64:
		a = ppc64.AMOVH

		goto rdst

	case gc.TUINT16<<16 | gc.TINT32, // zero extend uint16
		gc.TUINT16<<16 | gc.TUINT32,
		gc.TUINT16<<16 | gc.TINT64,
		gc.TUINT16<<16 | gc.TUINT64:
		a = ppc64.AMOVHZ

		goto rdst

	case gc.TINT32<<16 | gc.TINT64, // sign extend int32
		gc.TINT32<<16 | gc.TUINT64:
		a = ppc64.AMOVW

		goto rdst

	case gc.TUINT32<<16 | gc.TINT64, // zero extend uint32
		gc.TUINT32<<16 | gc.TUINT64:
		a = ppc64.AMOVWZ

		goto rdst

	/*
	 * float to integer
	 *
	 * algorithm is:
	 *	if small enough, use native float64 -> int64 conversion.
	 *	otherwise, subtract 2^63, convert, and add it back.
	 */
	case gc.TFLOAT32<<16 | gc.TINT32,
		gc.TFLOAT64<<16 | gc.TINT32,
		gc.TFLOAT32<<16 | gc.TINT64,
		gc.TFLOAT64<<16 | gc.TINT64,
		gc.TFLOAT32<<16 | gc.TINT16,
		gc.TFLOAT32<<16 | gc.TINT8,
		gc.TFLOAT32<<16 | gc.TUINT16,
		gc.TFLOAT32<<16 | gc.TUINT8,
		gc.TFLOAT64<<16 | gc.TINT16,
		gc.TFLOAT64<<16 | gc.TINT8,
		gc.TFLOAT64<<16 | gc.TUINT16,
		gc.TFLOAT64<<16 | gc.TUINT8,
		gc.TFLOAT32<<16 | gc.TUINT32,
		gc.TFLOAT64<<16 | gc.TUINT32,
		gc.TFLOAT32<<16 | gc.TUINT64,
		gc.TFLOAT64<<16 | gc.TUINT64:
		bignodes()

		// Bring the source into a floating-point register.
		var r1 gc.Node
		gc.Regalloc(&r1, gc.Types[ft], f)
		gmove(f, &r1)
		if tt == gc.TUINT64 {
			// Compare against 2^63 (bigf); the branch skips the
			// subtraction when the value is less than 2^63.
			gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], nil)
			gmove(&bigf, &r2)
			gins(ppc64.AFCMPU, &r1, &r2)
			p1 := gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TFLOAT64]), nil, +1)
			gins(ppc64.AFSUB, &r2, &r1)
			gc.Patch(p1, gc.Pc)
			gc.Regfree(&r2)
		}

		// Convert in a floating-point register (FCTIDZ), then transfer the
		// bits to integer register r3 by storing to -8(SP) and loading back.
		gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], nil)
		var r3 gc.Node
		gc.Regalloc(&r3, gc.Types[gc.TINT64], t)
		gins(ppc64.AFCTIDZ, &r1, &r2)
		p1 := gins(ppc64.AFMOVD, &r2, nil)
		p1.To.Type = obj.TYPE_MEM
		p1.To.Reg = ppc64.REGSP
		p1.To.Offset = -8
		p1 = gins(ppc64.AMOVD, nil, &r3)
		p1.From.Type = obj.TYPE_MEM
		p1.From.Reg = ppc64.REGSP
		p1.From.Offset = -8
		gc.Regfree(&r2)
		gc.Regfree(&r1)
		if tt == gc.TUINT64 {
			// Add 2^63 (bigi) back unless the value was below 2^63. No new
			// compare is emitted; this branch depends on the condition set
			// by the FCMPU above.
			p1 := gc.Gbranch(optoas(gc.OLT, gc.Types[gc.TFLOAT64]), nil, +1) // use CR0 here again
			gc.Nodreg(&r1, gc.Types[gc.TINT64], ppc64.REGTMP)
			gins(ppc64.AMOVD, &bigi, &r1)
			gins(ppc64.AADD, &r1, &r3)
			gc.Patch(p1, gc.Pc)
		}

		// Final narrowing (if any) from the 64-bit result into t.
		gmove(&r3, t)
		gc.Regfree(&r3)
		return

	/*
	 * signed integer to float
	 *
	 * widen to a 64-bit integer register, transfer the bits to a
	 * floating-point register through -8(SP), then convert with FCFID.
	 */
	case gc.TINT32<<16 | gc.TFLOAT32,
		gc.TINT32<<16 | gc.TFLOAT64,
		gc.TINT64<<16 | gc.TFLOAT32,
		gc.TINT64<<16 | gc.TFLOAT64,
		gc.TINT16<<16 | gc.TFLOAT32,
		gc.TINT16<<16 | gc.TFLOAT64,
		gc.TINT8<<16 | gc.TFLOAT32,
		gc.TINT8<<16 | gc.TFLOAT64:
		var r1 gc.Node
		gc.Regalloc(&r1, gc.Types[gc.TINT64], nil)
		gmove(f, &r1)
		gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], t)
		p1 := gins(ppc64.AMOVD, &r1, nil)
		p1.To.Type = obj.TYPE_MEM
		p1.To.Reg = ppc64.REGSP
		p1.To.Offset = -8
		p1 = gins(ppc64.AFMOVD, nil, &r2)
		p1.From.Type = obj.TYPE_MEM
		p1.From.Reg = ppc64.REGSP
		p1.From.Offset = -8
		gins(ppc64.AFCFID, &r2, &r2)
		gc.Regfree(&r1)
		gmove(&r2, t)
		gc.Regfree(&r2)
		return

	/*
	 * unsigned integer to float
	 *
	 * same sequence as the signed case, but widening to uint64 and
	 * converting with FCFIDU.
	 */
	case gc.TUINT16<<16 | gc.TFLOAT32,
		gc.TUINT16<<16 | gc.TFLOAT64,
		gc.TUINT8<<16 | gc.TFLOAT32,
		gc.TUINT8<<16 | gc.TFLOAT64,
		gc.TUINT32<<16 | gc.TFLOAT32,
		gc.TUINT32<<16 | gc.TFLOAT64,
		gc.TUINT64<<16 | gc.TFLOAT32,
		gc.TUINT64<<16 | gc.TFLOAT64:

		var r1 gc.Node
		gc.Regalloc(&r1, gc.Types[gc.TUINT64], nil)
		gmove(f, &r1)
		gc.Regalloc(&r2, gc.Types[gc.TFLOAT64], t)
		p1 := gins(ppc64.AMOVD, &r1, nil)
		p1.To.Type = obj.TYPE_MEM
		p1.To.Reg = ppc64.REGSP
		p1.To.Offset = -8
		p1 = gins(ppc64.AFMOVD, nil, &r2)
		p1.From.Type = obj.TYPE_MEM
		p1.From.Reg = ppc64.REGSP
		p1.From.Offset = -8
		gins(ppc64.AFCFIDU, &r2, &r2)
		gc.Regfree(&r1)
		gmove(&r2, t)
		gc.Regfree(&r2)
		return

		/*
		 * float to float
		 */
	case gc.TFLOAT32<<16 | gc.TFLOAT32:
		a = ppc64.AFMOVS

	case gc.TFLOAT64<<16 | gc.TFLOAT64:
		a = ppc64.AFMOVD

	case gc.TFLOAT32<<16 | gc.TFLOAT64:
		a = ppc64.AFMOVS
		goto rdst

	case gc.TFLOAT64<<16 | gc.TFLOAT32:
		a = ppc64.AFRSP
		goto rdst
	}

	// One-instruction move selected by the switch.
	gins(a, f, t)
	return

	// requires register destination:
	// apply a into a register of t's type, then move that register to t.
rdst:
	{
		gc.Regalloc(&r1, t.Type, t)

		gins(a, f, &r1)
		gmove(&r1, t)
		gc.Regfree(&r1)
		return
	}

	// requires register intermediate:
	// f -> register of type cvt -> t, each leg handled by a recursive gmove.
hard:
	gc.Regalloc(&r1, cvt, t)

	gmove(f, &r1)
	gmove(&r1, t)
	gc.Regfree(&r1)
	return
}
   545  
   546  // gins is called by the front end.
   547  // It synthesizes some multiple-instruction sequences
   548  // so the front end can stay simpler.
   549  func gins(as obj.As, f, t *gc.Node) *obj.Prog {
   550  	if as >= obj.A_ARCHSPECIFIC {
   551  		if x, ok := f.IntLiteral(); ok {
   552  			ginscon(as, x, t)
   553  			return nil // caller must not use
   554  		}
   555  	}
   556  	if as == ppc64.ACMP || as == ppc64.ACMPU {
   557  		if x, ok := t.IntLiteral(); ok {
   558  			ginscon2(as, f, x)
   559  			return nil // caller must not use
   560  		}
   561  	}
   562  	return rawgins(as, f, t)
   563  }
   564  
// rawgins generates one instruction:
//	as f, t
// and returns its Prog.
//
// Special handling:
//   - CALL to a register other than CTR is rewritten into
//     MOVD REG, CTR; CALL CTR (with extra R12/R2 moves when
//     gc.Ctxt.Flag_shared is set); the returned Prog is the CALL.
//   - AND/MULLD with a constant source, and CMP/CMPU with a memory
//     operand, are fatal errors.
//   - For integer MOV opcodes the operand widths are sanity-checked
//     against the width implied by the opcode; a mismatch is fatal.
// Debug['g'] prints the generated instruction(s).
func rawgins(as obj.As, f *gc.Node, t *gc.Node) *obj.Prog {
	// TODO(austin): Add self-move test like in 6g (but be careful
	// of truncation moves)

	p := gc.Prog(as)
	gc.Naddr(&p.From, f)
	gc.Naddr(&p.To, t)

	switch as {
	case obj.ACALL:
		if p.To.Type == obj.TYPE_REG && p.To.Reg != ppc64.REG_CTR {
			// Allow front end to emit CALL REG, and rewrite into MOV REG, CTR; CALL CTR.
			// Progs are created in the order: p (becomes the MOVD to CTR),
			// optional MOVD to R12, pp (the CALL), optional R2 reload.
			// NOTE(review): presumably gc.Prog appends in call order, so this
			// is also the emitted order — confirm.
			if gc.Ctxt.Flag_shared {
				// Make sure function pointer is in R12 as well when
				// compiling Go into PIC.
				// TODO(mwhudson): it would obviously be better to
				// change the register allocation to put the value in
				// R12 already, but I don't know how to do that.
				q := gc.Prog(as)
				q.As = ppc64.AMOVD
				q.From = p.To
				q.To.Type = obj.TYPE_REG
				q.To.Reg = ppc64.REG_R12
			}
			// pp is the actual call, now through CTR.
			pp := gc.Prog(as)
			pp.From = p.From
			pp.To.Type = obj.TYPE_REG
			pp.To.Reg = ppc64.REG_CTR

			// Turn the original Prog into MOVD REG, CTR.
			p.As = ppc64.AMOVD
			p.From = p.To
			p.To.Type = obj.TYPE_REG
			p.To.Reg = ppc64.REG_CTR

			if gc.Ctxt.Flag_shared {
				// When compiling Go into PIC, the function we just
				// called via pointer might have been implemented in
				// a separate module and so overwritten the TOC
				// pointer in R2; reload it.
				// The reload reads from 24(SP).
				q := gc.Prog(ppc64.AMOVD)
				q.From.Type = obj.TYPE_MEM
				q.From.Offset = 24
				q.From.Reg = ppc64.REGSP
				q.To.Type = obj.TYPE_REG
				q.To.Reg = ppc64.REG_R2
			}

			// Only p and pp are printed; the Flag_shared extras are not.
			if gc.Debug['g'] != 0 {
				fmt.Printf("%v\n", p)
				fmt.Printf("%v\n", pp)
			}

			return pp
		}

	// Bad things the front end has done to us. Crash to find call stack.
	case ppc64.AAND, ppc64.AMULLD:
		if p.From.Type == obj.TYPE_CONST {
			gc.Debug['h'] = 1
			gc.Fatalf("bad inst: %v", p)
		}
	case ppc64.ACMP, ppc64.ACMPU:
		if p.From.Type == obj.TYPE_MEM || p.To.Type == obj.TYPE_MEM {
			gc.Debug['h'] = 1
			gc.Fatalf("bad inst: %v", p)
		}
	}

	if gc.Debug['g'] != 0 {
		fmt.Printf("%v\n", p)
	}

	// w is the operand width in bytes implied by an integer move opcode;
	// 0 means no width check is performed.
	w := int32(0)
	switch as {
	case ppc64.AMOVB,
		ppc64.AMOVBU,
		ppc64.AMOVBZ,
		ppc64.AMOVBZU:
		w = 1

	case ppc64.AMOVH,
		ppc64.AMOVHU,
		ppc64.AMOVHZ,
		ppc64.AMOVHZU:
		w = 2

	case ppc64.AMOVW,
		ppc64.AMOVWU,
		ppc64.AMOVWZ,
		ppc64.AMOVWZU:
		w = 4

	case ppc64.AMOVD,
		ppc64.AMOVDU:
		// MOVD of a constant or an address is exempt from the check.
		if p.From.Type == obj.TYPE_CONST || p.From.Type == obj.TYPE_ADDR {
			break
		}
		w = 8
	}

	// Fatal if the source is narrower than the move, or a non-register
	// destination is wider than the move.
	if w != 0 && ((f != nil && p.From.Width < int64(w)) || (t != nil && p.To.Type != obj.TYPE_REG && p.To.Width > int64(w))) {
		gc.Dump("f", f)
		gc.Dump("t", t)
		gc.Fatalf("bad width: %v (%d, %d)\n", p, p.From.Width, p.To.Width)
	}

	return p
}
   677  
// optoas returns the ppc64 instruction (Axxx) for operation op (Oxxx) on
// type t.
//
// The lookup key is op<<16 | gc.Simtype[t.Etype]. Comparison operators
// (OEQ, ONE, OLT, OLE, OGT, OGE) map to conditional branch instructions;
// OCMP maps to the compare instruction itself. A nil t, or a combination
// with no entry, is a fatal error.
func optoas(op gc.Op, t *gc.Type) obj.As {
	if t == nil {
		gc.Fatalf("optoas: t is nil")
	}

	// avoid constant conversions in switches below
	const (
		OMINUS_ = uint32(gc.OMINUS) << 16
		OLSH_   = uint32(gc.OLSH) << 16
		ORSH_   = uint32(gc.ORSH) << 16
		OADD_   = uint32(gc.OADD) << 16
		OSUB_   = uint32(gc.OSUB) << 16
		OMUL_   = uint32(gc.OMUL) << 16
		ODIV_   = uint32(gc.ODIV) << 16
		OOR_    = uint32(gc.OOR) << 16
		OAND_   = uint32(gc.OAND) << 16
		OXOR_   = uint32(gc.OXOR) << 16
		OEQ_    = uint32(gc.OEQ) << 16
		ONE_    = uint32(gc.ONE) << 16
		OLT_    = uint32(gc.OLT) << 16
		OLE_    = uint32(gc.OLE) << 16
		OGE_    = uint32(gc.OGE) << 16
		OGT_    = uint32(gc.OGT) << 16
		OCMP_   = uint32(gc.OCMP) << 16
		OAS_    = uint32(gc.OAS) << 16
		OHMUL_  = uint32(gc.OHMUL) << 16
		OSQRT_  = uint32(gc.OSQRT) << 16
	)

	a := obj.AXXX
	switch uint32(op)<<16 | uint32(gc.Simtype[t.Etype]) {
	default:
		gc.Fatalf("optoas: no entry for op=%v type=%v", op, t)

	// Conditional branches. The ACMP / ACMPU / AFCMPU markers below note
	// which compare instruction the OCMP cases select for those types.
	case OEQ_ | gc.TBOOL,
		OEQ_ | gc.TINT8,
		OEQ_ | gc.TUINT8,
		OEQ_ | gc.TINT16,
		OEQ_ | gc.TUINT16,
		OEQ_ | gc.TINT32,
		OEQ_ | gc.TUINT32,
		OEQ_ | gc.TINT64,
		OEQ_ | gc.TUINT64,
		OEQ_ | gc.TPTR32,
		OEQ_ | gc.TPTR64,
		OEQ_ | gc.TFLOAT32,
		OEQ_ | gc.TFLOAT64:
		a = ppc64.ABEQ

	case ONE_ | gc.TBOOL,
		ONE_ | gc.TINT8,
		ONE_ | gc.TUINT8,
		ONE_ | gc.TINT16,
		ONE_ | gc.TUINT16,
		ONE_ | gc.TINT32,
		ONE_ | gc.TUINT32,
		ONE_ | gc.TINT64,
		ONE_ | gc.TUINT64,
		ONE_ | gc.TPTR32,
		ONE_ | gc.TPTR64,
		ONE_ | gc.TFLOAT32,
		ONE_ | gc.TFLOAT64:
		a = ppc64.ABNE

	case OLT_ | gc.TINT8, // ACMP
		OLT_ | gc.TINT16,
		OLT_ | gc.TINT32,
		OLT_ | gc.TINT64,
		// ACMPU
		OLT_ | gc.TUINT8,
		OLT_ | gc.TUINT16,
		OLT_ | gc.TUINT32,
		OLT_ | gc.TUINT64,
		// AFCMPU
		OLT_ | gc.TFLOAT32,
		OLT_ | gc.TFLOAT64:
		a = ppc64.ABLT

	case OLE_ | gc.TINT8, // ACMP
		OLE_ | gc.TINT16,
		OLE_ | gc.TINT32,
		OLE_ | gc.TINT64,
		// ACMPU
		OLE_ | gc.TUINT8,
		OLE_ | gc.TUINT16,
		OLE_ | gc.TUINT32,
		OLE_ | gc.TUINT64:
		// No OLE for floats, because it mishandles NaN.
		// Front end must reverse comparison or use OLT and OEQ together.
		a = ppc64.ABLE

	case OGT_ | gc.TINT8,
		OGT_ | gc.TINT16,
		OGT_ | gc.TINT32,
		OGT_ | gc.TINT64,
		OGT_ | gc.TUINT8,
		OGT_ | gc.TUINT16,
		OGT_ | gc.TUINT32,
		OGT_ | gc.TUINT64,
		OGT_ | gc.TFLOAT32,
		OGT_ | gc.TFLOAT64:
		a = ppc64.ABGT

	case OGE_ | gc.TINT8,
		OGE_ | gc.TINT16,
		OGE_ | gc.TINT32,
		OGE_ | gc.TINT64,
		OGE_ | gc.TUINT8,
		OGE_ | gc.TUINT16,
		OGE_ | gc.TUINT32,
		OGE_ | gc.TUINT64:
		// No OGE for floats, because it mishandles NaN.
		// Front end must reverse comparison or use OLT and OEQ together.
		a = ppc64.ABGE

	// Compare instructions.
	case OCMP_ | gc.TBOOL,
		OCMP_ | gc.TINT8,
		OCMP_ | gc.TINT16,
		OCMP_ | gc.TINT32,
		OCMP_ | gc.TPTR32,
		OCMP_ | gc.TINT64:
		a = ppc64.ACMP

	case OCMP_ | gc.TUINT8,
		OCMP_ | gc.TUINT16,
		OCMP_ | gc.TUINT32,
		OCMP_ | gc.TUINT64,
		OCMP_ | gc.TPTR64:
		a = ppc64.ACMPU

	case OCMP_ | gc.TFLOAT32,
		OCMP_ | gc.TFLOAT64:
		a = ppc64.AFCMPU

	// Assignment: one move opcode per operand size and signedness.
	case OAS_ | gc.TBOOL,
		OAS_ | gc.TINT8:
		a = ppc64.AMOVB

	case OAS_ | gc.TUINT8:
		a = ppc64.AMOVBZ

	case OAS_ | gc.TINT16:
		a = ppc64.AMOVH

	case OAS_ | gc.TUINT16:
		a = ppc64.AMOVHZ

	case OAS_ | gc.TINT32:
		a = ppc64.AMOVW

	case OAS_ | gc.TUINT32,
		OAS_ | gc.TPTR32:
		a = ppc64.AMOVWZ

	case OAS_ | gc.TINT64,
		OAS_ | gc.TUINT64,
		OAS_ | gc.TPTR64:
		a = ppc64.AMOVD

	case OAS_ | gc.TFLOAT32:
		a = ppc64.AFMOVS

	case OAS_ | gc.TFLOAT64:
		a = ppc64.AFMOVD

	// Arithmetic and logic: every integer width uses the same opcode.
	case OADD_ | gc.TINT8,
		OADD_ | gc.TUINT8,
		OADD_ | gc.TINT16,
		OADD_ | gc.TUINT16,
		OADD_ | gc.TINT32,
		OADD_ | gc.TUINT32,
		OADD_ | gc.TPTR32,
		OADD_ | gc.TINT64,
		OADD_ | gc.TUINT64,
		OADD_ | gc.TPTR64:
		a = ppc64.AADD

	case OADD_ | gc.TFLOAT32:
		a = ppc64.AFADDS

	case OADD_ | gc.TFLOAT64:
		a = ppc64.AFADD

	case OSUB_ | gc.TINT8,
		OSUB_ | gc.TUINT8,
		OSUB_ | gc.TINT16,
		OSUB_ | gc.TUINT16,
		OSUB_ | gc.TINT32,
		OSUB_ | gc.TUINT32,
		OSUB_ | gc.TPTR32,
		OSUB_ | gc.TINT64,
		OSUB_ | gc.TUINT64,
		OSUB_ | gc.TPTR64:
		a = ppc64.ASUB

	case OSUB_ | gc.TFLOAT32:
		a = ppc64.AFSUBS

	case OSUB_ | gc.TFLOAT64:
		a = ppc64.AFSUB

	case OMINUS_ | gc.TINT8,
		OMINUS_ | gc.TUINT8,
		OMINUS_ | gc.TINT16,
		OMINUS_ | gc.TUINT16,
		OMINUS_ | gc.TINT32,
		OMINUS_ | gc.TUINT32,
		OMINUS_ | gc.TPTR32,
		OMINUS_ | gc.TINT64,
		OMINUS_ | gc.TUINT64,
		OMINUS_ | gc.TPTR64:
		a = ppc64.ANEG

	case OAND_ | gc.TINT8,
		OAND_ | gc.TUINT8,
		OAND_ | gc.TINT16,
		OAND_ | gc.TUINT16,
		OAND_ | gc.TINT32,
		OAND_ | gc.TUINT32,
		OAND_ | gc.TPTR32,
		OAND_ | gc.TINT64,
		OAND_ | gc.TUINT64,
		OAND_ | gc.TPTR64:
		a = ppc64.AAND

	case OOR_ | gc.TINT8,
		OOR_ | gc.TUINT8,
		OOR_ | gc.TINT16,
		OOR_ | gc.TUINT16,
		OOR_ | gc.TINT32,
		OOR_ | gc.TUINT32,
		OOR_ | gc.TPTR32,
		OOR_ | gc.TINT64,
		OOR_ | gc.TUINT64,
		OOR_ | gc.TPTR64:
		a = ppc64.AOR

	case OXOR_ | gc.TINT8,
		OXOR_ | gc.TUINT8,
		OXOR_ | gc.TINT16,
		OXOR_ | gc.TUINT16,
		OXOR_ | gc.TINT32,
		OXOR_ | gc.TUINT32,
		OXOR_ | gc.TPTR32,
		OXOR_ | gc.TINT64,
		OXOR_ | gc.TUINT64,
		OXOR_ | gc.TPTR64:
		a = ppc64.AXOR

	// TODO(minux): handle rotates
	//case CASE(OLROT, TINT8):
	//case CASE(OLROT, TUINT8):
	//case CASE(OLROT, TINT16):
	//case CASE(OLROT, TUINT16):
	//case CASE(OLROT, TINT32):
	//case CASE(OLROT, TUINT32):
	//case CASE(OLROT, TPTR32):
	//case CASE(OLROT, TINT64):
	//case CASE(OLROT, TUINT64):
	//case CASE(OLROT, TPTR64):
	//	a = 0//???; RLDC?
	//	break;

	// Shifts: left shift is SLD for all types; right shift is SRD for
	// unsigned/pointer types and SRAD for signed types.
	case OLSH_ | gc.TINT8,
		OLSH_ | gc.TUINT8,
		OLSH_ | gc.TINT16,
		OLSH_ | gc.TUINT16,
		OLSH_ | gc.TINT32,
		OLSH_ | gc.TUINT32,
		OLSH_ | gc.TPTR32,
		OLSH_ | gc.TINT64,
		OLSH_ | gc.TUINT64,
		OLSH_ | gc.TPTR64:
		a = ppc64.ASLD

	case ORSH_ | gc.TUINT8,
		ORSH_ | gc.TUINT16,
		ORSH_ | gc.TUINT32,
		ORSH_ | gc.TPTR32,
		ORSH_ | gc.TUINT64,
		ORSH_ | gc.TPTR64:
		a = ppc64.ASRD

	case ORSH_ | gc.TINT8,
		ORSH_ | gc.TINT16,
		ORSH_ | gc.TINT32,
		ORSH_ | gc.TINT64:
		a = ppc64.ASRAD

	// TODO(minux): handle rotates
	//case CASE(ORROTC, TINT8):
	//case CASE(ORROTC, TUINT8):
	//case CASE(ORROTC, TINT16):
	//case CASE(ORROTC, TUINT16):
	//case CASE(ORROTC, TINT32):
	//case CASE(ORROTC, TUINT32):
	//case CASE(ORROTC, TINT64):
	//case CASE(ORROTC, TUINT64):
	//	a = 0//??? RLDC??
	//	break;

	// High multiply is only defined here for 64-bit operands.
	case OHMUL_ | gc.TINT64:
		a = ppc64.AMULHD

	case OHMUL_ | gc.TUINT64,
		OHMUL_ | gc.TPTR64:
		a = ppc64.AMULHDU

	case OMUL_ | gc.TINT8,
		OMUL_ | gc.TINT16,
		OMUL_ | gc.TINT32,
		OMUL_ | gc.TINT64:
		a = ppc64.AMULLD

	case OMUL_ | gc.TUINT8,
		OMUL_ | gc.TUINT16,
		OMUL_ | gc.TUINT32,
		OMUL_ | gc.TPTR32,
		OMUL_ | gc.TUINT64,
		OMUL_ | gc.TPTR64:
		// The narrower types don't use word multiply because the high
		// 32 bits are undefined; for 64-bit multiplies, signedness
		// doesn't matter.
		a = ppc64.AMULLD

	case OMUL_ | gc.TFLOAT32:
		a = ppc64.AFMULS

	case OMUL_ | gc.TFLOAT64:
		a = ppc64.AFMUL

	case ODIV_ | gc.TINT8,
		ODIV_ | gc.TINT16,
		ODIV_ | gc.TINT32,
		ODIV_ | gc.TINT64:
		a = ppc64.ADIVD

	case ODIV_ | gc.TUINT8,
		ODIV_ | gc.TUINT16,
		ODIV_ | gc.TUINT32,
		ODIV_ | gc.TPTR32,
		ODIV_ | gc.TUINT64,
		ODIV_ | gc.TPTR64:
		a = ppc64.ADIVDU

	case ODIV_ | gc.TFLOAT32:
		a = ppc64.AFDIVS

	case ODIV_ | gc.TFLOAT64:
		a = ppc64.AFDIV

	// Square root has an entry for float64 only.
	case OSQRT_ | gc.TFLOAT64:
		a = ppc64.AFSQRT
	}

	return a
}
  1037  
// Bit flags; no code visible in this file refers to them.
// NOTE(review): presumably option bits for xgen's o argument — confirm
// against callers before relying on that.
const (
	ODynam   = 1 << 0
	OAddable = 1 << 1
)
  1042  
  1043  func xgen(n *gc.Node, a *gc.Node, o int) bool {
  1044  	// TODO(minux)
  1045  
  1046  	return -1 != 0 /*TypeKind(100016)*/
  1047  }
  1048  
  1049  func sudoclean() {
  1050  	return
  1051  }
  1052  
  1053  /*
  1054   * generate code to compute address of n,
  1055   * a reference to a (perhaps nested) field inside
  1056   * an array or struct.
  1057   * return 0 on failure, 1 on success.
  1058   * on success, leaves usable address in a.
  1059   *
  1060   * caller is responsible for calling sudoclean
  1061   * after successful sudoaddable,
  1062   * to release the register used for a.
  1063   */
  1064  func sudoaddable(as obj.As, n *gc.Node, a *obj.Addr) bool {
  1065  	// TODO(minux)
  1066  
  1067  	*a = obj.Addr{}
  1068  	return false
  1069  }