github.com/q45/go@v0.0.0-20151101211701-a4fb8c13db3f/src/cmd/compile/internal/mips64/peep.go (about)

     1  // Derived from Inferno utils/6c/peep.c
     2  // http://code.google.com/p/inferno-os/source/browse/utils/6c/peep.c
     3  //
     4  //	Copyright © 1994-1999 Lucent Technologies Inc.  All rights reserved.
     5  //	Portions Copyright © 1995-1997 C H Forsyth (forsyth@terzarima.net)
     6  //	Portions Copyright © 1997-1999 Vita Nuova Limited
     7  //	Portions Copyright © 2000-2007 Vita Nuova Holdings Limited (www.vitanuova.com)
     8  //	Portions Copyright © 2004,2006 Bruce Ellis
     9  //	Portions Copyright © 2005-2007 C H Forsyth (forsyth@terzarima.net)
    10  //	Revisions Copyright © 2000-2007 Lucent Technologies Inc. and others
    11  //	Portions Copyright © 2009 The Go Authors.  All rights reserved.
    12  //
    13  // Permission is hereby granted, free of charge, to any person obtaining a copy
    14  // of this software and associated documentation files (the "Software"), to deal
    15  // in the Software without restriction, including without limitation the rights
    16  // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    17  // copies of the Software, and to permit persons to whom the Software is
    18  // furnished to do so, subject to the following conditions:
    19  //
    20  // The above copyright notice and this permission notice shall be included in
    21  // all copies or substantial portions of the Software.
    22  //
    23  // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    24  // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    25  // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
    26  // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    27  // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    28  // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
    29  // THE SOFTWARE.
    30  
    31  package ppc64
    32  
    33  import (
    34  	"cmd/compile/internal/gc"
    35  	"cmd/internal/obj"
    36  	"cmd/internal/obj/ppc64"
    37  	"fmt"
    38  )
    39  
    40  var gactive uint32
    41  
    42  func peep(firstp *obj.Prog) {
    43  	g := (*gc.Graph)(gc.Flowstart(firstp, nil))
    44  	if g == nil {
    45  		return
    46  	}
    47  	gactive = 0
    48  
    49  	var p *obj.Prog
    50  	var r *gc.Flow
    51  	var t int
    52  loop1:
    53  	if gc.Debug['P'] != 0 && gc.Debug['v'] != 0 {
    54  		gc.Dumpit("loop1", g.Start, 0)
    55  	}
    56  
    57  	t = 0
    58  	for r = g.Start; r != nil; r = r.Link {
    59  		p = r.Prog
    60  
    61  		// TODO(austin) Handle smaller moves.  arm and amd64
    62  		// distinguish between moves that moves that *must*
    63  		// sign/zero extend and moves that don't care so they
    64  		// can eliminate moves that don't care without
    65  		// breaking moves that do care.  This might let us
    66  		// simplify or remove the next peep loop, too.
    67  		if p.As == ppc64.AMOVD || p.As == ppc64.AFMOVD {
    68  			if regtyp(&p.To) {
    69  				// Try to eliminate reg->reg moves
    70  				if regtyp(&p.From) {
    71  					if p.From.Type == p.To.Type {
    72  						if copyprop(r) {
    73  							excise(r)
    74  							t++
    75  						} else if subprop(r) && copyprop(r) {
    76  							excise(r)
    77  							t++
    78  						}
    79  					}
    80  				}
    81  
    82  				// Convert uses to $0 to uses of R0 and
    83  				// propagate R0
    84  				if regzer(&p.From) != 0 {
    85  					if p.To.Type == obj.TYPE_REG {
    86  						p.From.Type = obj.TYPE_REG
    87  						p.From.Reg = ppc64.REGZERO
    88  						if copyprop(r) {
    89  							excise(r)
    90  							t++
    91  						} else if subprop(r) && copyprop(r) {
    92  							excise(r)
    93  							t++
    94  						}
    95  					}
    96  				}
    97  			}
    98  		}
    99  	}
   100  
   101  	if t != 0 {
   102  		goto loop1
   103  	}
   104  
   105  	/*
   106  	 * look for MOVB x,R; MOVB R,R (for small MOVs not handled above)
   107  	 */
   108  	var p1 *obj.Prog
   109  	var r1 *gc.Flow
   110  	for r := (*gc.Flow)(g.Start); r != nil; r = r.Link {
   111  		p = r.Prog
   112  		switch p.As {
   113  		default:
   114  			continue
   115  
   116  		case ppc64.AMOVH,
   117  			ppc64.AMOVHZ,
   118  			ppc64.AMOVB,
   119  			ppc64.AMOVBZ,
   120  			ppc64.AMOVW,
   121  			ppc64.AMOVWZ:
   122  			if p.To.Type != obj.TYPE_REG {
   123  				continue
   124  			}
   125  		}
   126  
   127  		r1 = r.Link
   128  		if r1 == nil {
   129  			continue
   130  		}
   131  		p1 = r1.Prog
   132  		if p1.As != p.As {
   133  			continue
   134  		}
   135  		if p1.From.Type != obj.TYPE_REG || p1.From.Reg != p.To.Reg {
   136  			continue
   137  		}
   138  		if p1.To.Type != obj.TYPE_REG || p1.To.Reg != p.To.Reg {
   139  			continue
   140  		}
   141  		excise(r1)
   142  	}
   143  
   144  	if gc.Debug['D'] > 1 {
   145  		goto ret /* allow following code improvement to be suppressed */
   146  	}
   147  
   148  	/*
   149  	 * look for OP x,y,R; CMP R, $0 -> OPCC x,y,R
   150  	 * when OP can set condition codes correctly
   151  	 */
   152  	for r := (*gc.Flow)(g.Start); r != nil; r = r.Link {
   153  		p = r.Prog
   154  		switch p.As {
   155  		case ppc64.ACMP,
   156  			ppc64.ACMPW: /* always safe? */
   157  			if regzer(&p.To) == 0 {
   158  				continue
   159  			}
   160  			r1 = r.S1
   161  			if r1 == nil {
   162  				continue
   163  			}
   164  			switch r1.Prog.As {
   165  			default:
   166  				continue
   167  
   168  				/* the conditions can be complex and these are currently little used */
   169  			case ppc64.ABCL,
   170  				ppc64.ABC:
   171  				continue
   172  
   173  			case ppc64.ABEQ,
   174  				ppc64.ABGE,
   175  				ppc64.ABGT,
   176  				ppc64.ABLE,
   177  				ppc64.ABLT,
   178  				ppc64.ABNE,
   179  				ppc64.ABVC,
   180  				ppc64.ABVS:
   181  				break
   182  			}
   183  
   184  			r1 = r
   185  			for {
   186  				r1 = gc.Uniqp(r1)
   187  				if r1 == nil || r1.Prog.As != obj.ANOP {
   188  					break
   189  				}
   190  			}
   191  
   192  			if r1 == nil {
   193  				continue
   194  			}
   195  			p1 = r1.Prog
   196  			if p1.To.Type != obj.TYPE_REG || p1.To.Reg != p.From.Reg {
   197  				continue
   198  			}
   199  			switch p1.As {
   200  			/* irregular instructions */
   201  			case ppc64.ASUB,
   202  				ppc64.AADD,
   203  				ppc64.AXOR,
   204  				ppc64.AOR:
   205  				if p1.From.Type == obj.TYPE_CONST || p1.From.Type == obj.TYPE_ADDR {
   206  					continue
   207  				}
   208  			}
   209  
   210  			switch p1.As {
   211  			default:
   212  				continue
   213  
   214  			case ppc64.AMOVW,
   215  				ppc64.AMOVD:
   216  				if p1.From.Type != obj.TYPE_REG {
   217  					continue
   218  				}
   219  				continue
   220  
   221  			case ppc64.AANDCC,
   222  				ppc64.AANDNCC,
   223  				ppc64.AORCC,
   224  				ppc64.AORNCC,
   225  				ppc64.AXORCC,
   226  				ppc64.ASUBCC,
   227  				ppc64.ASUBECC,
   228  				ppc64.ASUBMECC,
   229  				ppc64.ASUBZECC,
   230  				ppc64.AADDCC,
   231  				ppc64.AADDCCC,
   232  				ppc64.AADDECC,
   233  				ppc64.AADDMECC,
   234  				ppc64.AADDZECC,
   235  				ppc64.ARLWMICC,
   236  				ppc64.ARLWNMCC,
   237  				/* don't deal with floating point instructions for now */
   238  				/*
   239  					case AFABS:
   240  					case AFADD:
   241  					case AFADDS:
   242  					case AFCTIW:
   243  					case AFCTIWZ:
   244  					case AFDIV:
   245  					case AFDIVS:
   246  					case AFMADD:
   247  					case AFMADDS:
   248  					case AFMOVD:
   249  					case AFMSUB:
   250  					case AFMSUBS:
   251  					case AFMUL:
   252  					case AFMULS:
   253  					case AFNABS:
   254  					case AFNEG:
   255  					case AFNMADD:
   256  					case AFNMADDS:
   257  					case AFNMSUB:
   258  					case AFNMSUBS:
   259  					case AFRSP:
   260  					case AFSUB:
   261  					case AFSUBS:
   262  					case ACNTLZW:
   263  					case AMTFSB0:
   264  					case AMTFSB1:
   265  				*/
   266  				ppc64.AADD,
   267  				ppc64.AADDV,
   268  				ppc64.AADDC,
   269  				ppc64.AADDCV,
   270  				ppc64.AADDME,
   271  				ppc64.AADDMEV,
   272  				ppc64.AADDE,
   273  				ppc64.AADDEV,
   274  				ppc64.AADDZE,
   275  				ppc64.AADDZEV,
   276  				ppc64.AAND,
   277  				ppc64.AANDN,
   278  				ppc64.ADIVW,
   279  				ppc64.ADIVWV,
   280  				ppc64.ADIVWU,
   281  				ppc64.ADIVWUV,
   282  				ppc64.ADIVD,
   283  				ppc64.ADIVDV,
   284  				ppc64.ADIVDU,
   285  				ppc64.ADIVDUV,
   286  				ppc64.AEQV,
   287  				ppc64.AEXTSB,
   288  				ppc64.AEXTSH,
   289  				ppc64.AEXTSW,
   290  				ppc64.AMULHW,
   291  				ppc64.AMULHWU,
   292  				ppc64.AMULLW,
   293  				ppc64.AMULLWV,
   294  				ppc64.AMULHD,
   295  				ppc64.AMULHDU,
   296  				ppc64.AMULLD,
   297  				ppc64.AMULLDV,
   298  				ppc64.ANAND,
   299  				ppc64.ANEG,
   300  				ppc64.ANEGV,
   301  				ppc64.ANOR,
   302  				ppc64.AOR,
   303  				ppc64.AORN,
   304  				ppc64.AREM,
   305  				ppc64.AREMV,
   306  				ppc64.AREMU,
   307  				ppc64.AREMUV,
   308  				ppc64.AREMD,
   309  				ppc64.AREMDV,
   310  				ppc64.AREMDU,
   311  				ppc64.AREMDUV,
   312  				ppc64.ARLWMI,
   313  				ppc64.ARLWNM,
   314  				ppc64.ASLW,
   315  				ppc64.ASRAW,
   316  				ppc64.ASRW,
   317  				ppc64.ASLD,
   318  				ppc64.ASRAD,
   319  				ppc64.ASRD,
   320  				ppc64.ASUB,
   321  				ppc64.ASUBV,
   322  				ppc64.ASUBC,
   323  				ppc64.ASUBCV,
   324  				ppc64.ASUBME,
   325  				ppc64.ASUBMEV,
   326  				ppc64.ASUBE,
   327  				ppc64.ASUBEV,
   328  				ppc64.ASUBZE,
   329  				ppc64.ASUBZEV,
   330  				ppc64.AXOR:
   331  				t = variant2as(int(p1.As), as2variant(int(p1.As))|V_CC)
   332  			}
   333  
   334  			if gc.Debug['D'] != 0 {
   335  				fmt.Printf("cmp %v; %v -> ", p1, p)
   336  			}
   337  			p1.As = int16(t)
   338  			if gc.Debug['D'] != 0 {
   339  				fmt.Printf("%v\n", p1)
   340  			}
   341  			excise(r)
   342  			continue
   343  		}
   344  	}
   345  
   346  ret:
   347  	gc.Flowend(g)
   348  }
   349  
   350  func excise(r *gc.Flow) {
   351  	p := (*obj.Prog)(r.Prog)
   352  	if gc.Debug['P'] != 0 && gc.Debug['v'] != 0 {
   353  		fmt.Printf("%v ===delete===\n", p)
   354  	}
   355  	obj.Nopout(p)
   356  	gc.Ostats.Ndelmov++
   357  }
   358  
   359  /*
   360   * regzer returns 1 if a's value is 0 (a is R0 or $0)
   361   */
   362  func regzer(a *obj.Addr) int {
   363  	if a.Type == obj.TYPE_CONST || a.Type == obj.TYPE_ADDR {
   364  		if a.Sym == nil && a.Reg == 0 {
   365  			if a.Offset == 0 {
   366  				return 1
   367  			}
   368  		}
   369  	}
   370  	if a.Type == obj.TYPE_REG {
   371  		if a.Reg == ppc64.REGZERO {
   372  			return 1
   373  		}
   374  	}
   375  	return 0
   376  }
   377  
   378  func regtyp(a *obj.Addr) bool {
   379  	// TODO(rsc): Floating point register exclusions?
   380  	return a.Type == obj.TYPE_REG && ppc64.REG_R0 <= a.Reg && a.Reg <= ppc64.REG_F31 && a.Reg != ppc64.REGZERO
   381  }
   382  
   383  /*
   384   * the idea is to substitute
   385   * one register for another
   386   * from one MOV to another
   387   *	MOV	a, R1
   388   *	ADD	b, R1	/ no use of R2
   389   *	MOV	R1, R2
   390   * would be converted to
   391   *	MOV	a, R2
   392   *	ADD	b, R2
   393   *	MOV	R2, R1
   394   * hopefully, then the former or latter MOV
   395   * will be eliminated by copy propagation.
   396   *
   397   * r0 (the argument, not the register) is the MOV at the end of the
   398   * above sequences.  This returns 1 if it modified any instructions.
   399   */
   400  func subprop(r0 *gc.Flow) bool {
   401  	p := (*obj.Prog)(r0.Prog)
   402  	v1 := (*obj.Addr)(&p.From)
   403  	if !regtyp(v1) {
   404  		return false
   405  	}
   406  	v2 := (*obj.Addr)(&p.To)
   407  	if !regtyp(v2) {
   408  		return false
   409  	}
   410  	for r := gc.Uniqp(r0); r != nil; r = gc.Uniqp(r) {
   411  		if gc.Uniqs(r) == nil {
   412  			break
   413  		}
   414  		p = r.Prog
   415  		if p.As == obj.AVARDEF || p.As == obj.AVARKILL {
   416  			continue
   417  		}
   418  		if p.Info.Flags&gc.Call != 0 {
   419  			return false
   420  		}
   421  
   422  		if p.Info.Flags&(gc.RightRead|gc.RightWrite) == gc.RightWrite {
   423  			if p.To.Type == v1.Type {
   424  				if p.To.Reg == v1.Reg {
   425  					copysub(&p.To, v1, v2, 1)
   426  					if gc.Debug['P'] != 0 {
   427  						fmt.Printf("gotit: %v->%v\n%v", gc.Ctxt.Dconv(v1), gc.Ctxt.Dconv(v2), r.Prog)
   428  						if p.From.Type == v2.Type {
   429  							fmt.Printf(" excise")
   430  						}
   431  						fmt.Printf("\n")
   432  					}
   433  
   434  					for r = gc.Uniqs(r); r != r0; r = gc.Uniqs(r) {
   435  						p = r.Prog
   436  						copysub(&p.From, v1, v2, 1)
   437  						copysub1(p, v1, v2, 1)
   438  						copysub(&p.To, v1, v2, 1)
   439  						if gc.Debug['P'] != 0 {
   440  							fmt.Printf("%v\n", r.Prog)
   441  						}
   442  					}
   443  
   444  					t := int(int(v1.Reg))
   445  					v1.Reg = v2.Reg
   446  					v2.Reg = int16(t)
   447  					if gc.Debug['P'] != 0 {
   448  						fmt.Printf("%v last\n", r.Prog)
   449  					}
   450  					return true
   451  				}
   452  			}
   453  		}
   454  
   455  		if copyau(&p.From, v2) || copyau1(p, v2) || copyau(&p.To, v2) {
   456  			break
   457  		}
   458  		if copysub(&p.From, v1, v2, 0) != 0 || copysub1(p, v1, v2, 0) != 0 || copysub(&p.To, v1, v2, 0) != 0 {
   459  			break
   460  		}
   461  	}
   462  
   463  	return false
   464  }
   465  
   466  /*
   467   * The idea is to remove redundant copies.
   468   *	v1->v2	F=0
   469   *	(use v2	s/v2/v1/)*
   470   *	set v1	F=1
   471   *	use v2	return fail (v1->v2 move must remain)
   472   *	-----------------
   473   *	v1->v2	F=0
   474   *	(use v2	s/v2/v1/)*
   475   *	set v1	F=1
   476   *	set v2	return success (caller can remove v1->v2 move)
   477   */
   478  func copyprop(r0 *gc.Flow) bool {
   479  	p := (*obj.Prog)(r0.Prog)
   480  	v1 := (*obj.Addr)(&p.From)
   481  	v2 := (*obj.Addr)(&p.To)
   482  	if copyas(v1, v2) {
   483  		if gc.Debug['P'] != 0 {
   484  			fmt.Printf("eliminating self-move: %v\n", r0.Prog)
   485  		}
   486  		return true
   487  	}
   488  
   489  	gactive++
   490  	if gc.Debug['P'] != 0 {
   491  		fmt.Printf("trying to eliminate %v->%v move from:\n%v\n", gc.Ctxt.Dconv(v1), gc.Ctxt.Dconv(v2), r0.Prog)
   492  	}
   493  	return copy1(v1, v2, r0.S1, 0)
   494  }
   495  
   496  // copy1 replaces uses of v2 with v1 starting at r and returns 1 if
   497  // all uses were rewritten.
   498  func copy1(v1 *obj.Addr, v2 *obj.Addr, r *gc.Flow, f int) bool {
   499  	if uint32(r.Active) == gactive {
   500  		if gc.Debug['P'] != 0 {
   501  			fmt.Printf("act set; return 1\n")
   502  		}
   503  		return true
   504  	}
   505  
   506  	r.Active = int32(gactive)
   507  	if gc.Debug['P'] != 0 {
   508  		fmt.Printf("copy1 replace %v with %v f=%d\n", gc.Ctxt.Dconv(v2), gc.Ctxt.Dconv(v1), f)
   509  	}
   510  	var t int
   511  	var p *obj.Prog
   512  	for ; r != nil; r = r.S1 {
   513  		p = r.Prog
   514  		if gc.Debug['P'] != 0 {
   515  			fmt.Printf("%v", p)
   516  		}
   517  		if f == 0 && gc.Uniqp(r) == nil {
   518  			// Multiple predecessors; conservatively
   519  			// assume v1 was set on other path
   520  			f = 1
   521  
   522  			if gc.Debug['P'] != 0 {
   523  				fmt.Printf("; merge; f=%d", f)
   524  			}
   525  		}
   526  
   527  		t = copyu(p, v2, nil)
   528  		switch t {
   529  		case 2: /* rar, can't split */
   530  			if gc.Debug['P'] != 0 {
   531  				fmt.Printf("; %v rar; return 0\n", gc.Ctxt.Dconv(v2))
   532  			}
   533  			return false
   534  
   535  		case 3: /* set */
   536  			if gc.Debug['P'] != 0 {
   537  				fmt.Printf("; %v set; return 1\n", gc.Ctxt.Dconv(v2))
   538  			}
   539  			return true
   540  
   541  		case 1, /* used, substitute */
   542  			4: /* use and set */
   543  			if f != 0 {
   544  				if gc.Debug['P'] == 0 {
   545  					return false
   546  				}
   547  				if t == 4 {
   548  					fmt.Printf("; %v used+set and f=%d; return 0\n", gc.Ctxt.Dconv(v2), f)
   549  				} else {
   550  					fmt.Printf("; %v used and f=%d; return 0\n", gc.Ctxt.Dconv(v2), f)
   551  				}
   552  				return false
   553  			}
   554  
   555  			if copyu(p, v2, v1) != 0 {
   556  				if gc.Debug['P'] != 0 {
   557  					fmt.Printf("; sub fail; return 0\n")
   558  				}
   559  				return false
   560  			}
   561  
   562  			if gc.Debug['P'] != 0 {
   563  				fmt.Printf("; sub %v->%v\n => %v", gc.Ctxt.Dconv(v2), gc.Ctxt.Dconv(v1), p)
   564  			}
   565  			if t == 4 {
   566  				if gc.Debug['P'] != 0 {
   567  					fmt.Printf("; %v used+set; return 1\n", gc.Ctxt.Dconv(v2))
   568  				}
   569  				return true
   570  			}
   571  		}
   572  
   573  		if f == 0 {
   574  			t = copyu(p, v1, nil)
   575  			if f == 0 && (t == 2 || t == 3 || t == 4) {
   576  				f = 1
   577  				if gc.Debug['P'] != 0 {
   578  					fmt.Printf("; %v set and !f; f=%d", gc.Ctxt.Dconv(v1), f)
   579  				}
   580  			}
   581  		}
   582  
   583  		if gc.Debug['P'] != 0 {
   584  			fmt.Printf("\n")
   585  		}
   586  		if r.S2 != nil {
   587  			if !copy1(v1, v2, r.S2, f) {
   588  				return false
   589  			}
   590  		}
   591  	}
   592  
   593  	return true
   594  }
   595  
   596  // If s==nil, copyu returns the set/use of v in p; otherwise, it
   597  // modifies p to replace reads of v with reads of s and returns 0 for
   598  // success or non-zero for failure.
   599  //
   600  // If s==nil, copy returns one of the following values:
   601  // 	1 if v only used
   602  //	2 if v is set and used in one address (read-alter-rewrite;
   603  // 	  can't substitute)
   604  //	3 if v is only set
   605  //	4 if v is set in one address and used in another (so addresses
   606  // 	  can be rewritten independently)
   607  //	0 otherwise (not touched)
   608  func copyu(p *obj.Prog, v *obj.Addr, s *obj.Addr) int {
   609  	if p.From3Type() != obj.TYPE_NONE {
   610  		// 9g never generates a from3
   611  		fmt.Printf("copyu: from3 (%v) not implemented\n", gc.Ctxt.Dconv(p.From3))
   612  	}
   613  
   614  	switch p.As {
   615  	default:
   616  		fmt.Printf("copyu: can't find %v\n", obj.Aconv(int(p.As)))
   617  		return 2
   618  
   619  	case obj.ANOP, /* read p->from, write p->to */
   620  		ppc64.AMOVH,
   621  		ppc64.AMOVHZ,
   622  		ppc64.AMOVB,
   623  		ppc64.AMOVBZ,
   624  		ppc64.AMOVW,
   625  		ppc64.AMOVWZ,
   626  		ppc64.AMOVD,
   627  		ppc64.ANEG,
   628  		ppc64.ANEGCC,
   629  		ppc64.AADDME,
   630  		ppc64.AADDMECC,
   631  		ppc64.AADDZE,
   632  		ppc64.AADDZECC,
   633  		ppc64.ASUBME,
   634  		ppc64.ASUBMECC,
   635  		ppc64.ASUBZE,
   636  		ppc64.ASUBZECC,
   637  		ppc64.AFCTIW,
   638  		ppc64.AFCTIWZ,
   639  		ppc64.AFCTID,
   640  		ppc64.AFCTIDZ,
   641  		ppc64.AFCFID,
   642  		ppc64.AFCFIDCC,
   643  		ppc64.AFMOVS,
   644  		ppc64.AFMOVD,
   645  		ppc64.AFRSP,
   646  		ppc64.AFNEG,
   647  		ppc64.AFNEGCC:
   648  		if s != nil {
   649  			if copysub(&p.From, v, s, 1) != 0 {
   650  				return 1
   651  			}
   652  
   653  			// Update only indirect uses of v in p->to
   654  			if !copyas(&p.To, v) {
   655  				if copysub(&p.To, v, s, 1) != 0 {
   656  					return 1
   657  				}
   658  			}
   659  			return 0
   660  		}
   661  
   662  		if copyas(&p.To, v) {
   663  			// Fix up implicit from
   664  			if p.From.Type == obj.TYPE_NONE {
   665  				p.From = p.To
   666  			}
   667  			if copyau(&p.From, v) {
   668  				return 4
   669  			}
   670  			return 3
   671  		}
   672  
   673  		if copyau(&p.From, v) {
   674  			return 1
   675  		}
   676  		if copyau(&p.To, v) {
   677  			// p->to only indirectly uses v
   678  			return 1
   679  		}
   680  
   681  		return 0
   682  
   683  	case ppc64.AMOVBU, /* rar p->from, write p->to or read p->from, rar p->to */
   684  		ppc64.AMOVBZU,
   685  		ppc64.AMOVHU,
   686  		ppc64.AMOVHZU,
   687  		ppc64.AMOVWZU,
   688  		ppc64.AMOVDU:
   689  		if p.From.Type == obj.TYPE_MEM {
   690  			if copyas(&p.From, v) {
   691  				// No s!=nil check; need to fail
   692  				// anyway in that case
   693  				return 2
   694  			}
   695  
   696  			if s != nil {
   697  				if copysub(&p.To, v, s, 1) != 0 {
   698  					return 1
   699  				}
   700  				return 0
   701  			}
   702  
   703  			if copyas(&p.To, v) {
   704  				return 3
   705  			}
   706  		} else if p.To.Type == obj.TYPE_MEM {
   707  			if copyas(&p.To, v) {
   708  				return 2
   709  			}
   710  			if s != nil {
   711  				if copysub(&p.From, v, s, 1) != 0 {
   712  					return 1
   713  				}
   714  				return 0
   715  			}
   716  
   717  			if copyau(&p.From, v) {
   718  				return 1
   719  			}
   720  		} else {
   721  			fmt.Printf("copyu: bad %v\n", p)
   722  		}
   723  
   724  		return 0
   725  
   726  	case ppc64.ARLWMI, /* read p->from, read p->reg, rar p->to */
   727  		ppc64.ARLWMICC:
   728  		if copyas(&p.To, v) {
   729  			return 2
   730  		}
   731  		fallthrough
   732  
   733  		/* fall through */
   734  	case ppc64.AADD,
   735  		/* read p->from, read p->reg, write p->to */
   736  		ppc64.AADDC,
   737  		ppc64.AADDE,
   738  		ppc64.ASUB,
   739  		ppc64.ASLW,
   740  		ppc64.ASRW,
   741  		ppc64.ASRAW,
   742  		ppc64.ASLD,
   743  		ppc64.ASRD,
   744  		ppc64.ASRAD,
   745  		ppc64.AOR,
   746  		ppc64.AORCC,
   747  		ppc64.AORN,
   748  		ppc64.AORNCC,
   749  		ppc64.AAND,
   750  		ppc64.AANDCC,
   751  		ppc64.AANDN,
   752  		ppc64.AANDNCC,
   753  		ppc64.ANAND,
   754  		ppc64.ANANDCC,
   755  		ppc64.ANOR,
   756  		ppc64.ANORCC,
   757  		ppc64.AXOR,
   758  		ppc64.AMULHW,
   759  		ppc64.AMULHWU,
   760  		ppc64.AMULLW,
   761  		ppc64.AMULLD,
   762  		ppc64.ADIVW,
   763  		ppc64.ADIVD,
   764  		ppc64.ADIVWU,
   765  		ppc64.ADIVDU,
   766  		ppc64.AREM,
   767  		ppc64.AREMU,
   768  		ppc64.AREMD,
   769  		ppc64.AREMDU,
   770  		ppc64.ARLWNM,
   771  		ppc64.ARLWNMCC,
   772  		ppc64.AFADDS,
   773  		ppc64.AFADD,
   774  		ppc64.AFSUBS,
   775  		ppc64.AFSUB,
   776  		ppc64.AFMULS,
   777  		ppc64.AFMUL,
   778  		ppc64.AFDIVS,
   779  		ppc64.AFDIV:
   780  		if s != nil {
   781  			if copysub(&p.From, v, s, 1) != 0 {
   782  				return 1
   783  			}
   784  			if copysub1(p, v, s, 1) != 0 {
   785  				return 1
   786  			}
   787  
   788  			// Update only indirect uses of v in p->to
   789  			if !copyas(&p.To, v) {
   790  				if copysub(&p.To, v, s, 1) != 0 {
   791  					return 1
   792  				}
   793  			}
   794  			return 0
   795  		}
   796  
   797  		if copyas(&p.To, v) {
   798  			if p.Reg == 0 {
   799  				// Fix up implicit reg (e.g., ADD
   800  				// R3,R4 -> ADD R3,R4,R4) so we can
   801  				// update reg and to separately.
   802  				p.Reg = p.To.Reg
   803  			}
   804  
   805  			if copyau(&p.From, v) {
   806  				return 4
   807  			}
   808  			if copyau1(p, v) {
   809  				return 4
   810  			}
   811  			return 3
   812  		}
   813  
   814  		if copyau(&p.From, v) {
   815  			return 1
   816  		}
   817  		if copyau1(p, v) {
   818  			return 1
   819  		}
   820  		if copyau(&p.To, v) {
   821  			return 1
   822  		}
   823  		return 0
   824  
   825  	case ppc64.ABEQ,
   826  		ppc64.ABGT,
   827  		ppc64.ABGE,
   828  		ppc64.ABLT,
   829  		ppc64.ABLE,
   830  		ppc64.ABNE,
   831  		ppc64.ABVC,
   832  		ppc64.ABVS:
   833  		return 0
   834  
   835  	case obj.ACHECKNIL, /* read p->from */
   836  		ppc64.ACMP, /* read p->from, read p->to */
   837  		ppc64.ACMPU,
   838  		ppc64.ACMPW,
   839  		ppc64.ACMPWU,
   840  		ppc64.AFCMPO,
   841  		ppc64.AFCMPU:
   842  		if s != nil {
   843  			if copysub(&p.From, v, s, 1) != 0 {
   844  				return 1
   845  			}
   846  			return copysub(&p.To, v, s, 1)
   847  		}
   848  
   849  		if copyau(&p.From, v) {
   850  			return 1
   851  		}
   852  		if copyau(&p.To, v) {
   853  			return 1
   854  		}
   855  		return 0
   856  
   857  		// 9g never generates a branch to a GPR (this isn't
   858  	// even a normal instruction; liblink turns it in to a
   859  	// mov and a branch).
   860  	case ppc64.ABR: /* read p->to */
   861  		if s != nil {
   862  			if copysub(&p.To, v, s, 1) != 0 {
   863  				return 1
   864  			}
   865  			return 0
   866  		}
   867  
   868  		if copyau(&p.To, v) {
   869  			return 1
   870  		}
   871  		return 0
   872  
   873  	case obj.ARET: /* funny */
   874  		if s != nil {
   875  			return 0
   876  		}
   877  
   878  		// All registers die at this point, so claim
   879  		// everything is set (and not used).
   880  		return 3
   881  
   882  	case ppc64.ABL: /* funny */
   883  		if v.Type == obj.TYPE_REG {
   884  			// TODO(rsc): REG_R0 and REG_F0 used to be
   885  			// (when register numbers started at 0) exregoffset and exfregoffset,
   886  			// which are unset entirely.
   887  			// It's strange that this handles R0 and F0 differently from the other
   888  			// registers. Possible failure to optimize?
   889  			if ppc64.REG_R0 < v.Reg && v.Reg <= ppc64.REGEXT {
   890  				return 2
   891  			}
   892  			if v.Reg == ppc64.REGARG {
   893  				return 2
   894  			}
   895  			if ppc64.REG_F0 < v.Reg && v.Reg <= ppc64.FREGEXT {
   896  				return 2
   897  			}
   898  		}
   899  
   900  		if p.From.Type == obj.TYPE_REG && v.Type == obj.TYPE_REG && p.From.Reg == v.Reg {
   901  			return 2
   902  		}
   903  
   904  		if s != nil {
   905  			if copysub(&p.To, v, s, 1) != 0 {
   906  				return 1
   907  			}
   908  			return 0
   909  		}
   910  
   911  		if copyau(&p.To, v) {
   912  			return 4
   913  		}
   914  		return 3
   915  
   916  		// R0 is zero, used by DUFFZERO, cannot be substituted.
   917  	// R3 is ptr to memory, used and set, cannot be substituted.
   918  	case obj.ADUFFZERO:
   919  		if v.Type == obj.TYPE_REG {
   920  			if v.Reg == 0 {
   921  				return 1
   922  			}
   923  			if v.Reg == 3 {
   924  				return 2
   925  			}
   926  		}
   927  
   928  		return 0
   929  
   930  		// R3, R4 are ptr to src, dst, used and set, cannot be substituted.
   931  	// R5 is scratch, set by DUFFCOPY, cannot be substituted.
   932  	case obj.ADUFFCOPY:
   933  		if v.Type == obj.TYPE_REG {
   934  			if v.Reg == 3 || v.Reg == 4 {
   935  				return 2
   936  			}
   937  			if v.Reg == 5 {
   938  				return 3
   939  			}
   940  		}
   941  
   942  		return 0
   943  
   944  	case obj.ATEXT: /* funny */
   945  		if v.Type == obj.TYPE_REG {
   946  			if v.Reg == ppc64.REGARG {
   947  				return 3
   948  			}
   949  		}
   950  		return 0
   951  
   952  	case obj.APCDATA,
   953  		obj.AFUNCDATA,
   954  		obj.AVARDEF,
   955  		obj.AVARKILL:
   956  		return 0
   957  	}
   958  }
   959  
   960  // copyas returns 1 if a and v address the same register.
   961  //
   962  // If a is the from operand, this means this operation reads the
   963  // register in v.  If a is the to operand, this means this operation
   964  // writes the register in v.
   965  func copyas(a *obj.Addr, v *obj.Addr) bool {
   966  	if regtyp(v) {
   967  		if a.Type == v.Type {
   968  			if a.Reg == v.Reg {
   969  				return true
   970  			}
   971  		}
   972  	}
   973  	return false
   974  }
   975  
   976  // copyau returns 1 if a either directly or indirectly addresses the
   977  // same register as v.
   978  //
   979  // If a is the from operand, this means this operation reads the
   980  // register in v.  If a is the to operand, this means the operation
   981  // either reads or writes the register in v (if !copyas(a, v), then
   982  // the operation reads the register in v).
   983  func copyau(a *obj.Addr, v *obj.Addr) bool {
   984  	if copyas(a, v) {
   985  		return true
   986  	}
   987  	if v.Type == obj.TYPE_REG {
   988  		if a.Type == obj.TYPE_MEM || (a.Type == obj.TYPE_ADDR && a.Reg != 0) {
   989  			if v.Reg == a.Reg {
   990  				return true
   991  			}
   992  		}
   993  	}
   994  	return false
   995  }
   996  
   997  // copyau1 returns 1 if p->reg references the same register as v and v
   998  // is a direct reference.
   999  func copyau1(p *obj.Prog, v *obj.Addr) bool {
  1000  	if regtyp(v) && v.Reg != 0 {
  1001  		if p.Reg == v.Reg {
  1002  			return true
  1003  		}
  1004  	}
  1005  	return false
  1006  }
  1007  
  1008  // copysub replaces v with s in a if f!=0 or indicates it if could if f==0.
  1009  // Returns 1 on failure to substitute (it always succeeds on ppc64).
  1010  func copysub(a *obj.Addr, v *obj.Addr, s *obj.Addr, f int) int {
  1011  	if f != 0 {
  1012  		if copyau(a, v) {
  1013  			a.Reg = s.Reg
  1014  		}
  1015  	}
  1016  	return 0
  1017  }
  1018  
  1019  // copysub1 replaces v with s in p1->reg if f!=0 or indicates if it could if f==0.
  1020  // Returns 1 on failure to substitute (it always succeeds on ppc64).
  1021  func copysub1(p1 *obj.Prog, v *obj.Addr, s *obj.Addr, f int) int {
  1022  	if f != 0 {
  1023  		if copyau1(p1, v) {
  1024  			p1.Reg = s.Reg
  1025  		}
  1026  	}
  1027  	return 0
  1028  }
  1029  
  1030  func sameaddr(a *obj.Addr, v *obj.Addr) bool {
  1031  	if a.Type != v.Type {
  1032  		return false
  1033  	}
  1034  	if regtyp(v) && a.Reg == v.Reg {
  1035  		return true
  1036  	}
  1037  	if v.Type == obj.NAME_AUTO || v.Type == obj.NAME_PARAM {
  1038  		if v.Offset == a.Offset {
  1039  			return true
  1040  		}
  1041  	}
  1042  	return false
  1043  }
  1044  
  1045  func smallindir(a *obj.Addr, reg *obj.Addr) bool {
  1046  	return reg.Type == obj.TYPE_REG && a.Type == obj.TYPE_MEM && a.Reg == reg.Reg && 0 <= a.Offset && a.Offset < 4096
  1047  }
  1048  
  1049  func stackaddr(a *obj.Addr) bool {
  1050  	return a.Type == obj.TYPE_REG && a.Reg == ppc64.REGSP
  1051  }