github.com/x04/go/src@v0.0.0-20200202162449-3d481ceb3525/runtime/mkpreempt.go (about)

     1  // Copyright 2019 The Go Authors. All rights reserved.
     2  // Use of this source code is governed by a BSD-style
     3  // license that can be found in the LICENSE file.
     4  
     5  // +build ignore
     6  
     7  // mkpreempt generates the asyncPreempt functions for each
     8  // architecture.
     9  package main
    10  
    11  import (
    12  	"github.com/x04/go/src/flag"
    13  	"github.com/x04/go/src/fmt"
    14  	"github.com/x04/go/src/io"
    15  	"github.com/x04/go/src/log"
    16  	"github.com/x04/go/src/os"
    17  	"github.com/x04/go/src/strings"
    18  )
    19  
    20  // Copied from cmd/compile/internal/ssa/gen/*Ops.go
    21  
    22  var regNames386 = []string{
    23  	"AX",
    24  	"CX",
    25  	"DX",
    26  	"BX",
    27  	"SP",
    28  	"BP",
    29  	"SI",
    30  	"DI",
    31  	"X0",
    32  	"X1",
    33  	"X2",
    34  	"X3",
    35  	"X4",
    36  	"X5",
    37  	"X6",
    38  	"X7",
    39  }
    40  
    41  var regNamesAMD64 = []string{
    42  	"AX",
    43  	"CX",
    44  	"DX",
    45  	"BX",
    46  	"SP",
    47  	"BP",
    48  	"SI",
    49  	"DI",
    50  	"R8",
    51  	"R9",
    52  	"R10",
    53  	"R11",
    54  	"R12",
    55  	"R13",
    56  	"R14",
    57  	"R15",
    58  	"X0",
    59  	"X1",
    60  	"X2",
    61  	"X3",
    62  	"X4",
    63  	"X5",
    64  	"X6",
    65  	"X7",
    66  	"X8",
    67  	"X9",
    68  	"X10",
    69  	"X11",
    70  	"X12",
    71  	"X13",
    72  	"X14",
    73  	"X15",
    74  }
    75  
    76  var out io.Writer
    77  
    78  var arches = map[string]func(){
    79  	"386":		gen386,
    80  	"amd64":	genAMD64,
    81  	"arm":		genARM,
    82  	"arm64":	genARM64,
    83  	"mips64x":	func() { genMIPS(true) },
    84  	"mipsx":	func() { genMIPS(false) },
    85  	"ppc64x":	genPPC64,
    86  	"riscv64":	genRISCV64,
    87  	"s390x":	genS390X,
    88  	"wasm":		genWasm,
    89  }
    90  var beLe = map[string]bool{"mips64x": true, "mipsx": true, "ppc64x": true}
    91  
    92  func main() {
    93  	flag.Parse()
    94  	if flag.NArg() > 0 {
    95  		out = os.Stdout
    96  		for _, arch := range flag.Args() {
    97  			gen, ok := arches[arch]
    98  			if !ok {
    99  				log.Fatalf("unknown arch %s", arch)
   100  			}
   101  			header(arch)
   102  			gen()
   103  		}
   104  		return
   105  	}
   106  
   107  	for arch, gen := range arches {
   108  		f, err := os.Create(fmt.Sprintf("preempt_%s.s", arch))
   109  		if err != nil {
   110  			log.Fatal(err)
   111  		}
   112  		out = f
   113  		header(arch)
   114  		gen()
   115  		if err := f.Close(); err != nil {
   116  			log.Fatal(err)
   117  		}
   118  	}
   119  }
   120  
   121  func header(arch string) {
   122  	fmt.Fprintf(out, "// Code generated by mkpreempt.go; DO NOT EDIT.\n\n")
   123  	if beLe[arch] {
   124  		base := arch[:len(arch)-1]
   125  		fmt.Fprintf(out, "// +build %s %sle\n\n", base, base)
   126  	}
   127  	fmt.Fprintf(out, "#include \"go_asm.h\"\n")
   128  	fmt.Fprintf(out, "#include \"textflag.h\"\n\n")
   129  	fmt.Fprintf(out, "TEXT ·asyncPreempt(SB),NOSPLIT|NOFRAME,$0-0\n")
   130  }
   131  
   132  func p(f string, args ...interface{}) {
   133  	fmted := fmt.Sprintf(f, args...)
   134  	fmt.Fprintf(out, "\t%s\n", strings.Replace(fmted, "\n", "\n\t", -1))
   135  }
   136  
   137  func label(l string) {
   138  	fmt.Fprintf(out, "%s\n", l)
   139  }
   140  
   141  type layout struct {
   142  	stack	int
   143  	regs	[]regPos
   144  	sp	string	// stack pointer register
   145  }
   146  
   147  type regPos struct {
   148  	pos	int
   149  
   150  	op	string
   151  	reg	string
   152  
   153  	// If this register requires special save and restore, these
   154  	// give those operations with a %d placeholder for the stack
   155  	// offset.
   156  	save, restore	string
   157  }
   158  
   159  func (l *layout) add(op, reg string, size int) {
   160  	l.regs = append(l.regs, regPos{op: op, reg: reg, pos: l.stack})
   161  	l.stack += size
   162  }
   163  
   164  func (l *layout) addSpecial(save, restore string, size int) {
   165  	l.regs = append(l.regs, regPos{save: save, restore: restore, pos: l.stack})
   166  	l.stack += size
   167  }
   168  
   169  func (l *layout) save() {
   170  	for _, reg := range l.regs {
   171  		if reg.save != "" {
   172  			p(reg.save, reg.pos)
   173  		} else {
   174  			p("%s %s, %d(%s)", reg.op, reg.reg, reg.pos, l.sp)
   175  		}
   176  	}
   177  }
   178  
   179  func (l *layout) restore() {
   180  	for i := len(l.regs) - 1; i >= 0; i-- {
   181  		reg := l.regs[i]
   182  		if reg.restore != "" {
   183  			p(reg.restore, reg.pos)
   184  		} else {
   185  			p("%s %d(%s), %s", reg.op, reg.pos, l.sp, reg.reg)
   186  		}
   187  	}
   188  }
   189  
   190  func gen386() {
   191  	p("PUSHFL")
   192  
   193  	// Save general purpose registers.
   194  	var l = layout{sp: "SP"}
   195  	for _, reg := range regNames386 {
   196  		if reg == "SP" || strings.HasPrefix(reg, "X") {
   197  			continue
   198  		}
   199  		l.add("MOVL", reg, 4)
   200  	}
   201  
   202  	// Save the 387 state.
   203  	l.addSpecial(
   204  		"FSAVE %d(SP)\nFLDCW runtime·controlWord64(SB)",
   205  		"FRSTOR %d(SP)",
   206  		108)
   207  
   208  	// Save SSE state only if supported.
   209  	lSSE := layout{stack: l.stack, sp: "SP"}
   210  	for i := 0; i < 8; i++ {
   211  		lSSE.add("MOVUPS", fmt.Sprintf("X%d", i), 16)
   212  	}
   213  
   214  	p("ADJSP $%d", lSSE.stack)
   215  	p("NOP SP")
   216  	l.save()
   217  	p("CMPB internal∕cpu·X86+const_offsetX86HasSSE2(SB), $1\nJNE nosse")
   218  	lSSE.save()
   219  	label("nosse:")
   220  	p("CALL ·asyncPreempt2(SB)")
   221  	p("CMPB internal∕cpu·X86+const_offsetX86HasSSE2(SB), $1\nJNE nosse2")
   222  	lSSE.restore()
   223  	label("nosse2:")
   224  	l.restore()
   225  	p("ADJSP $%d", -lSSE.stack)
   226  
   227  	p("POPFL")
   228  	p("RET")
   229  }
   230  
   231  func genAMD64() {
   232  	// Assign stack offsets.
   233  	var l = layout{sp: "SP"}
   234  	for _, reg := range regNamesAMD64 {
   235  		if reg == "SP" || reg == "BP" {
   236  			continue
   237  		}
   238  		if strings.HasPrefix(reg, "X") {
   239  			l.add("MOVUPS", reg, 16)
   240  		} else {
   241  			l.add("MOVQ", reg, 8)
   242  		}
   243  	}
   244  
   245  	// TODO: MXCSR register?
   246  
   247  	p("PUSHQ BP")
   248  	p("MOVQ SP, BP")
   249  	p("// Save flags before clobbering them")
   250  	p("PUSHFQ")
   251  	p("// obj doesn't understand ADD/SUB on SP, but does understand ADJSP")
   252  	p("ADJSP $%d", l.stack)
   253  	p("// But vet doesn't know ADJSP, so suppress vet stack checking")
   254  	p("NOP SP")
   255  	l.save()
   256  	p("CALL ·asyncPreempt2(SB)")
   257  	l.restore()
   258  	p("ADJSP $%d", -l.stack)
   259  	p("POPFQ")
   260  	p("POPQ BP")
   261  	p("RET")
   262  }
   263  
   264  func genARM() {
   265  	// Add integer registers R0-R12.
   266  	// R13 (SP), R14 (LR), R15 (PC) are special and not saved here.
   267  	var l = layout{sp: "R13", stack: 4}	// add LR slot
   268  	for i := 0; i <= 12; i++ {
   269  		reg := fmt.Sprintf("R%d", i)
   270  		if i == 10 {
   271  			continue	// R10 is g register, no need to save/restore
   272  		}
   273  		l.add("MOVW", reg, 4)
   274  	}
   275  	// Add flag register.
   276  	l.addSpecial(
   277  		"MOVW CPSR, R0\nMOVW R0, %d(R13)",
   278  		"MOVW %d(R13), R0\nMOVW R0, CPSR",
   279  		4)
   280  
   281  	// Add floating point registers F0-F15 and flag register.
   282  	var lfp = layout{stack: l.stack, sp: "R13"}
   283  	lfp.addSpecial(
   284  		"MOVW FPCR, R0\nMOVW R0, %d(R13)",
   285  		"MOVW %d(R13), R0\nMOVW R0, FPCR",
   286  		4)
   287  	for i := 0; i <= 15; i++ {
   288  		reg := fmt.Sprintf("F%d", i)
   289  		lfp.add("MOVD", reg, 8)
   290  	}
   291  
   292  	p("MOVW.W R14, -%d(R13)", lfp.stack)	// allocate frame, save LR
   293  	l.save()
   294  	p("MOVB ·goarm(SB), R0\nCMP $6, R0\nBLT nofp")	// test goarm, and skip FP registers if goarm=5.
   295  	lfp.save()
   296  	label("nofp:")
   297  	p("CALL ·asyncPreempt2(SB)")
   298  	p("MOVB ·goarm(SB), R0\nCMP $6, R0\nBLT nofp2")	// test goarm, and skip FP registers if goarm=5.
   299  	lfp.restore()
   300  	label("nofp2:")
   301  	l.restore()
   302  
   303  	p("MOVW %d(R13), R14", lfp.stack)	// sigctxt.pushCall pushes LR on stack, restore it
   304  	p("MOVW.P %d(R13), R15", lfp.stack+4)	// load PC, pop frame (including the space pushed by sigctxt.pushCall)
   305  	p("UNDEF")				// shouldn't get here
   306  }
   307  
   308  func genARM64() {
   309  	// Add integer registers R0-R26
   310  	// R27 (REGTMP), R28 (g), R29 (FP), R30 (LR), R31 (SP) are special
   311  	// and not saved here.
   312  	var l = layout{sp: "RSP", stack: 8}	// add slot to save PC of interrupted instruction
   313  	for i := 0; i <= 26; i++ {
   314  		if i == 18 {
   315  			continue	// R18 is not used, skip
   316  		}
   317  		reg := fmt.Sprintf("R%d", i)
   318  		l.add("MOVD", reg, 8)
   319  	}
   320  	// Add flag registers.
   321  	l.addSpecial(
   322  		"MOVD NZCV, R0\nMOVD R0, %d(RSP)",
   323  		"MOVD %d(RSP), R0\nMOVD R0, NZCV",
   324  		8)
   325  	l.addSpecial(
   326  		"MOVD FPSR, R0\nMOVD R0, %d(RSP)",
   327  		"MOVD %d(RSP), R0\nMOVD R0, FPSR",
   328  		8)
   329  	// TODO: FPCR? I don't think we'll change it, so no need to save.
   330  	// Add floating point registers F0-F31.
   331  	for i := 0; i <= 31; i++ {
   332  		reg := fmt.Sprintf("F%d", i)
   333  		l.add("FMOVD", reg, 8)
   334  	}
   335  	if l.stack%16 != 0 {
   336  		l.stack += 8	// SP needs 16-byte alignment
   337  	}
   338  
   339  	// allocate frame, save PC of interrupted instruction (in LR)
   340  	p("MOVD R30, %d(RSP)", -l.stack)
   341  	p("SUB $%d, RSP", l.stack)
   342  	p("#ifdef GOOS_linux")
   343  	p("MOVD R29, -8(RSP)")	// save frame pointer (only used on Linux)
   344  	p("SUB $8, RSP, R29")	// set up new frame pointer
   345  	p("#endif")
   346  	// On darwin, save the LR again after decrementing SP. We run the
   347  	// signal handler on the G stack (as it doesn't support SA_ONSTACK),
   348  	// so any writes below SP may be clobbered.
   349  	p("#ifdef GOOS_darwin")
   350  	p("MOVD R30, (RSP)")
   351  	p("#endif")
   352  
   353  	l.save()
   354  	p("CALL ·asyncPreempt2(SB)")
   355  	l.restore()
   356  
   357  	p("MOVD %d(RSP), R30", l.stack)	// sigctxt.pushCall has pushed LR (at interrupt) on stack, restore it
   358  	p("#ifdef GOOS_linux")
   359  	p("MOVD -8(RSP), R29")	// restore frame pointer
   360  	p("#endif")
   361  	p("MOVD (RSP), R27")		// load PC to REGTMP
   362  	p("ADD $%d, RSP", l.stack+16)	// pop frame (including the space pushed by sigctxt.pushCall)
   363  	p("JMP (R27)")
   364  }
   365  
   366  func genMIPS(_64bit bool) {
   367  	mov := "MOVW"
   368  	movf := "MOVF"
   369  	add := "ADD"
   370  	sub := "SUB"
   371  	r28 := "R28"
   372  	regsize := 4
   373  	if _64bit {
   374  		mov = "MOVV"
   375  		movf = "MOVD"
   376  		add = "ADDV"
   377  		sub = "SUBV"
   378  		r28 = "RSB"
   379  		regsize = 8
   380  	}
   381  
   382  	// Add integer registers R1-R22, R24-R25, R28
   383  	// R0 (zero), R23 (REGTMP), R29 (SP), R30 (g), R31 (LR) are special,
   384  	// and not saved here. R26 and R27 are reserved by kernel and not used.
   385  	var l = layout{sp: "R29", stack: regsize}	// add slot to save PC of interrupted instruction (in LR)
   386  	for i := 1; i <= 25; i++ {
   387  		if i == 23 {
   388  			continue	// R23 is REGTMP
   389  		}
   390  		reg := fmt.Sprintf("R%d", i)
   391  		l.add(mov, reg, regsize)
   392  	}
   393  	l.add(mov, r28, regsize)
   394  	l.addSpecial(
   395  		mov+" HI, R1\n"+mov+" R1, %d(R29)",
   396  		mov+" %d(R29), R1\n"+mov+" R1, HI",
   397  		regsize)
   398  	l.addSpecial(
   399  		mov+" LO, R1\n"+mov+" R1, %d(R29)",
   400  		mov+" %d(R29), R1\n"+mov+" R1, LO",
   401  		regsize)
   402  	// Add floating point control/status register FCR31 (FCR0-FCR30 are irrelevant)
   403  	l.addSpecial(
   404  		mov+" FCR31, R1\n"+mov+" R1, %d(R29)",
   405  		mov+" %d(R29), R1\n"+mov+" R1, FCR31",
   406  		regsize)
   407  	// Add floating point registers F0-F31.
   408  	for i := 0; i <= 31; i++ {
   409  		reg := fmt.Sprintf("F%d", i)
   410  		l.add(movf, reg, regsize)
   411  	}
   412  
   413  	// allocate frame, save PC of interrupted instruction (in LR)
   414  	p(mov+" R31, -%d(R29)", l.stack)
   415  	p(sub+" $%d, R29", l.stack)
   416  
   417  	l.save()
   418  	p("CALL ·asyncPreempt2(SB)")
   419  	l.restore()
   420  
   421  	p(mov+" %d(R29), R31", l.stack)		// sigctxt.pushCall has pushed LR (at interrupt) on stack, restore it
   422  	p(mov + " (R29), R23")			// load PC to REGTMP
   423  	p(add+" $%d, R29", l.stack+regsize)	// pop frame (including the space pushed by sigctxt.pushCall)
   424  	p("JMP (R23)")
   425  }
   426  
   427  func genPPC64() {
   428  	// Add integer registers R3-R29
   429  	// R0 (zero), R1 (SP), R30 (g) are special and not saved here.
   430  	// R2 (TOC pointer in PIC mode), R12 (function entry address in PIC mode) have been saved in sigctxt.pushCall.
   431  	// R31 (REGTMP) will be saved manually.
   432  	var l = layout{sp: "R1", stack: 32 + 8}	// MinFrameSize on PPC64, plus one word for saving R31
   433  	for i := 3; i <= 29; i++ {
   434  		if i == 12 || i == 13 {
   435  			// R12 has been saved in sigctxt.pushCall.
   436  			// R13 is TLS pointer, not used by Go code. we must NOT
   437  			// restore it, otherwise if we parked and resumed on a
   438  			// different thread we'll mess up TLS addresses.
   439  			continue
   440  		}
   441  		reg := fmt.Sprintf("R%d", i)
   442  		l.add("MOVD", reg, 8)
   443  	}
   444  	l.addSpecial(
   445  		"MOVW CR, R31\nMOVW R31, %d(R1)",
   446  		"MOVW %d(R1), R31\nMOVFL R31, $0xff",	// this is MOVW R31, CR
   447  		8)					// CR is 4-byte wide, but just keep the alignment
   448  	l.addSpecial(
   449  		"MOVD XER, R31\nMOVD R31, %d(R1)",
   450  		"MOVD %d(R1), R31\nMOVD R31, XER",
   451  		8)
   452  	// Add floating point registers F0-F31.
   453  	for i := 0; i <= 31; i++ {
   454  		reg := fmt.Sprintf("F%d", i)
   455  		l.add("FMOVD", reg, 8)
   456  	}
   457  	// Add floating point control/status register FPSCR.
   458  	l.addSpecial(
   459  		"MOVFL FPSCR, F0\nFMOVD F0, %d(R1)",
   460  		"FMOVD %d(R1), F0\nMOVFL F0, FPSCR",
   461  		8)
   462  
   463  	p("MOVD R31, -%d(R1)", l.stack-32)	// save R31 first, we'll use R31 for saving LR
   464  	p("MOVD LR, R31")
   465  	p("MOVDU R31, -%d(R1)", l.stack)	// allocate frame, save PC of interrupted instruction (in LR)
   466  
   467  	l.save()
   468  	p("CALL ·asyncPreempt2(SB)")
   469  	l.restore()
   470  
   471  	p("MOVD %d(R1), R31", l.stack)	// sigctxt.pushCall has pushed LR, R2, R12 (at interrupt) on stack, restore them
   472  	p("MOVD R31, LR")
   473  	p("MOVD %d(R1), R2", l.stack+8)
   474  	p("MOVD %d(R1), R12", l.stack+16)
   475  	p("MOVD (R1), R31")	// load PC to CTR
   476  	p("MOVD R31, CTR")
   477  	p("MOVD 32(R1), R31")		// restore R31
   478  	p("ADD $%d, R1", l.stack+32)	// pop frame (including the space pushed by sigctxt.pushCall)
   479  	p("JMP (CTR)")
   480  }
   481  
   482  func genRISCV64() {
   483  	p("// No async preemption on riscv64 - see issue 36711")
   484  	p("UNDEF")
   485  }
   486  
   487  func genS390X() {
   488  	// Add integer registers R0-R12
   489  	// R13 (g), R14 (LR), R15 (SP) are special, and not saved here.
   490  	// Saving R10 (REGTMP) is not necessary, but it is saved anyway.
   491  	var l = layout{sp: "R15", stack: 16}	// add slot to save PC of interrupted instruction and flags
   492  	l.addSpecial(
   493  		"STMG R0, R12, %d(R15)",
   494  		"LMG %d(R15), R0, R12",
   495  		13*8)
   496  	// Add floating point registers F0-F31.
   497  	for i := 0; i <= 15; i++ {
   498  		reg := fmt.Sprintf("F%d", i)
   499  		l.add("FMOVD", reg, 8)
   500  	}
   501  
   502  	// allocate frame, save PC of interrupted instruction (in LR) and flags (condition code)
   503  	p("IPM R10")	// save flags upfront, as ADD will clobber flags
   504  	p("MOVD R14, -%d(R15)", l.stack)
   505  	p("ADD $-%d, R15", l.stack)
   506  	p("MOVW R10, 8(R15)")	// save flags
   507  
   508  	l.save()
   509  	p("CALL ·asyncPreempt2(SB)")
   510  	l.restore()
   511  
   512  	p("MOVD %d(R15), R14", l.stack)		// sigctxt.pushCall has pushed LR (at interrupt) on stack, restore it
   513  	p("ADD $%d, R15", l.stack+8)		// pop frame (including the space pushed by sigctxt.pushCall)
   514  	p("MOVWZ -%d(R15), R10", l.stack)	// load flags to REGTMP
   515  	p("TMLH R10, $(3<<12)")			// restore flags
   516  	p("MOVD -%d(R15), R10", l.stack+8)	// load PC to REGTMP
   517  	p("JMP (R10)")
   518  }
   519  
   520  func genWasm() {
   521  	p("// No async preemption on wasm")
   522  	p("UNDEF")
   523  }
   524  
   525  func notImplemented() {
   526  	p("// Not implemented yet")
   527  	p("JMP ·abort(SB)")
   528  }