github.com/likebike/go--@v0.0.0-20190911215757-0bd925d16e96/go/src/runtime/softfloat64.go (about)

     1  // Copyright 2010 The Go Authors. All rights reserved.
     2  // Use of this source code is governed by a BSD-style
     3  // license that can be found in the LICENSE file.
     4  
     5  // Software IEEE754 64-bit floating point.
     6  // Only referred to (and thus linked in) by arm port
     7  // and by tests in this directory.
     8  
     9  package runtime
    10  
    11  const (
    12  	mantbits64 uint = 52
    13  	expbits64  uint = 11
    14  	bias64          = -1<<(expbits64-1) + 1
    15  
    16  	nan64 uint64 = (1<<expbits64-1)<<mantbits64 + 1
    17  	inf64 uint64 = (1<<expbits64 - 1) << mantbits64
    18  	neg64 uint64 = 1 << (expbits64 + mantbits64)
    19  
    20  	mantbits32 uint = 23
    21  	expbits32  uint = 8
    22  	bias32          = -1<<(expbits32-1) + 1
    23  
    24  	nan32 uint32 = (1<<expbits32-1)<<mantbits32 + 1
    25  	inf32 uint32 = (1<<expbits32 - 1) << mantbits32
    26  	neg32 uint32 = 1 << (expbits32 + mantbits32)
    27  )
    28  
    29  func funpack64(f uint64) (sign, mant uint64, exp int, inf, nan bool) {
    30  	sign = f & (1 << (mantbits64 + expbits64))
    31  	mant = f & (1<<mantbits64 - 1)
    32  	exp = int(f>>mantbits64) & (1<<expbits64 - 1)
    33  
    34  	switch exp {
    35  	case 1<<expbits64 - 1:
    36  		if mant != 0 {
    37  			nan = true
    38  			return
    39  		}
    40  		inf = true
    41  		return
    42  
    43  	case 0:
    44  		// denormalized
    45  		if mant != 0 {
    46  			exp += bias64 + 1
    47  			for mant < 1<<mantbits64 {
    48  				mant <<= 1
    49  				exp--
    50  			}
    51  		}
    52  
    53  	default:
    54  		// add implicit top bit
    55  		mant |= 1 << mantbits64
    56  		exp += bias64
    57  	}
    58  	return
    59  }
    60  
    61  func funpack32(f uint32) (sign, mant uint32, exp int, inf, nan bool) {
    62  	sign = f & (1 << (mantbits32 + expbits32))
    63  	mant = f & (1<<mantbits32 - 1)
    64  	exp = int(f>>mantbits32) & (1<<expbits32 - 1)
    65  
    66  	switch exp {
    67  	case 1<<expbits32 - 1:
    68  		if mant != 0 {
    69  			nan = true
    70  			return
    71  		}
    72  		inf = true
    73  		return
    74  
    75  	case 0:
    76  		// denormalized
    77  		if mant != 0 {
    78  			exp += bias32 + 1
    79  			for mant < 1<<mantbits32 {
    80  				mant <<= 1
    81  				exp--
    82  			}
    83  		}
    84  
    85  	default:
    86  		// add implicit top bit
    87  		mant |= 1 << mantbits32
    88  		exp += bias32
    89  	}
    90  	return
    91  }
    92  
    93  func fpack64(sign, mant uint64, exp int, trunc uint64) uint64 {
    94  	mant0, exp0, trunc0 := mant, exp, trunc
    95  	if mant == 0 {
    96  		return sign
    97  	}
    98  	for mant < 1<<mantbits64 {
    99  		mant <<= 1
   100  		exp--
   101  	}
   102  	for mant >= 4<<mantbits64 {
   103  		trunc |= mant & 1
   104  		mant >>= 1
   105  		exp++
   106  	}
   107  	if mant >= 2<<mantbits64 {
   108  		if mant&1 != 0 && (trunc != 0 || mant&2 != 0) {
   109  			mant++
   110  			if mant >= 4<<mantbits64 {
   111  				mant >>= 1
   112  				exp++
   113  			}
   114  		}
   115  		mant >>= 1
   116  		exp++
   117  	}
   118  	if exp >= 1<<expbits64-1+bias64 {
   119  		return sign ^ inf64
   120  	}
   121  	if exp < bias64+1 {
   122  		if exp < bias64-int(mantbits64) {
   123  			return sign | 0
   124  		}
   125  		// repeat expecting denormal
   126  		mant, exp, trunc = mant0, exp0, trunc0
   127  		for exp < bias64 {
   128  			trunc |= mant & 1
   129  			mant >>= 1
   130  			exp++
   131  		}
   132  		if mant&1 != 0 && (trunc != 0 || mant&2 != 0) {
   133  			mant++
   134  		}
   135  		mant >>= 1
   136  		exp++
   137  		if mant < 1<<mantbits64 {
   138  			return sign | mant
   139  		}
   140  	}
   141  	return sign | uint64(exp-bias64)<<mantbits64 | mant&(1<<mantbits64-1)
   142  }
   143  
   144  func fpack32(sign, mant uint32, exp int, trunc uint32) uint32 {
   145  	mant0, exp0, trunc0 := mant, exp, trunc
   146  	if mant == 0 {
   147  		return sign
   148  	}
   149  	for mant < 1<<mantbits32 {
   150  		mant <<= 1
   151  		exp--
   152  	}
   153  	for mant >= 4<<mantbits32 {
   154  		trunc |= mant & 1
   155  		mant >>= 1
   156  		exp++
   157  	}
   158  	if mant >= 2<<mantbits32 {
   159  		if mant&1 != 0 && (trunc != 0 || mant&2 != 0) {
   160  			mant++
   161  			if mant >= 4<<mantbits32 {
   162  				mant >>= 1
   163  				exp++
   164  			}
   165  		}
   166  		mant >>= 1
   167  		exp++
   168  	}
   169  	if exp >= 1<<expbits32-1+bias32 {
   170  		return sign ^ inf32
   171  	}
   172  	if exp < bias32+1 {
   173  		if exp < bias32-int(mantbits32) {
   174  			return sign | 0
   175  		}
   176  		// repeat expecting denormal
   177  		mant, exp, trunc = mant0, exp0, trunc0
   178  		for exp < bias32 {
   179  			trunc |= mant & 1
   180  			mant >>= 1
   181  			exp++
   182  		}
   183  		if mant&1 != 0 && (trunc != 0 || mant&2 != 0) {
   184  			mant++
   185  		}
   186  		mant >>= 1
   187  		exp++
   188  		if mant < 1<<mantbits32 {
   189  			return sign | mant
   190  		}
   191  	}
   192  	return sign | uint32(exp-bias32)<<mantbits32 | mant&(1<<mantbits32-1)
   193  }
   194  
   195  func fadd64(f, g uint64) uint64 {
   196  	fs, fm, fe, fi, fn := funpack64(f)
   197  	gs, gm, ge, gi, gn := funpack64(g)
   198  
   199  	// Special cases.
   200  	switch {
   201  	case fn || gn: // NaN + x or x + NaN = NaN
   202  		return nan64
   203  
   204  	case fi && gi && fs != gs: // +Inf + -Inf or -Inf + +Inf = NaN
   205  		return nan64
   206  
   207  	case fi: // ±Inf + g = ±Inf
   208  		return f
   209  
   210  	case gi: // f + ±Inf = ±Inf
   211  		return g
   212  
   213  	case fm == 0 && gm == 0 && fs != 0 && gs != 0: // -0 + -0 = -0
   214  		return f
   215  
   216  	case fm == 0: // 0 + g = g but 0 + -0 = +0
   217  		if gm == 0 {
   218  			g ^= gs
   219  		}
   220  		return g
   221  
   222  	case gm == 0: // f + 0 = f
   223  		return f
   224  
   225  	}
   226  
   227  	if fe < ge || fe == ge && fm < gm {
   228  		f, g, fs, fm, fe, gs, gm, ge = g, f, gs, gm, ge, fs, fm, fe
   229  	}
   230  
   231  	shift := uint(fe - ge)
   232  	fm <<= 2
   233  	gm <<= 2
   234  	trunc := gm & (1<<shift - 1)
   235  	gm >>= shift
   236  	if fs == gs {
   237  		fm += gm
   238  	} else {
   239  		fm -= gm
   240  		if trunc != 0 {
   241  			fm--
   242  		}
   243  	}
   244  	if fm == 0 {
   245  		fs = 0
   246  	}
   247  	return fpack64(fs, fm, fe-2, trunc)
   248  }
   249  
   250  func fsub64(f, g uint64) uint64 {
   251  	return fadd64(f, fneg64(g))
   252  }
   253  
   254  func fneg64(f uint64) uint64 {
   255  	return f ^ (1 << (mantbits64 + expbits64))
   256  }
   257  
   258  func fmul64(f, g uint64) uint64 {
   259  	fs, fm, fe, fi, fn := funpack64(f)
   260  	gs, gm, ge, gi, gn := funpack64(g)
   261  
   262  	// Special cases.
   263  	switch {
   264  	case fn || gn: // NaN * g or f * NaN = NaN
   265  		return nan64
   266  
   267  	case fi && gi: // Inf * Inf = Inf (with sign adjusted)
   268  		return f ^ gs
   269  
   270  	case fi && gm == 0, fm == 0 && gi: // 0 * Inf = Inf * 0 = NaN
   271  		return nan64
   272  
   273  	case fm == 0: // 0 * x = 0 (with sign adjusted)
   274  		return f ^ gs
   275  
   276  	case gm == 0: // x * 0 = 0 (with sign adjusted)
   277  		return g ^ fs
   278  	}
   279  
   280  	// 53-bit * 53-bit = 107- or 108-bit
   281  	lo, hi := mullu(fm, gm)
   282  	shift := mantbits64 - 1
   283  	trunc := lo & (1<<shift - 1)
   284  	mant := hi<<(64-shift) | lo>>shift
   285  	return fpack64(fs^gs, mant, fe+ge-1, trunc)
   286  }
   287  
   288  func fdiv64(f, g uint64) uint64 {
   289  	fs, fm, fe, fi, fn := funpack64(f)
   290  	gs, gm, ge, gi, gn := funpack64(g)
   291  
   292  	// Special cases.
   293  	switch {
   294  	case fn || gn: // NaN / g = f / NaN = NaN
   295  		return nan64
   296  
   297  	case fi && gi: // ±Inf / ±Inf = NaN
   298  		return nan64
   299  
   300  	case !fi && !gi && fm == 0 && gm == 0: // 0 / 0 = NaN
   301  		return nan64
   302  
   303  	case fi, !gi && gm == 0: // Inf / g = f / 0 = Inf
   304  		return fs ^ gs ^ inf64
   305  
   306  	case gi, fm == 0: // f / Inf = 0 / g = Inf
   307  		return fs ^ gs ^ 0
   308  	}
   309  	_, _, _, _ = fi, fn, gi, gn
   310  
   311  	// 53-bit<<54 / 53-bit = 53- or 54-bit.
   312  	shift := mantbits64 + 2
   313  	q, r := divlu(fm>>(64-shift), fm<<shift, gm)
   314  	return fpack64(fs^gs, q, fe-ge-2, r)
   315  }
   316  
   317  func f64to32(f uint64) uint32 {
   318  	fs, fm, fe, fi, fn := funpack64(f)
   319  	if fn {
   320  		return nan32
   321  	}
   322  	fs32 := uint32(fs >> 32)
   323  	if fi {
   324  		return fs32 ^ inf32
   325  	}
   326  	const d = mantbits64 - mantbits32 - 1
   327  	return fpack32(fs32, uint32(fm>>d), fe-1, uint32(fm&(1<<d-1)))
   328  }
   329  
   330  func f32to64(f uint32) uint64 {
   331  	const d = mantbits64 - mantbits32
   332  	fs, fm, fe, fi, fn := funpack32(f)
   333  	if fn {
   334  		return nan64
   335  	}
   336  	fs64 := uint64(fs) << 32
   337  	if fi {
   338  		return fs64 ^ inf64
   339  	}
   340  	return fpack64(fs64, uint64(fm)<<d, fe, 0)
   341  }
   342  
   343  func fcmp64(f, g uint64) (cmp int32, isnan bool) {
   344  	fs, fm, _, fi, fn := funpack64(f)
   345  	gs, gm, _, gi, gn := funpack64(g)
   346  
   347  	switch {
   348  	case fn, gn: // flag NaN
   349  		return 0, true
   350  
   351  	case !fi && !gi && fm == 0 && gm == 0: // ±0 == ±0
   352  		return 0, false
   353  
   354  	case fs > gs: // f < 0, g > 0
   355  		return -1, false
   356  
   357  	case fs < gs: // f > 0, g < 0
   358  		return +1, false
   359  
   360  	// Same sign, not NaN.
   361  	// Can compare encodings directly now.
   362  	// Reverse for sign.
   363  	case fs == 0 && f < g, fs != 0 && f > g:
   364  		return -1, false
   365  
   366  	case fs == 0 && f > g, fs != 0 && f < g:
   367  		return +1, false
   368  	}
   369  
   370  	// f == g
   371  	return 0, false
   372  }
   373  
   374  func f64toint(f uint64) (val int64, ok bool) {
   375  	fs, fm, fe, fi, fn := funpack64(f)
   376  
   377  	switch {
   378  	case fi, fn: // NaN
   379  		return 0, false
   380  
   381  	case fe < -1: // f < 0.5
   382  		return 0, false
   383  
   384  	case fe > 63: // f >= 2^63
   385  		if fs != 0 && fm == 0 { // f == -2^63
   386  			return -1 << 63, true
   387  		}
   388  		if fs != 0 {
   389  			return 0, false
   390  		}
   391  		return 0, false
   392  	}
   393  
   394  	for fe > int(mantbits64) {
   395  		fe--
   396  		fm <<= 1
   397  	}
   398  	for fe < int(mantbits64) {
   399  		fe++
   400  		fm >>= 1
   401  	}
   402  	val = int64(fm)
   403  	if fs != 0 {
   404  		val = -val
   405  	}
   406  	return val, true
   407  }
   408  
   409  func fintto64(val int64) (f uint64) {
   410  	fs := uint64(val) & (1 << 63)
   411  	mant := uint64(val)
   412  	if fs != 0 {
   413  		mant = -mant
   414  	}
   415  	return fpack64(fs, mant, int(mantbits64), 0)
   416  }
   417  
   418  // 64x64 -> 128 multiply.
   419  // adapted from hacker's delight.
   420  func mullu(u, v uint64) (lo, hi uint64) {
   421  	const (
   422  		s    = 32
   423  		mask = 1<<s - 1
   424  	)
   425  	u0 := u & mask
   426  	u1 := u >> s
   427  	v0 := v & mask
   428  	v1 := v >> s
   429  	w0 := u0 * v0
   430  	t := u1*v0 + w0>>s
   431  	w1 := t & mask
   432  	w2 := t >> s
   433  	w1 += u0 * v1
   434  	return u * v, u1*v1 + w2 + w1>>s
   435  }
   436  
   437  // 128/64 -> 64 quotient, 64 remainder.
   438  // adapted from hacker's delight
   439  func divlu(u1, u0, v uint64) (q, r uint64) {
   440  	const b = 1 << 32
   441  
   442  	if u1 >= v {
   443  		return 1<<64 - 1, 1<<64 - 1
   444  	}
   445  
   446  	// s = nlz(v); v <<= s
   447  	s := uint(0)
   448  	for v&(1<<63) == 0 {
   449  		s++
   450  		v <<= 1
   451  	}
   452  
   453  	vn1 := v >> 32
   454  	vn0 := v & (1<<32 - 1)
   455  	un32 := u1<<s | u0>>(64-s)
   456  	un10 := u0 << s
   457  	un1 := un10 >> 32
   458  	un0 := un10 & (1<<32 - 1)
   459  	q1 := un32 / vn1
   460  	rhat := un32 - q1*vn1
   461  
   462  again1:
   463  	if q1 >= b || q1*vn0 > b*rhat+un1 {
   464  		q1--
   465  		rhat += vn1
   466  		if rhat < b {
   467  			goto again1
   468  		}
   469  	}
   470  
   471  	un21 := un32*b + un1 - q1*v
   472  	q0 := un21 / vn1
   473  	rhat = un21 - q0*vn1
   474  
   475  again2:
   476  	if q0 >= b || q0*vn0 > b*rhat+un0 {
   477  		q0--
   478  		rhat += vn1
   479  		if rhat < b {
   480  			goto again2
   481  		}
   482  	}
   483  
   484  	return q1*b + q0, (un21*b + un0 - q0*v) >> s
   485  }
   486  
   487  func fadd32(x, y uint32) uint32 {
   488  	return f64to32(fadd64(f32to64(x), f32to64(y)))
   489  }
   490  
   491  func fmul32(x, y uint32) uint32 {
   492  	return f64to32(fmul64(f32to64(x), f32to64(y)))
   493  }
   494  
   495  func fdiv32(x, y uint32) uint32 {
   496  	return f64to32(fdiv64(f32to64(x), f32to64(y)))
   497  }
   498  
   499  func feq32(x, y uint32) bool {
   500  	cmp, nan := fcmp64(f32to64(x), f32to64(y))
   501  	return cmp == 0 && !nan
   502  }
   503  
   504  func fgt32(x, y uint32) bool {
   505  	cmp, nan := fcmp64(f32to64(x), f32to64(y))
   506  	return cmp >= 1 && !nan
   507  }
   508  
   509  func fge32(x, y uint32) bool {
   510  	cmp, nan := fcmp64(f32to64(x), f32to64(y))
   511  	return cmp >= 0 && !nan
   512  }
   513  
   514  func feq64(x, y uint64) bool {
   515  	cmp, nan := fcmp64(x, y)
   516  	return cmp == 0 && !nan
   517  }
   518  
   519  func fgt64(x, y uint64) bool {
   520  	cmp, nan := fcmp64(x, y)
   521  	return cmp >= 1 && !nan
   522  }
   523  
   524  func fge64(x, y uint64) bool {
   525  	cmp, nan := fcmp64(x, y)
   526  	return cmp >= 0 && !nan
   527  }
   528  
   529  func fint32to32(x int32) uint32 {
   530  	return f64to32(fintto64(int64(x)))
   531  }
   532  
   533  func fint32to64(x int32) uint64 {
   534  	return fintto64(int64(x))
   535  }
   536  
   537  func fint64to32(x int64) uint32 {
   538  	return f64to32(fintto64(x))
   539  }
   540  
   541  func fint64to64(x int64) uint64 {
   542  	return fintto64(x)
   543  }
   544  
   545  func f32toint32(x uint32) int32 {
   546  	val, _ := f64toint(f32to64(x))
   547  	return int32(val)
   548  }
   549  
   550  func f32toint64(x uint32) int64 {
   551  	val, _ := f64toint(f32to64(x))
   552  	return val
   553  }
   554  
   555  func f64toint32(x uint64) int32 {
   556  	val, _ := f64toint(x)
   557  	return int32(val)
   558  }
   559  
   560  func f64toint64(x uint64) int64 {
   561  	val, _ := f64toint(x)
   562  	return val
   563  }
   564  
   565  func f64touint64(x float64) uint64 {
   566  	if x < float64(1<<63) {
   567  		return uint64(int64(x))
   568  	}
   569  	y := x - float64(1<<63)
   570  	z := uint64(int64(y))
   571  	return z | (1 << 63)
   572  }
   573  
   574  func f32touint64(x float32) uint64 {
   575  	if x < float32(1<<63) {
   576  		return uint64(int64(x))
   577  	}
   578  	y := x - float32(1<<63)
   579  	z := uint64(int64(y))
   580  	return z | (1 << 63)
   581  }
   582  
   583  func fuint64to64(x uint64) float64 {
   584  	if int64(x) >= 0 {
   585  		return float64(int64(x))
   586  	}
   587  	// See ../cmd/compile/internal/gc/ssa.go:uint64Tofloat
   588  	y := x & 1
   589  	z := x >> 1
   590  	z = z | y
   591  	r := float64(int64(z))
   592  	return r + r
   593  }
   594  
   595  func fuint64to32(x uint64) float32 {
   596  	return float32(fuint64to64(x))
   597  }