github.com/xushiwei/go@v0.0.0-20130601165731-2b9d83f45bc9/src/pkg/runtime/softfloat_arm.c (about) 1 // Copyright 2009 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 // Software floating point interpretaton of ARM 7500 FP instructions. 6 // The interpretation is not bit compatible with the 7500. 7 // It uses true little-endian doubles, while the 7500 used mixed-endian. 8 9 #include "runtime.h" 10 11 #define CPSR 14 12 #define FLAGS_N (1U << 31) 13 #define FLAGS_Z (1U << 30) 14 #define FLAGS_C (1U << 29) 15 #define FLAGS_V (1U << 28) 16 17 void runtime·abort(void); 18 void math·sqrtC(uint64, uint64*); 19 20 static uint32 trace = 0; 21 22 static void 23 fabort(void) 24 { 25 if (1) { 26 runtime·printf("Unsupported floating point instruction\n"); 27 runtime·abort(); 28 } 29 } 30 31 static void 32 putf(uint32 reg, uint32 val) 33 { 34 m->freglo[reg] = val; 35 } 36 37 static void 38 putd(uint32 reg, uint64 val) 39 { 40 m->freglo[reg] = (uint32)val; 41 m->freghi[reg] = (uint32)(val>>32); 42 } 43 44 static uint64 45 getd(uint32 reg) 46 { 47 return (uint64)m->freglo[reg] | ((uint64)m->freghi[reg]<<32); 48 } 49 50 static void 51 fprint(void) 52 { 53 uint32 i; 54 for (i = 0; i < 16; i++) { 55 runtime·printf("\tf%d:\t%X %X\n", i, m->freghi[i], m->freglo[i]); 56 } 57 } 58 59 static uint32 60 d2f(uint64 d) 61 { 62 uint32 x; 63 64 runtime·f64to32c(d, &x); 65 return x; 66 } 67 68 static uint64 69 f2d(uint32 f) 70 { 71 uint64 x; 72 73 runtime·f32to64c(f, &x); 74 return x; 75 } 76 77 static uint32 78 fstatus(bool nan, int32 cmp) 79 { 80 if(nan) 81 return FLAGS_C | FLAGS_V; 82 if(cmp == 0) 83 return FLAGS_Z | FLAGS_C; 84 if(cmp < 0) 85 return FLAGS_N; 86 return FLAGS_C; 87 } 88 89 // conditions array record the required CPSR cond field for the 90 // first 5 pairs of conditional execution opcodes 91 // higher 4 bits are must set, lower 4 bits are must clear 92 static const uint8 conditions[10/2] = { 93 [0/2] = (FLAGS_Z >> 24) | 0, // 0: EQ (Z set), 1: NE (Z clear) 94 [2/2] = (FLAGS_C >> 24) | 0, // 2: CS/HS (C set), 3: CC/LO (C clear) 95 [4/2] = (FLAGS_N >> 24) | 0, // 4: MI (N set), 5: PL (N clear) 96 [6/2] = (FLAGS_V >> 24) | 0, // 6: VS (V set), 7: VC (V clear) 97 [8/2] = (FLAGS_C >> 24) | 98 (FLAGS_Z >> 28), // 8: HI (C set and Z clear), 9: LS (C clear and Z set) 99 }; 100 101 // returns number of words that the fp instruction 102 // is occupying, 0 if next instruction isn't float. 103 static uint32 104 stepflt(uint32 *pc, uint32 *regs) 105 { 106 uint32 i, opc, regd, regm, regn, cpsr; 107 int32 delta; 108 uint32 *addr; 109 uint64 uval; 110 int64 sval; 111 bool nan, ok; 112 int32 cmp; 113 114 i = *pc; 115 116 if(trace) 117 runtime·printf("stepflt %p %x (cpsr %x)\n", pc, i, regs[CPSR] >> 28); 118 119 opc = i >> 28; 120 if(opc == 14) // common case first 121 goto execute; 122 cpsr = regs[CPSR] >> 28; 123 switch(opc) { 124 case 0: case 1: case 2: case 3: case 4: 125 case 5: case 6: case 7: case 8: case 9: 126 if(((cpsr & (conditions[opc/2] >> 4)) == (conditions[opc/2] >> 4)) && 127 ((cpsr & (conditions[opc/2] & 0xf)) == 0)) { 128 if(opc & 1) return 1; 129 } else { 130 if(!(opc & 1)) return 1; 131 } 132 break; 133 case 10: // GE (N == V) 134 case 11: // LT (N != V) 135 if((cpsr & (FLAGS_N >> 28)) == (cpsr & (FLAGS_V >> 28))) { 136 if(opc & 1) return 1; 137 } else { 138 if(!(opc & 1)) return 1; 139 } 140 break; 141 case 12: // GT (N == V and Z == 0) 142 case 13: // LE (N != V or Z == 1) 143 if((cpsr & (FLAGS_N >> 28)) == (cpsr & (FLAGS_V >> 28)) && 144 (cpsr & (FLAGS_Z >> 28)) == 0) { 145 if(opc & 1) return 1; 146 } else { 147 if(!(opc & 1)) return 1; 148 } 149 break; 150 case 14: // AL 151 break; 152 case 15: // shouldn't happen 153 return 0; 154 } 155 if(trace) 156 runtime·printf("conditional %x (cpsr %x) pass\n", opc, cpsr); 157 i = (0xeU << 28) | (i & 0xfffffff); 158 159 execute: 160 // special cases 161 if((i&0xfffff000) == 0xe59fb000) { 162 // load r11 from pc-relative address. 163 // might be part of a floating point move 164 // (or might not, but no harm in simulating 165 // one instruction too many). 166 addr = (uint32*)((uint8*)pc + (i&0xfff) + 8); 167 regs[11] = addr[0]; 168 169 if(trace) 170 runtime·printf("*** cpu R[%d] = *(%p) %x\n", 171 11, addr, regs[11]); 172 return 1; 173 } 174 if(i == 0xe08bb00d) { 175 // add sp to r11. 176 // might be part of a large stack offset address 177 // (or might not, but again no harm done). 178 regs[11] += regs[13]; 179 180 if(trace) 181 runtime·printf("*** cpu R[%d] += R[%d] %x\n", 182 11, 13, regs[11]); 183 return 1; 184 } 185 if(i == 0xeef1fa10) { 186 regs[CPSR] = (regs[CPSR]&0x0fffffff) | m->fflag; 187 188 if(trace) 189 runtime·printf("*** fpsr R[CPSR] = F[CPSR] %x\n", regs[CPSR]); 190 return 1; 191 } 192 if((i&0xff000000) == 0xea000000) { 193 // unconditional branch 194 // can happen in the middle of floating point 195 // if the linker decides it is time to lay down 196 // a sequence of instruction stream constants. 197 delta = i&0xffffff; 198 delta = (delta<<8) >> 8; // sign extend 199 200 if(trace) 201 runtime·printf("*** cpu PC += %x\n", (delta+2)*4); 202 return delta+2; 203 } 204 205 goto stage1; 206 207 stage1: // load/store regn is cpureg, regm is 8bit offset 208 regd = i>>12 & 0xf; 209 regn = i>>16 & 0xf; 210 regm = (i & 0xff) << 2; // PLUS or MINUS ?? 211 212 switch(i & 0xfff00f00) { 213 default: 214 goto stage2; 215 216 case 0xed900a00: // single load 217 addr = (uint32*)(regs[regn] + regm); 218 m->freglo[regd] = addr[0]; 219 220 if(trace) 221 runtime·printf("*** load F[%d] = %x\n", 222 regd, m->freglo[regd]); 223 break; 224 225 case 0xed900b00: // double load 226 addr = (uint32*)(regs[regn] + regm); 227 m->freglo[regd] = addr[0]; 228 m->freghi[regd] = addr[1]; 229 230 if(trace) 231 runtime·printf("*** load D[%d] = %x-%x\n", 232 regd, m->freghi[regd], m->freglo[regd]); 233 break; 234 235 case 0xed800a00: // single store 236 addr = (uint32*)(regs[regn] + regm); 237 addr[0] = m->freglo[regd]; 238 239 if(trace) 240 runtime·printf("*** *(%p) = %x\n", 241 addr, addr[0]); 242 break; 243 244 case 0xed800b00: // double store 245 addr = (uint32*)(regs[regn] + regm); 246 addr[0] = m->freglo[regd]; 247 addr[1] = m->freghi[regd]; 248 249 if(trace) 250 runtime·printf("*** *(%p) = %x-%x\n", 251 addr, addr[1], addr[0]); 252 break; 253 } 254 return 1; 255 256 stage2: // regd, regm, regn are 4bit variables 257 regm = i>>0 & 0xf; 258 switch(i & 0xfff00ff0) { 259 default: 260 goto stage3; 261 262 case 0xf3000110: // veor 263 m->freglo[regd] = m->freglo[regm]^m->freglo[regn]; 264 m->freghi[regd] = m->freghi[regm]^m->freghi[regn]; 265 266 if(trace) 267 runtime·printf("*** veor D[%d] = %x-%x\n", 268 regd, m->freghi[regd], m->freglo[regd]); 269 break; 270 271 case 0xeeb00b00: // D[regd] = const(regn,regm) 272 regn = (regn<<4) | regm; 273 regm = 0x40000000UL; 274 if(regn & 0x80) 275 regm |= 0x80000000UL; 276 if(regn & 0x40) 277 regm ^= 0x7fc00000UL; 278 regm |= (regn & 0x3f) << 16; 279 m->freglo[regd] = 0; 280 m->freghi[regd] = regm; 281 282 if(trace) 283 runtime·printf("*** immed D[%d] = %x-%x\n", 284 regd, m->freghi[regd], m->freglo[regd]); 285 break; 286 287 case 0xeeb00a00: // F[regd] = const(regn,regm) 288 regn = (regn<<4) | regm; 289 regm = 0x40000000UL; 290 if(regn & 0x80) 291 regm |= 0x80000000UL; 292 if(regn & 0x40) 293 regm ^= 0x7e000000UL; 294 regm |= (regn & 0x3f) << 19; 295 m->freglo[regd] = regm; 296 297 if(trace) 298 runtime·printf("*** immed D[%d] = %x\n", 299 regd, m->freglo[regd]); 300 break; 301 302 case 0xee300b00: // D[regd] = D[regn]+D[regm] 303 runtime·fadd64c(getd(regn), getd(regm), &uval); 304 putd(regd, uval); 305 306 if(trace) 307 runtime·printf("*** add D[%d] = D[%d]+D[%d] %x-%x\n", 308 regd, regn, regm, m->freghi[regd], m->freglo[regd]); 309 break; 310 311 case 0xee300a00: // F[regd] = F[regn]+F[regm] 312 runtime·fadd64c(f2d(m->freglo[regn]), f2d(m->freglo[regm]), &uval); 313 m->freglo[regd] = d2f(uval); 314 315 if(trace) 316 runtime·printf("*** add F[%d] = F[%d]+F[%d] %x\n", 317 regd, regn, regm, m->freglo[regd]); 318 break; 319 320 case 0xee300b40: // D[regd] = D[regn]-D[regm] 321 runtime·fsub64c(getd(regn), getd(regm), &uval); 322 putd(regd, uval); 323 324 if(trace) 325 runtime·printf("*** sub D[%d] = D[%d]-D[%d] %x-%x\n", 326 regd, regn, regm, m->freghi[regd], m->freglo[regd]); 327 break; 328 329 case 0xee300a40: // F[regd] = F[regn]-F[regm] 330 runtime·fsub64c(f2d(m->freglo[regn]), f2d(m->freglo[regm]), &uval); 331 m->freglo[regd] = d2f(uval); 332 333 if(trace) 334 runtime·printf("*** sub F[%d] = F[%d]-F[%d] %x\n", 335 regd, regn, regm, m->freglo[regd]); 336 break; 337 338 case 0xee200b00: // D[regd] = D[regn]*D[regm] 339 runtime·fmul64c(getd(regn), getd(regm), &uval); 340 putd(regd, uval); 341 342 if(trace) 343 runtime·printf("*** mul D[%d] = D[%d]*D[%d] %x-%x\n", 344 regd, regn, regm, m->freghi[regd], m->freglo[regd]); 345 break; 346 347 case 0xee200a00: // F[regd] = F[regn]*F[regm] 348 runtime·fmul64c(f2d(m->freglo[regn]), f2d(m->freglo[regm]), &uval); 349 m->freglo[regd] = d2f(uval); 350 351 if(trace) 352 runtime·printf("*** mul F[%d] = F[%d]*F[%d] %x\n", 353 regd, regn, regm, m->freglo[regd]); 354 break; 355 356 case 0xee800b00: // D[regd] = D[regn]/D[regm] 357 runtime·fdiv64c(getd(regn), getd(regm), &uval); 358 putd(regd, uval); 359 360 if(trace) 361 runtime·printf("*** div D[%d] = D[%d]/D[%d] %x-%x\n", 362 regd, regn, regm, m->freghi[regd], m->freglo[regd]); 363 break; 364 365 case 0xee800a00: // F[regd] = F[regn]/F[regm] 366 runtime·fdiv64c(f2d(m->freglo[regn]), f2d(m->freglo[regm]), &uval); 367 m->freglo[regd] = d2f(uval); 368 369 if(trace) 370 runtime·printf("*** div F[%d] = F[%d]/F[%d] %x\n", 371 regd, regn, regm, m->freglo[regd]); 372 break; 373 374 case 0xee000b10: // S[regn] = R[regd] (MOVW) (regm ignored) 375 m->freglo[regn] = regs[regd]; 376 377 if(trace) 378 runtime·printf("*** cpy S[%d] = R[%d] %x\n", 379 regn, regd, m->freglo[regn]); 380 break; 381 382 case 0xee100b10: // R[regd] = S[regn] (MOVW) (regm ignored) 383 regs[regd] = m->freglo[regn]; 384 385 if(trace) 386 runtime·printf("*** cpy R[%d] = S[%d] %x\n", 387 regd, regn, regs[regd]); 388 break; 389 } 390 return 1; 391 392 stage3: // regd, regm are 4bit variables 393 switch(i & 0xffff0ff0) { 394 default: 395 goto done; 396 397 case 0xeeb00a40: // F[regd] = F[regm] (MOVF) 398 m->freglo[regd] = m->freglo[regm]; 399 400 if(trace) 401 runtime·printf("*** F[%d] = F[%d] %x\n", 402 regd, regm, m->freglo[regd]); 403 break; 404 405 case 0xeeb00b40: // D[regd] = D[regm] (MOVD) 406 m->freglo[regd] = m->freglo[regm]; 407 m->freghi[regd] = m->freghi[regm]; 408 409 if(trace) 410 runtime·printf("*** D[%d] = D[%d] %x-%x\n", 411 regd, regm, m->freghi[regd], m->freglo[regd]); 412 break; 413 414 case 0xeeb10bc0: // D[regd] = sqrt D[regm] 415 math·sqrtC(getd(regm), &uval); 416 putd(regd, uval); 417 418 if(trace) 419 runtime·printf("*** D[%d] = sqrt D[%d] %x-%x\n", 420 regd, regm, m->freghi[regd], m->freglo[regd]); 421 break; 422 423 case 0xeeb00bc0: // D[regd] = abs D[regm] 424 m->freglo[regd] = m->freglo[regm]; 425 m->freghi[regd] = m->freghi[regm] & ((1<<31)-1); 426 427 if(trace) 428 runtime·printf("*** D[%d] = abs D[%d] %x-%x\n", 429 regd, regm, m->freghi[regd], m->freglo[regd]); 430 break; 431 432 case 0xeeb00ac0: // F[regd] = abs F[regm] 433 m->freglo[regd] = m->freglo[regm] & ((1<<31)-1); 434 435 if(trace) 436 runtime·printf("*** F[%d] = abs F[%d] %x\n", 437 regd, regm, m->freglo[regd]); 438 break; 439 440 case 0xeeb40bc0: // D[regd] :: D[regm] (CMPD) 441 runtime·fcmp64c(getd(regd), getd(regm), &cmp, &nan); 442 m->fflag = fstatus(nan, cmp); 443 444 if(trace) 445 runtime·printf("*** cmp D[%d]::D[%d] %x\n", 446 regd, regm, m->fflag); 447 break; 448 449 case 0xeeb40ac0: // F[regd] :: F[regm] (CMPF) 450 runtime·fcmp64c(f2d(m->freglo[regd]), f2d(m->freglo[regm]), &cmp, &nan); 451 m->fflag = fstatus(nan, cmp); 452 453 if(trace) 454 runtime·printf("*** cmp F[%d]::F[%d] %x\n", 455 regd, regm, m->fflag); 456 break; 457 458 case 0xeeb70ac0: // D[regd] = F[regm] (MOVFD) 459 putd(regd, f2d(m->freglo[regm])); 460 461 if(trace) 462 runtime·printf("*** f2d D[%d]=F[%d] %x-%x\n", 463 regd, regm, m->freghi[regd], m->freglo[regd]); 464 break; 465 466 case 0xeeb70bc0: // F[regd] = D[regm] (MOVDF) 467 m->freglo[regd] = d2f(getd(regm)); 468 469 if(trace) 470 runtime·printf("*** d2f F[%d]=D[%d] %x-%x\n", 471 regd, regm, m->freghi[regd], m->freglo[regd]); 472 break; 473 474 case 0xeebd0ac0: // S[regd] = F[regm] (MOVFW) 475 runtime·f64tointc(f2d(m->freglo[regm]), &sval, &ok); 476 if(!ok || (int32)sval != sval) 477 sval = 0; 478 m->freglo[regd] = sval; 479 480 if(trace) 481 runtime·printf("*** fix S[%d]=F[%d] %x\n", 482 regd, regm, m->freglo[regd]); 483 break; 484 485 case 0xeebc0ac0: // S[regd] = F[regm] (MOVFW.U) 486 runtime·f64tointc(f2d(m->freglo[regm]), &sval, &ok); 487 if(!ok || (uint32)sval != sval) 488 sval = 0; 489 m->freglo[regd] = sval; 490 491 if(trace) 492 runtime·printf("*** fix unsigned S[%d]=F[%d] %x\n", 493 regd, regm, m->freglo[regd]); 494 break; 495 496 case 0xeebd0bc0: // S[regd] = D[regm] (MOVDW) 497 runtime·f64tointc(getd(regm), &sval, &ok); 498 if(!ok || (int32)sval != sval) 499 sval = 0; 500 m->freglo[regd] = sval; 501 502 if(trace) 503 runtime·printf("*** fix S[%d]=D[%d] %x\n", 504 regd, regm, m->freglo[regd]); 505 break; 506 507 case 0xeebc0bc0: // S[regd] = D[regm] (MOVDW.U) 508 runtime·f64tointc(getd(regm), &sval, &ok); 509 if(!ok || (uint32)sval != sval) 510 sval = 0; 511 m->freglo[regd] = sval; 512 513 if(trace) 514 runtime·printf("*** fix unsigned S[%d]=D[%d] %x\n", 515 regd, regm, m->freglo[regd]); 516 break; 517 518 case 0xeeb80ac0: // D[regd] = S[regm] (MOVWF) 519 cmp = m->freglo[regm]; 520 if(cmp < 0) { 521 runtime·fintto64c(-cmp, &uval); 522 putf(regd, d2f(uval)); 523 m->freglo[regd] ^= 0x80000000; 524 } else { 525 runtime·fintto64c(cmp, &uval); 526 putf(regd, d2f(uval)); 527 } 528 529 if(trace) 530 runtime·printf("*** float D[%d]=S[%d] %x-%x\n", 531 regd, regm, m->freghi[regd], m->freglo[regd]); 532 break; 533 534 case 0xeeb80a40: // D[regd] = S[regm] (MOVWF.U) 535 runtime·fintto64c(m->freglo[regm], &uval); 536 putf(regd, d2f(uval)); 537 538 if(trace) 539 runtime·printf("*** float unsigned D[%d]=S[%d] %x-%x\n", 540 regd, regm, m->freghi[regd], m->freglo[regd]); 541 break; 542 543 case 0xeeb80bc0: // D[regd] = S[regm] (MOVWD) 544 cmp = m->freglo[regm]; 545 if(cmp < 0) { 546 runtime·fintto64c(-cmp, &uval); 547 putd(regd, uval); 548 m->freghi[regd] ^= 0x80000000; 549 } else { 550 runtime·fintto64c(cmp, &uval); 551 putd(regd, uval); 552 } 553 554 if(trace) 555 runtime·printf("*** float D[%d]=S[%d] %x-%x\n", 556 regd, regm, m->freghi[regd], m->freglo[regd]); 557 break; 558 559 case 0xeeb80b40: // D[regd] = S[regm] (MOVWD.U) 560 runtime·fintto64c(m->freglo[regm], &uval); 561 putd(regd, uval); 562 563 if(trace) 564 runtime·printf("*** float unsigned D[%d]=S[%d] %x-%x\n", 565 regd, regm, m->freghi[regd], m->freglo[regd]); 566 break; 567 } 568 return 1; 569 570 done: 571 if((i&0xff000000) == 0xee000000 || 572 (i&0xff000000) == 0xed000000) { 573 runtime·printf("stepflt %p %x\n", pc, i); 574 fabort(); 575 } 576 return 0; 577 } 578 579 #pragma textflag 7 580 uint32* 581 runtime·_sfloat2(uint32 *lr, uint32 r0) 582 { 583 uint32 skip; 584 585 skip = stepflt(lr, &r0); 586 if(skip == 0) { 587 runtime·printf("sfloat2 %p %x\n", lr, *lr); 588 fabort(); // not ok to fail first instruction 589 } 590 591 lr += skip; 592 while(skip = stepflt(lr, &r0)) 593 lr += skip; 594 return lr; 595 }