1 | 2 | do_func.sa 3.4 2/18/91 3 | 4 | Do_func performs the unimplemented operation. The operation 5 | to be performed is determined from the lower 7 bits of the 6 | extension word (except in the case of fmovecr and fsincos). 7 | The opcode and tag bits form an index into a jump table in 8 | tbldo.sa. Cases of zero, infinity and NaN are handled in 9 | do_func by forcing the default result. Normalized and 10 | denormalized (there are no unnormalized numbers at this 11 | point) are passed onto the emulation code. 12 | 13 | CMDREG1B and STAG are extracted from the fsave frame 14 | and combined to form the table index. The function called 15 | will start with a0 pointing to the ETEMP operand. Dyadic 16 | functions can find FPTEMP at -12(a0). 17 | 18 | Called functions return their result in fp0. Sincos returns 19 | sin(x) in fp0 and cos(x) in fp1. 20 | 21 22 | Copyright (C) Motorola, Inc. 1990 23 | All Rights Reserved 24 | 25 | THIS IS UNPUBLISHED PROPRIETARY SOURCE CODE OF MOTOROLA 26 | The copyright notice above does not evidence any 27 | actual or intended publication of such source code. 
DO_FUNC:	|idnt	2,1 | Motorola 040 Floating Point Software Package

	|section	8

	.include "fpsp.h"

| Symbols this file expects from other modules.  The xref lines are
| comments; they are kept as a cross-reference list only.
	|xref	t_dz2
	|xref	t_operr
	|xref	t_inx2
	|xref	t_resdnrm
	|xref	dst_nan
	|xref	src_nan
	|xref	nrm_set
	|xref	sto_cos

	|xref	tblpre
	|xref	slognp1,slogn,slog10,slog2
	|xref	slognd,slog10d,slog2d
	|xref	smod,srem
	|xref	sscale
	|xref	smovcr

| Extended-precision operands, three longwords each, that the
| routines in this file load as forced results.
PONE:	.long	0x3fff0000,0x80000000,0x00000000	|+1
MONE:	.long	0xbfff0000,0x80000000,0x00000000	|-1
PZERO:	.long	0x00000000,0x00000000,0x00000000	|+0
MZERO:	.long	0x80000000,0x00000000,0x00000000	|-0
PINF:	.long	0x7fff0000,0x00000000,0x00000000	|+inf
MINF:	.long	0xffff0000,0x00000000,0x00000000	|-inf
QNAN:	.long	0x7fff0000,0xffffffff,0xffffffff	|non-signaling nan
PPIBY2:	.long	0x3FFF0000,0xC90FDAA2,0x2168C235	|+PI/2
MPIBY2:	.long	0xbFFF0000,0xC90FDAA2,0x2168C235	|-PI/2

|
| do_func -- dispatch one unimplemented FP instruction
|
| Reads the a6-relative fields CMDREG1B, STAG and USER_FPCR and
| clears CU_ONLY.  Leaves through one of:
|	smovcr		top 6 bits of CMDREG1B are $17 (fmovecr)
|	serror		7-bit extension field is >= $38
|	tblpre entry	index = extension * 8 + STAG, entered with
|			  a0   = address of ETEMP
|			  d1   = low byte of USER_FPCR
|			  fpcr = 0
|
	.global	do_func
do_func:
	clrb	CU_ONLY(%a6)
|
| fmovecr is not laid out like the other unimplemented general
| instructions, so it is picked out first by looking at the upper
| 6 bits of the command word.
|
	bfextu	CMDREG1B(%a6){#0:#6},%d0	|d0 = opclass and src fields
	cmpil	#0x17,%d0		|$17 identifies FMOVECR
	bnes	not_fmovecr		|anything else takes the table path
	jmp	smovcr			|FMOVECR goes straight to its emulation

not_fmovecr:
	movew	CMDREG1B(%a6),%d0
	andl	#0x7F,%d0		|keep the 7-bit extension field
	cmpil	#0x38,%d0		|extensions from $38 up ...
	bges	serror			|... are illegal
	bfextu	STAG(%a6){#0:#3},%d1	|d1 = 3-bit source tag
	lsll	#3,%d0			|extension * 8 leaves room for the tag
	addl	%d1,%d0			|d0 = final table index
	leal	tblpre,%a1		|a1 = base of the jump table
	movel	(%a1,%d0.w*4),%a1	|a1 = longword entry = target address
	leal	ETEMP(%a6),%a0		|a0 = pointer to the source operand
	movel	USER_FPCR(%a6),%d1
	andl	#0xFF,%d1		|d1 = rounding mode/precision only
	fmovel	#0,%fpcr
	jmp	(%a1)
|
| serror -- illegal extension: set the STORE_FLG byte and return
|
	.global	serror
serror:
	st	STORE_FLG(%a6)
	rts
|
| Forced-result loaders.  Each one tests the sign bit of the operand
| at a0 and hands off to the matching ld_* routine.  They are called
| by index into tbldo.
|
| snzrinx: zero with the sign of the source, then inex2/ainex via
| t_inx2.  The loader is reached with bsr so that control comes back
| here before t_inx2 is entered.
|
	.global	snzrinx
snzrinx:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bnes	ld_mzinx		|negative: use -0
	bsr	ld_pzero		|load +0 and come back
	bra	t_inx2			|then flag inexact
ld_mzinx:
	bsr	ld_mzero		|load -0 and come back
	bra	t_inx2			|then flag inexact
|
| szero: zero with the sign of the source; inex2/ainex untouched
|
	.global	szero
szero:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_mzero		|negative: -0
	bra	ld_pzero		|otherwise +0
|
| sinf: infinity with the sign of the source; inex2/ainex untouched
|
	.global	sinf
sinf:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_minf			|negative: -inf
	bra	ld_pinf			|otherwise +inf
|
| sone: one with the sign of the source; inex2/ainex untouched
|
	.global	sone
sone:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_mone			|negative: -1
	bra	ld_pone			|otherwise +1
|
| Load a
| signed pi/2 to fp0.  The sign follows the source operand.  Both
| ld_mpi2 and ld_ppi2 leave through t_inx2 (commented there as
| setting the inex2 exception).
|
	.global	spi_2
spi_2:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_mpi2			|negative: -pi/2
	bra	ld_ppi2			|otherwise +pi/2
|
| szr_inf: negative source gives +0, any other source gives +inf
|
	.global	szr_inf
szr_inf:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_pzero		|negative: +0
	bra	ld_pinf			|otherwise +inf
|
| sopr_inf: negative source goes to t_operr, any other source
| gives +inf
| [Used by slogn, slognp1, slog10, and slog2]
|
	.global	sopr_inf
sopr_inf:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	t_operr			|negative: operand error
	bra	ld_pinf			|otherwise +inf
|
|	FLOGNP1
|
| The source is compared with -1:
|	greater	-> slognp1
|	equal	-> t_dz2
|	other	-> FPSR cleared, then t_operr
|
	.global	sslognp1
sslognp1:
	fmovemx	(%a0),%fp0-%fp0		|fp0 = source operand
	fcmpb	#-1,%fp0
	fbgt	slognp1			|x > -1: run the emulation
	fbeq	t_dz2			|x = -1: divide by zero exception
	fmovel	#0,%FPSR		|clear the N flag left by the compare
	bra	t_operr			|x < -1: operand error
|
|	FETOXM1
|
| setoxm1i: negative source gives -1, any other source gives +inf
|
	.global	setoxm1i
setoxm1i:
	btstb	#sign_bit,LOCAL_EX(%a0)	|sign of the source operand
	bne	ld_mone			|negative: -1
	bra	ld_pinf			|otherwise +inf
|
|	FLOGN
|
| Test for 1.0 as an input argument, returning +zero.  Also check
| the sign and return operr if negative.
|
| sslogn: a set sign bit goes to t_operr.  A source that is exactly
| +1.0 (exponent word $3fff, high mantissa $80000000, low mantissa 0)
| returns +0 in fp0.  Every other source goes on to slogn.
|
	.global	sslogn
sslogn:
	btstb	#sign_bit,LOCAL_EX(%a0)
	bne	t_operr			|take care of operands < 0
	cmpiw	#0x3fff,LOCAL_EX(%a0)	|test for 1.0 input
	bne	slogn
	cmpil	#0x80000000,LOCAL_HI(%a0)
	bne	slogn
	tstl	LOCAL_LO(%a0)
	bne	slogn
	fmovex	PZERO,%fp0		|log(1) = +0
	rts

| sslognd: sign bit clear goes to slognd, sign bit set to t_operr
	.global	sslognd
sslognd:
	btstb	#sign_bit,LOCAL_EX(%a0)
	beq	slognd
	bra	t_operr			|take care of operands < 0

|
|	FLOG10
|
| sslog10: same screening as sslogn, continuing in slog10.
|
	.global	sslog10
sslog10:
	btstb	#sign_bit,LOCAL_EX(%a0)
	bne	t_operr			|take care of operands < 0
	cmpiw	#0x3fff,LOCAL_EX(%a0)	|test for 1.0 input
	bne	slog10
	cmpil	#0x80000000,LOCAL_HI(%a0)
	bne	slog10
	tstl	LOCAL_LO(%a0)
	bne	slog10
	fmovex	PZERO,%fp0		|log10(1) = +0
	rts

| sslog10d: sign bit clear goes to slog10d, sign bit set to t_operr
	.global	sslog10d
sslog10d:
	btstb	#sign_bit,LOCAL_EX(%a0)
	beq	slog10d
	bra	t_operr			|take care of operands < 0

|
|	FLOG2
|
| sslog2: same screening as sslogn, continuing in slog2.
|
	.global	sslog2
sslog2:
	btstb	#sign_bit,LOCAL_EX(%a0)
	bne	t_operr			|take care of operands < 0
	cmpiw	#0x3fff,LOCAL_EX(%a0)	|test for 1.0 input
	bne	slog2
	cmpil	#0x80000000,LOCAL_HI(%a0)
	bne	slog2
	tstl	LOCAL_LO(%a0)
	bne	slog2
	fmovex	PZERO,%fp0		|log2(1) = +0
	rts

| sslog2d: sign bit clear goes to slog2d, sign bit set to t_operr
	.global	sslog2d
sslog2d:
	btstb	#sign_bit,LOCAL_EX(%a0)
	beq	slog2d
	bra	t_operr			|take care of operands < 0

|
|	FMOD
|
| pmodt is indexed by (dtag << 2) | stag, two bits per tag, one
| longword per entry.  The order of the entries is the encoding.
|
pmodt:
|				;$21 fmod
|				;dtag,stag
	.long	smod		|  00,00  norm,norm = normal
	.long	smod_oper	|  00,01  norm,zero = nan with operr
	.long	smod_fpn	|  00,10  norm,inf  = fpn
	.long	smod_snan	|  00,11  norm,nan  = nan
	.long	smod_zro	|  01,00  zero,norm = +-zero
	.long	smod_oper	|  01,01  zero,zero = nan with operr
	.long	smod_zro	|  01,10  zero,inf  = +-zero
	.long	smod_snan	|  01,11  zero,nan  = nan
	.long	smod_oper	|  10,00  inf,norm  = nan with operr
	.long	smod_oper	|  10,01  inf,zero  = nan with operr
	.long	smod_oper	|  10,10  inf,inf   = nan with operr
	.long	smod_snan	|  10,11  inf,nan   = nan
	.long	smod_dnan	|  11,00  nan,norm  = nan
	.long	smod_dnan	|  11,01  nan,zero  = nan
	.long	smod_dnan	|  11,10  nan,inf   = nan
	.long	smod_dnan	|  11,11  nan,nan   = nan

|
| pmod: clear the quotient byte, build the 4-bit tag index and jump
| through pmodt.
|
	.global	pmod
pmod:
	clrb	FPSR_QBYTE(%a6)		|clear quotient field
	bfextu	STAG(%a6){#0:#3},%d0	|stag = d0
	bfextu	DTAG(%a6){#0:#3},%d1	|dtag = d1

|
| Alias extended denorms to norms for the jump table.
|
	bclrl	#2,%d0
	bclrl	#2,%d1

	lslb	#2,%d1
	orb	%d0,%d1		|d1{3:2} = dtag, d1{1:0} = stag
|				;Tag values:
|				;00 = norm or denorm
|				;01 = zero
|				;10 = inf
|				;11 = nan
	lea	pmodt,%a1
	movel	(%a1,%d1.w*4),%a1
	jmp	(%a1)

smod_snan:
	bra	src_nan
smod_dnan:
	bra	dst_nan
smod_oper:
	bra	t_operr
|
| smod_zro: set the quotient sign bit when the source and destination
| signs differ, then return a zero carrying the destination's sign.
|
smod_zro:
	moveb	ETEMP(%a6),%d1		|get sign of src op
	moveb	FPTEMP(%a6),%d0		|get sign of dst op
	eorb	%d0,%d1			|get exor of sign bits
	btstl	#7,%d1			|test for sign
	beqs	smod_zsn		|if clr, do not set sign bit
	bsetb	#q_sn_bit,FPSR_QBYTE(%a6) |set q-byte sign bit
smod_zsn:
	btstl	#7,%d0			|test if + or -
	beq	ld_pzero		|if pos then load +0
	bra	ld_mzero		|else neg load -0

|
| smod_fpn: set the quotient sign bit as above, then return the
| destination operand.  When the top bit of the DTAG byte is set the
| destination is handed to t_resdnrm with a0 pointing at FPTEMP.
|
smod_fpn:
	moveb	ETEMP(%a6),%d1		|get sign of src op
	moveb	FPTEMP(%a6),%d0		|get sign of dst op
	eorb	%d0,%d1			|get exor of sign bits
	btstl	#7,%d1			|test for sign
	beqs	smod_fsn		|if clr, do not set sign bit
	bsetb	#q_sn_bit,FPSR_QBYTE(%a6) |set q-byte sign bit
smod_fsn:
	tstb	DTAG(%a6)		|filter out denormal destination case
	bpls	smod_nrm		|
	leal	FPTEMP(%a6),%a0		|a0<- addr(FPTEMP)
	bra	t_resdnrm		|force UNFL(but exact) result
smod_nrm:
	fmovel	USER_FPCR(%a6),%fpcr	|use user's rmode and precision
	fmovex	FPTEMP(%a6),%fp0	|return dest to fp0
	rts

|
|	FREM
|
| premt has the same layout as pmodt: index (dtag << 2) | stag.
|
premt:
|				;$25 frem
|				;dtag,stag
	.long	srem		|  00,00  norm,norm = normal
	.long	srem_oper	|  00,01  norm,zero = nan with operr
	.long	srem_fpn	|  00,10  norm,inf  = fpn
	.long	srem_snan	|  00,11  norm,nan  = nan
	.long	srem_zro	|  01,00  zero,norm = +-zero
	.long	srem_oper	|  01,01  zero,zero = nan with operr
	.long	srem_zro	|  01,10  zero,inf  = +-zero
	.long	srem_snan	|  01,11  zero,nan  = nan
	.long	srem_oper	|  10,00  inf,norm  = nan with operr
	.long	srem_oper	|  10,01  inf,zero  = nan with operr
	.long	srem_oper	|  10,10  inf,inf   = nan with operr
	.long	srem_snan	|  10,11  inf,nan   = nan
	.long	srem_dnan	|  11,00  nan,norm  = nan
	.long	srem_dnan	|  11,01  nan,zero  = nan
	.long	srem_dnan	|  11,10  nan,inf   = nan
	.long	srem_dnan	|  11,11  nan,nan   = nan

|
| prem: clear the quotient byte, build the 4-bit tag index and jump
| through premt.
|
	.global	prem
prem:
	clrb	FPSR_QBYTE(%a6)		|clear quotient field
	bfextu	STAG(%a6){#0:#3},%d0	|stag = d0
	bfextu	DTAG(%a6){#0:#3},%d1	|dtag = d1
|
| Alias extended denorms to norms for the jump table.
| (bclrl is spelled with its size suffix, as in pmod and pscale.)
|
	bclrl	#2,%d0
	bclrl	#2,%d1

	lslb	#2,%d1
	orb	%d0,%d1		|d1{3:2} = dtag, d1{1:0} = stag
|				;Tag values:
|				;00 = norm or denorm
|				;01 = zero
|				;10 = inf
|				;11 = nan
	lea	premt,%a1
	movel	(%a1,%d1.w*4),%a1
	jmp	(%a1)

srem_snan:
	bra	src_nan
srem_dnan:
	bra	dst_nan
srem_oper:
	bra	t_operr
|
| srem_zro: set the quotient sign bit when the source and destination
| signs differ, then return a zero carrying the destination's sign.
|
srem_zro:
	moveb	ETEMP(%a6),%d1		|get sign of src op
	moveb	FPTEMP(%a6),%d0		|get sign of dst op
	eorb	%d0,%d1			|get exor of sign bits
	btstl	#7,%d1			|test for sign
	beqs	srem_zsn		|if clr, do not set sign bit
	bsetb	#q_sn_bit,FPSR_QBYTE(%a6) |set q-byte sign bit
srem_zsn:
	btstl	#7,%d0			|test if + or -
	beq	ld_pzero		|if pos then load +0
	bra	ld_mzero		|else neg load -0

|
| srem_fpn: set the quotient sign bit as above, then return the
| destination operand.  When the top bit of the DTAG byte is set the
| destination is handed to t_resdnrm with a0 pointing at FPTEMP.
|
srem_fpn:
	moveb	ETEMP(%a6),%d1		|get sign of src op
	moveb	FPTEMP(%a6),%d0		|get sign of dst op
	eorb	%d0,%d1			|get exor of sign bits
	btstl	#7,%d1			|test for sign
	beqs	srem_fsn		|if clr, do not set sign bit
	bsetb	#q_sn_bit,FPSR_QBYTE(%a6) |set q-byte sign bit
srem_fsn:
	tstb	DTAG(%a6)		|filter out denormal destination case
	bpls	srem_nrm		|
	leal	FPTEMP(%a6),%a0		|a0<- addr(FPTEMP)
	bra	t_resdnrm		|force UNFL(but exact) result
srem_nrm:
	fmovel	USER_FPCR(%a6),%fpcr	|use user's rmode and precision
	fmovex	FPTEMP(%a6),%fp0	|return dest to fp0
	rts
|
|	FSCALE
|
| pscalet has the same layout as pmodt: index (dtag << 2) | stag.
|
pscalet:
|				;$26 fscale
|				;dtag,stag
	.long	sscale		|  00,00  norm,norm = result
	.long	sscale		|  00,01  norm,zero = fpn
	.long	scl_opr		|  00,10  norm,inf  = nan with operr
	.long	scl_snan	|  00,11  norm,nan  = nan
	.long	scl_zro		|  01,00  zero,norm = +-zero
	.long	scl_zro		|  01,01  zero,zero = +-zero
	.long	scl_opr		|  01,10  zero,inf  = nan with operr
	.long	scl_snan	|  01,11  zero,nan  = nan
	.long	scl_inf		|  10,00  inf,norm  = +-inf
	.long	scl_inf		|  10,01  inf,zero  = +-inf
	.long	scl_opr		|  10,10  inf,inf   = nan with operr
	.long	scl_snan	|  10,11  inf,nan   = nan
	.long	scl_dnan	|  11,00  nan,norm  = nan
	.long	scl_dnan	|  11,01  nan,zero  = nan
	.long	scl_dnan	|  11,10  nan,inf   = nan
	.long	scl_dnan	|  11,11  nan,nan   = nan

|
| pscale: build the 4-bit tag index and jump through pscalet.
|
	.global	pscale
pscale:
	bfextu	STAG(%a6){#0:#3},%d0	|stag in d0
	bfextu	DTAG(%a6){#0:#3},%d1	|dtag in d1
	bclrl	#2,%d0			|alias denorm into norm
	bclrl	#2,%d1			|alias denorm into norm
	lslb	#2,%d1
	orb	%d0,%d1		|d1{3:2} = dtag, d1{1:0} = stag
|				;Tag values (bit 2 of each 3-bit tag
|				;was cleared above, so both are 2 bits):
|				;00 = norm or denorm
|				;01 = zero
|				;10 = inf
|				;11 = nan
|
|
	leal	pscalet,%a1		|load start of jump table
	movel	(%a1,%d1.w*4),%a1	|load a1 with label depending on tag
	jmp	(%a1)			|go to the routine

scl_opr:
	bra	t_operr

scl_dnan:
	bra	dst_nan

| scl_zro: zero with the sign of the destination (FPTEMP)
scl_zro:
	btstb	#sign_bit,FPTEMP_EX(%a6)	|test if + or -
	beq	ld_pzero		|if pos then load +0
	bra	ld_mzero		|if neg then load -0
| scl_inf: infinity with the sign of the destination (FPTEMP)
scl_inf:
	btstb	#sign_bit,FPTEMP_EX(%a6)	|test if + or -
	beq	ld_pinf			|if pos then load +inf
	bra	ld_minf			|else neg load -inf
scl_snan:
	bra	src_nan
|
|	FSINCOS
|
| ssincosz: zero source.  fp0 gets a zero with the source's sign,
| fp1 gets +1, and control leaves through sto_cos.
|
	.global	ssincosz
ssincosz:
	btstb	#sign_bit,ETEMP(%a6)	|get sign
	beqs	sincosp
	fmovex	MZERO,%fp0
	bras	sincoscom
sincosp:
	fmovex	PZERO,%fp0
sincoscom:
	fmovemx	PONE,%fp1-%fp1		|do not allow FPSR to be affected
	bra	sto_cos			|store cosine result

|
| ssincosi: infinite source.  QNAN is stored as the cosine result
| through sto_cos, QNAN is loaded into fp0, then t_operr is taken.
|
	.global	ssincosi
ssincosi:
	fmovex	QNAN,%fp1		|load NAN
	bsr	sto_cos			|store cosine result
	fmovex	QNAN,%fp0		|load NAN
	bra	t_operr

|
| ssincosnan: NaN source.  ETEMP is copied to FP_SCR1, signan_bit is
| set in the copy, the copy is stored as the cosine result through
| sto_cos, then src_nan is taken.
|
	.global	ssincosnan
ssincosnan:
	movel	ETEMP_EX(%a6),FP_SCR1(%a6)
	movel	ETEMP_HI(%a6),FP_SCR1+4(%a6)
	movel	ETEMP_LO(%a6),FP_SCR1+8(%a6)
	bsetb	#signan_bit,FP_SCR1+4(%a6)
	fmovemx	FP_SCR1(%a6),%fp1-%fp1
	bsr	sto_cos
	bra	src_nan
|
| This code forces default values for the zero, inf, and nan cases
| in the transcendentals code.  The CC bits must be set in the
| stacked FPSR to be correctly reported.
|
|**Returns +PI/2
	.global	ld_ppi2
ld_ppi2:
	fmovex	PPIBY2,%fp0		|load +pi/2
	bra	t_inx2			|set inex2 exc

|**Returns -PI/2
	.global	ld_mpi2
ld_mpi2:
	fmovex	MPIBY2,%fp0		|load -pi/2
	orl	#neg_mask,USER_FPSR(%a6)	|set N bit
	bra	t_inx2			|set inex2 exc

|**Returns +inf
	.global	ld_pinf
ld_pinf:
	fmovex	PINF,%fp0		|load +inf
	orl	#inf_mask,USER_FPSR(%a6)	|set I bit
	rts

|**Returns -inf
	.global	ld_minf
ld_minf:
	fmovex	MINF,%fp0		|load -inf
	orl	#neg_mask+inf_mask,USER_FPSR(%a6)	|set N and I bits
	rts

|**Returns +1
	.global	ld_pone
ld_pone:
	fmovex	PONE,%fp0		|load +1
	rts

|**Returns -1
	.global	ld_mone
ld_mone:
	fmovex	MONE,%fp0		|load -1
	orl	#neg_mask,USER_FPSR(%a6)	|set N bit
	rts

|**Returns +0
	.global	ld_pzero
ld_pzero:
	fmovex	PZERO,%fp0		|load +0
	orl	#z_mask,USER_FPSR(%a6)	|set Z bit
	rts

|**Returns -0
	.global	ld_mzero
ld_mzero:
	fmovex	MZERO,%fp0		|load -0
	orl	#neg_mask+z_mask,USER_FPSR(%a6)	|set N and Z bits
	rts

	|end