fp_scan.S (11682B)
/*
 * fp_scan.S
 *
 * Copyright Roman Zippel, 1997. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, and the entire permission notice in its entirety,
 *    including the disclaimer of warranties.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The name of the author may not be used to endorse or promote
 *    products derived from this software without specific prior
 *    written permission.
 *
 * ALTERNATIVELY, this product may be distributed under the terms of
 * the GNU General Public License, in which case the provisions of the GPL are
 * required INSTEAD OF the above restrictions. (This clause is
 * necessary due to a potential bad interaction between the GPL and
 * the restrictions contained in a BSD-style copyright.)
 *
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
 * OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "fp_emu.h"
#include "fp_decode.h"

	.globl	fp_scan, fp_datasize

	.data

| Register roles throughout the decoder:
| %d2 - first two instr words
| %d1 - operand size (format code, kept in both halves of the register)

/* operand formats are:

	Long = 0,	i.e. fmove.l
	Single = 1,	i.e. fmove.s
	Extended = 2,	i.e. fmove.x
	Packed-BCD = 3,	i.e. fmove.p
	Word = 4,	i.e. fmove.w
	Double = 5,	i.e. fmove.d
	Byte = 6,	i.e. fmove.b

   Format code 7 in the source specifier selects fmovecr (see fp_fgen_ea).
*/

	.text

| fp_scan - entry point of the instruction decoder
|
| On entry:
|	FPDATA - base of emulated FPU registers
|
| Reads the instruction at the emulated PC.  Anything whose first byte is
| not 0xf2 is handed to fp_nonstd; otherwise the first two instruction
| words are loaded into %d2, the emulated PC is advanced past them and the
| instruction is dispatched through the decode tables below.

fp_scan:
| normal fpu instruction? (this excludes fsave/frestore)
	fp_get_pc %a0
	printf	PDECODE,"%08x: ",1,%a0
	getuser.b (%a0),%d0,fp_err_ua1,%a0
#if 1
	cmp.b	#0xf2,%d0		| cpid = 1
#else
	cmp.b	#0xfc,%d0		| cpid = 6
#endif
	jne	fp_nonstd
| first two instruction words are kept in %d2
	getuser.l (%a0)+,%d2,fp_err_ua1,%a0
	fp_put_pc %a0
fp_decode_cond:				| separate conditional instr
	fp_decode_cond_instr_type

	| the table must directly follow the decode macro
	.long	fp_decode_move, fp_fscc
	.long	fp_fbccw, fp_fbccl

fp_decode_move:				| separate move instr
	fp_decode_move_instr_type

	| the table must directly follow the decode macro
	.long	fp_fgen_fp, fp_ill
	.long	fp_fgen_ea, fp_fmove_fp2mem
	.long	fp_fmovem_cr, fp_fmovem_cr
	.long	fp_fmovem_fp, fp_fmovem_fp

| now all arithmetic instr and a few move instr are left
|
| fp_fgen_fp: the source operand is an FPU register.  It is copied (three
| longwords) into FPD_TEMPFP1 and %a0 is left pointing at that copy before
| continuing at fp_getdest.
fp_fgen_fp:				| source is a fpu register
	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
	fp_decode_sourcespec
	printf	PDECODE,"f<op>.x fp%d",1,%d0
	fp_get_fp_reg
	lea	(FPD_TEMPFP1,FPDATA),%a1 | copy src into a temp location
	move.l	(%a0)+,(%a1)+
	move.l	(%a0)+,(%a1)+
	move.l	(%a0),(%a1)
	lea	(-8,%a1),%a0		| back to the start of the temp copy
	jra	fp_getdest

| fp_fgen_ea: the source operand comes from an effective address.
| Format code 7 is fmovecr; every other code is stored in both words of
| %d1 and decoding falls through to fp_getsource.
fp_fgen_ea:				| source is <ea>
	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
	| sort out fmovecr, keep data size in %d1
	fp_decode_sourcespec
	cmp.w	#7,%d0
	jeq	fp_fmovecr
	move.w	%d0,%d1			| store data size twice in %d1
	swap	%d1			| one can be trashed below
	move.w	%d0,%d1
#ifdef FPU_EMU_DEBUG
	lea	0f,%a0
	clr.l	%d0
	move.b	(%a0,%d1.w),%d0		| format code -> size suffix letter
	printf	PDECODE,"f<op>.%c ",1,%d0

	.data
0:	.byte	'l','s','x','p','w','d','b',0
	.previous
#endif

/*
	fp_getsource, fp_getdest

	basically, we end up with a pointer to the source operand in
	%a1, and a pointer to the destination operand in %a0. both
	are, of course, 96-bit extended floating point numbers.
*/

fp_getsource:
	| decode addressing mode for source
	fp_decode_addr_mode

	| one entry per addressing mode; must directly follow the macro
	.long	fp_data, fp_ill
	.long	fp_indirect, fp_postinc
	.long	fp_predecr, fp_disp16
	.long	fp_extmode0, fp_extmode1

	| addressing mode: data register direct
	| The register value is converted in place; only the formats that
	| fit a data register (long, single, word, byte) are accepted.
fp_data:
	fp_mode_data_direct
	jsr	fp_get_data_reg
	lea	(FPD_TEMPFP1,FPDATA),%a0
	jmp	([0f:w,%pc,%d1.w*4])	| dispatch on the format code

	.align	4
0:
	.long	fp_data_long, fp_data_single
	.long	fp_ill, fp_ill
	.long	fp_data_word, fp_ill
	.long	fp_data_byte, fp_ill

	| data types that fit in an integer data register
fp_data_byte:
	extb.l	%d0			| sign-extend byte to long
	jra	fp_data_long

fp_data_word:
	ext.l	%d0			| sign-extend word to long
	| fall through to fp_data_long

fp_data_long:
	jsr	fp_conv_long2ext
	jra	fp_getdest

fp_data_single:
	jsr	fp_conv_single2ext
	jra	fp_getdest

	| addressing mode: address register indirect
fp_indirect:
	fp_mode_addr_indirect
	jra	fp_fetchsource

	| addressing mode: address register indirect with postincrement
fp_postinc:
	fp_mode_addr_indirect_postinc
	jra	fp_fetchsource

	| addressing mode: address register indirect with predecrement
fp_predecr:
	fp_mode_addr_indirect_predec
	jra	fp_fetchsource

	| addressing mode: address register/program counter indirect
	|		   with 16bit displacement
fp_disp16:
	fp_mode_addr_indirect_disp16
	jra	fp_fetchsource

	| all other indirect addressing modes will finally end up here
fp_extmode0:
	fp_mode_addr_indirect_extmode0
	jra	fp_fetchsource

| all pc relative addressing modes and immediate/absolute modes end up here
| the first ones are sent to fp_extmode0 or fp_disp16
| and only the latter are handled here
fp_extmode1:
	fp_decode_addr_reg
	jmp	([0f:w,%pc,%d0*4])	| dispatch on the register field

	.align	4
0:
	.long	fp_abs_short, fp_abs_long
	.long	fp_disp16, fp_extmode0
	.long	fp_immediate, fp_ill
	.long	fp_ill, fp_ill

	| addressing mode: absolute short
fp_abs_short:
	fp_mode_abs_short
	jra	fp_fetchsource

	| addressing mode: absolute long
fp_abs_long:
	fp_mode_abs_long
	jra	fp_fetchsource

	| addressing mode: immediate data
	| The operand lives in the instruction stream at the emulated PC.
	| The PC is advanced by the operand size rounded up to an even
	| number of bytes, and %a0 is left pointing at the operand for
	| fp_fetchsource.
fp_immediate:
	printf	PDECODE,"#"
	fp_get_pc %a0
	move.w	(fp_datasize,%d1.w*2),%d0	| operand size in bytes
	addq.w	#1,%d0
	and.w	#-2,%d0			| round up to a whole number of words
#ifdef FPU_EMU_DEBUG
	| dump the raw immediate bytes
	movem.l	%d0/%d1,-(%sp)
	move.l	%a0,%a1
	clr.l	%d1
	jra	2f
1:	getuser.b (%a1)+,%d1,fp_err_ua1,%a1
	printf	PDECODE,"%02x",1,%d1
2:	dbra	%d0,1b
	movem.l	(%sp)+,%d0/%d1
#endif
	lea	(%a0,%d0.w),%a1		| %a1 = address just past the immediate
	| A byte immediate occupies the low-order byte of its extension
	| word, so the operand is one byte past the start of that word.
	| %a1 was computed first so that the PC advance is unaffected.
	cmp.w	#6,%d1			| format 6 = byte
	jne	3f
	addq.l	#1,%a0
3:	fp_put_pc %a1
|	jra	fp_fetchsource

| fp_fetchsource: read the source operand from memory and convert it.
| On entry %a0 holds the operand address.  It is moved to %a1, the spare
| copy of the format code is swapped into the low word of %d1, and %a0 is
| pointed at FPD_TEMPFP1, which receives the converted value.
fp_fetchsource:
	move.l	%a0,%a1
	swap	%d1			| low word may have been trashed above
	lea	(FPD_TEMPFP1,FPDATA),%a0
	jmp	([0f:w,%pc,%d1.w*4])	| dispatch on the format code

	.align	4
0:	.long	fp_long, fp_single
	.long	fp_ext, fp_pack
	.long	fp_word, fp_double
	.long	fp_byte, fp_ill

fp_long:
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	jsr	fp_conv_long2ext
	jra	fp_getdest

fp_single:
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	jsr	fp_conv_single2ext
	jra	fp_getdest

| fp_ext: copy a 96-bit extended operand into the temp location.
| The three shifts rearrange the first longword: bit 31 ends up in bit 16
| and bits 30-16 end up in bits 14-0 (presumably sign and exponent in the
| layout used internally by the emulator).  The remaining two longwords
| are copied unchanged.
fp_ext:
	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
	lsr.l	#8,%d0
	lsr.l	#7,%d0
	lsr.w	#1,%d0
	move.l	%d0,(%a0)+
	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
	move.l	%d0,(%a0)+
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	move.l	%d0,(%a0)
	subq.l	#8,%a0			| back to the start of the temp copy
	jra	fp_getdest

fp_pack:
	/* not supported yet */
	jra	fp_ill

fp_word:
	getuser.w (%a1),%d0,fp_err_ua1,%a1
	ext.l	%d0			| sign-extend word to long
	jsr	fp_conv_long2ext
	jra	fp_getdest

	| no getuser here: %a1 (the operand address) is passed on to
	| fp_conv_double2ext as is
fp_double:
	jsr	fp_conv_double2ext
	jra	fp_getdest

fp_byte:
	getuser.b (%a1),%d0,fp_err_ua1,%a1
	extb.l	%d0			| sign-extend byte to long
	jsr	fp_conv_long2ext
|	jra	fp_getdest

| fp_getdest: select the destination register and run the operation.
| On entry %a0 points at the source operand.  It is moved to %a1, the
| three-bit field at bit offset 22 of %d2 selects the destination FPU
| register, and %a0/%a1 are pushed on the stack.  fp_finalrounding is
| pushed as the return address, so the handler chosen from the table
| below returns into it.  The table has 128 entries and is indexed by the
| seven-bit field at bit offset 25 of %d2 (the low seven bits).
fp_getdest:
	move.l	%a0,%a1
	bfextu	%d2{#22,#3},%d0
	printf	PDECODE,",fp%d\n",1,%d0
	fp_get_fp_reg
	movem.l	%a0/%a1,-(%sp)
	pea	fp_finalrounding
	bfextu	%d2{#25,#7},%d0
	jmp	([0f:w,%pc,%d0*4])

	.align	4
0:
	.long	fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz		| 0x00
	.long	fp_fsqrt, fp_ill, fp_flognp1, fp_ill			| 0x04
	.long	fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill			| 0x08
	.long	fp_fasin, fp_fatanh, fp_fsin, fp_ftan			| 0x0c
	.long	fp_fetox, fp_ftwotox, fp_ftentox, fp_ill		| 0x10
	.long	fp_flogn, fp_flog10, fp_flog2, fp_ill			| 0x14
	.long	fp_fabs, fp_fcosh, fp_fneg, fp_ill			| 0x18
	.long	fp_facos, fp_fcos, fp_fgetexp, fp_fgetman		| 0x1c
	.long	fp_fdiv, fp_fmod, fp_fadd, fp_fmul			| 0x20
	.long	fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul		| 0x24
	.long	fp_fsub, fp_ill, fp_ill, fp_ill				| 0x28
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x2c
	.long	fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3	| 0x30
	.long	fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7	| 0x34
	.long	fp_fcmp, fp_ill, fp_ftst, fp_ill			| 0x38
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x3c
	.long	fp_fsmove, fp_fssqrt, fp_ill, fp_ill			| 0x40
	.long	fp_fdmove, fp_fdsqrt, fp_ill, fp_ill			| 0x44
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x48
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x4c
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x50
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x54
	.long	fp_fsabs, fp_ill, fp_fsneg, fp_ill			| 0x58
	.long	fp_fdabs, fp_ill, fp_fdneg, fp_ill			| 0x5c
	.long	fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul			| 0x60
	.long	fp_fddiv, fp_ill, fp_fdadd, fp_fdmul			| 0x64
	.long	fp_fssub, fp_ill, fp_ill, fp_ill			| 0x68
	.long	fp_fdsub, fp_ill, fp_ill, fp_ill			| 0x6c
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x70
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x74
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x78
	.long	fp_ill, fp_ill, fp_ill, fp_ill				| 0x7c

	| Instructions follow

	| Move an (emulated) ROM constant
	|
	| The low five bits of %d2 select one of the 32 twelve-byte entries
	| of fp_constants; %a0 is pointed at the chosen entry.  The mask
	| 0x801cc0ff is then shifted left by (index + 1), so the carry ends
	| up holding bit (31 - index) of the mask; when it is set, INEX2 is
	| raised for that constant.  Finally the low seven bits of %d2 are
	| cleared so that fp_getdest dispatches to table entry 0
	| (fp_fmove_mem2fp).
fp_fmovecr:
	bfextu	%d2{#27,#5},%d0
	printf	PINSTR,"fp_fmovecr #%d",1,%d0
	move.l	%d0,%d1
	add.l	%d0,%d0
	add.l	%d1,%d0			| %d0 = index * 3 (longwords per entry)
	lea	(fp_constants,%d0*4),%a0
	move.l	#0x801cc0ff,%d0		| one flag bit per constant, MSB first
	addq.l	#1,%d1
	lsl.l	%d1,%d0
	jcc	1f
	fp_set_sr FPSR_EXC_INEX2	| INEX2 exception
1:	moveq	#-128,%d0		| continue with fmove
	and.l	%d0,%d2
	jra	fp_getdest

	.data
	.align	4
	| 32 entries of three longwords each, indexed as described above
fp_constants:
	.long	0x00004000,0xc90fdaa2,0x2168c235	| pi
	.extend	0,0,0,0,0,0,0,0,0,0			| entries 1-10
	.long	0x00003ffd,0x9a209a84,0xfbcff798	| log10(2)
	.long	0x00004000,0xadf85458,0xa2bb4a9a	| e
	.long	0x00003fff,0xb8aa3b29,0x5c17f0bc	| log2(e)
	.long	0x00003ffd,0xde5bd8a9,0x37287195	| log10(e)
	.long	0x00000000,0x00000000,0x00000000	| 0.0
	.long	0x00003ffe,0xb17217f7,0xd1cf79ac	| ln(2)
	.long	0x00004000,0x935d8ddd,0xaaa8ac17	| ln(10)
	| read this as "1.0 * 2^0" - note the high bit in the mantissa
	.long	0x00003fff,0x80000000,0x00000000	| 10^0
	.long	0x00004002,0xa0000000,0x00000000	| 10^1
	.long	0x00004005,0xc8000000,0x00000000	| 10^2
	.long	0x0000400c,0x9c400000,0x00000000	| 10^4
	.long	0x00004019,0xbebc2000,0x00000000	| 10^8
	.long	0x00004034,0x8e1bc9bf,0x04000000	| 10^16
	.long	0x00004069,0x9dc5ada8,0x2b70b59e	| 10^32
	.long	0x000040d3,0xc2781f49,0xffcfa6d5	| 10^64
	.long	0x000041a8,0x93ba47c9,0x80e98ce0	| 10^128
	.long	0x00004351,0xaa7eebfb,0x9df9de8e	| 10^256
	.long	0x000046a3,0xe319a0ae,0xa60e91c7	| 10^512
	.long	0x00004d48,0xc9767586,0x81750c17	| 10^1024
	.long	0x00005a92,0x9e8b3b5d,0xc53d5de5	| 10^2048
	.long	0x00007525,0xc4605202,0x8a20979b	| 10^4096
	.previous

| fp_fmove_mem2fp: copy the three-longword operand at (%a1) to (%a0) and
| return with %a0 pointing at the start of the destination again.
fp_fmove_mem2fp:
	printf	PINSTR,"fmove %p,%p\n",2,%a0,%a1
	move.l	(%a1)+,(%a0)+
	move.l	(%a1)+,(%a0)+
	move.l	(%a1),(%a0)
	subq.l	#8,%a0
	rts

| The wrappers below overwrite the return address that fp_getdest pushed
| (fp_finalrounding) with a different rounding routine and then jump to
| the shared implementation of the operation.

fpa_fsglmul:
	move.l	#fp_finalrounding_single_fast,(%sp)
	jra	fp_fsglmul

fpa_fsgldiv:
	move.l	#fp_finalrounding_single_fast,(%sp)
	jra	fp_fsgldiv

| run \instr, then return through fp_finalrounding_single
.macro	fp_dosingleprec instr
	printf	PINSTR,"single "
	move.l	#fp_finalrounding_single,(%sp)
	jra	\instr
.endm

| run \instr, then return through fp_finalrounding_double
.macro	fp_dodoubleprec instr
	printf	PINSTR,"double "
	move.l	#fp_finalrounding_double,(%sp)
	jra	\instr
.endm

fp_fsmove:
	fp_dosingleprec fp_fmove_mem2fp

fp_fssqrt:
	fp_dosingleprec fp_fsqrt

fp_fdmove:
	fp_dodoubleprec fp_fmove_mem2fp

fp_fdsqrt:
	fp_dodoubleprec fp_fsqrt

fp_fsabs:
	fp_dosingleprec fp_fabs

fp_fsneg:
	fp_dosingleprec fp_fneg

fp_fdabs:
	fp_dodoubleprec fp_fabs

fp_fdneg:
	fp_dodoubleprec fp_fneg

fp_fsdiv:
	fp_dosingleprec fp_fdiv

fp_fsadd:
	fp_dosingleprec fp_fadd

fp_fsmul:
	fp_dosingleprec fp_fmul

fp_fddiv:
	fp_dodoubleprec fp_fdiv

fp_fdadd:
	fp_dodoubleprec fp_fadd

fp_fdmul:
	fp_dodoubleprec fp_fmul

fp_fssub:
	fp_dosingleprec fp_fsub

fp_fdsub:
	fp_dodoubleprec fp_fsub

| fp_nonstd: the instruction does not start with the expected coprocessor
| byte.  Log the longword at the emulated PC and return -1 in %d0.
fp_nonstd:
	fp_get_pc %a0
	getuser.l (%a0),%d0,fp_err_ua1,%a0
	printf	,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
	moveq	#-1,%d0
	rts

	.data
	.align	4

	| data sizes corresponding to the operand formats
	| (bytes, indexed by format code 0-7)
fp_datasize:
	.word	4, 4, 12, 12, 2, 8, 1, 0