cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

fp_scan.S (11682B)


      1/*
      2 * fp_scan.S
      3 *
      4 * Copyright Roman Zippel, 1997.  All rights reserved.
      5 *
      6 * Redistribution and use in source and binary forms, with or without
      7 * modification, are permitted provided that the following conditions
      8 * are met:
      9 * 1. Redistributions of source code must retain the above copyright
     10 *    notice, and the entire permission notice in its entirety,
     11 *    including the disclaimer of warranties.
     12 * 2. Redistributions in binary form must reproduce the above copyright
     13 *    notice, this list of conditions and the following disclaimer in the
     14 *    documentation and/or other materials provided with the distribution.
     15 * 3. The name of the author may not be used to endorse or promote
     16 *    products derived from this software without specific prior
     17 *    written permission.
     18 *
     19 * ALTERNATIVELY, this product may be distributed under the terms of
     20 * the GNU General Public License, in which case the provisions of the GPL are
     21 * required INSTEAD OF the above restrictions.  (This clause is
     22 * necessary due to a potential bad interaction between the GPL and
     23 * the restrictions contained in a BSD-style copyright.)
     24 *
     25 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
     26 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     27 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     28 * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
     29 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
     30 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     31 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     32 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
     33 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
     35 * OF THE POSSIBILITY OF SUCH DAMAGE.
     36 */
     37
     38#include "fp_emu.h"
     39#include "fp_decode.h"
     40
     41	.globl	fp_scan, fp_datasize
     42
     43	.data
     44
     45| %d2 - first two instr words
     46| %d1 - operand size
     47
     48/* operand formats are:
     49
     50	Long = 0,		i.e. fmove.l
     51	Single,			i.e. fmove.s
     52	Extended,		i.e. fmove.x
     53	Packed-BCD,		i.e. fmove.p
     54	Word,			i.e. fmove.w
     55	Double,			i.e. fmove.d
     56*/
     57
     58	.text
     59
     60| On entry:
     61| FPDATA - base of emulated FPU registers
     62
     63fp_scan:
     64| normal fpu instruction? (this excludes fsave/frestore)
     65	fp_get_pc %a0
     66	printf	PDECODE,"%08x: ",1,%a0
     67	getuser.b (%a0),%d0,fp_err_ua1,%a0
     68#if 1
     69	cmp.b	#0xf2,%d0		| cpid = 1
     70#else
     71	cmp.b	#0xfc,%d0		| cpid = 6
     72#endif
     73	jne	fp_nonstd
     74| first two instruction words are kept in %d2
     75	getuser.l (%a0)+,%d2,fp_err_ua1,%a0
     76	fp_put_pc %a0
     77fp_decode_cond:				| separate conditional instr
     78	fp_decode_cond_instr_type
     79
     80	.long	fp_decode_move, fp_fscc
     81	.long	fp_fbccw, fp_fbccl
     82
     83fp_decode_move:				| separate move instr
     84	fp_decode_move_instr_type
     85
     86	.long	fp_fgen_fp, fp_ill
     87	.long	fp_fgen_ea, fp_fmove_fp2mem
     88	.long	fp_fmovem_cr, fp_fmovem_cr
     89	.long	fp_fmovem_fp, fp_fmovem_fp
     90
     91| now all arithmetic instr and a few move instr are left
     92fp_fgen_fp:				| source is a fpu register
     93	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
     94	fp_decode_sourcespec
     95	printf	PDECODE,"f<op>.x fp%d",1,%d0
     96	fp_get_fp_reg
     97	lea	(FPD_TEMPFP1,FPDATA),%a1 | copy src into a temp location
     98	move.l	(%a0)+,(%a1)+
     99	move.l	(%a0)+,(%a1)+
    100	move.l	(%a0),(%a1)
    101	lea	(-8,%a1),%a0
    102	jra	fp_getdest
    103
    104fp_fgen_ea:				| source is <ea>
    105	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
    106	| sort out fmovecr, keep data size in %d1
    107	fp_decode_sourcespec
    108	cmp.w	#7,%d0
    109	jeq	fp_fmovecr
    110	move.w	%d0,%d1			| store data size twice in %d1
    111	swap	%d1			| one can be trashed below
    112	move.w	%d0,%d1
    113#ifdef FPU_EMU_DEBUG
    114	lea	0f,%a0
    115	clr.l	%d0
    116	move.b	(%a0,%d1.w),%d0
    117	printf	PDECODE,"f<op>.%c ",1,%d0
    118
    119	.data
    1200:	.byte	'l','s','x','p','w','d','b',0
    121	.previous
    122#endif
    123
    124/*
    125	fp_getsource, fp_getdest
    126
    127	basically, we end up with a pointer to the source operand in
    128	%a1, and a pointer to the destination operand in %a0.  both
    129	are, of course, 96-bit extended floating point numbers.
    130*/
    131
    132fp_getsource:
    133	| decode addressing mode for source
    134	fp_decode_addr_mode
    135
    136	.long	fp_data, fp_ill
    137	.long	fp_indirect, fp_postinc
    138	.long	fp_predecr, fp_disp16
    139	.long	fp_extmode0, fp_extmode1
    140
    141	| addressing mode: data register direct
    142fp_data:
    143	fp_mode_data_direct
    144	jsr	fp_get_data_reg
    145	lea	(FPD_TEMPFP1,FPDATA),%a0
    146	jmp	([0f:w,%pc,%d1.w*4])
    147
    148	.align	4
    1490:
    150	.long	fp_data_long, fp_data_single
    151	.long	fp_ill, fp_ill
    152	.long	fp_data_word, fp_ill
    153	.long	fp_data_byte, fp_ill
    154
    155	| data types that fit in an integer data register
    156fp_data_byte:
    157	extb.l	%d0
    158	jra	fp_data_long
    159
    160fp_data_word:
    161	ext.l	%d0
    162
    163fp_data_long:
    164	jsr	fp_conv_long2ext
    165	jra	fp_getdest
    166
    167fp_data_single:
    168	jsr	fp_conv_single2ext
    169	jra	fp_getdest
    170
    171	| addressing mode: address register indirect
    172fp_indirect:
    173	fp_mode_addr_indirect
    174	jra	fp_fetchsource
    175
    176	| addressing mode: address register indirect with postincrement
    177fp_postinc:
    178	fp_mode_addr_indirect_postinc
    179	jra	fp_fetchsource
    180
    181	| addressing mode: address register indirect with predecrement
    182fp_predecr:
    183	fp_mode_addr_indirect_predec
    184	jra	fp_fetchsource
    185
    186	| addressing mode: address register/programm counter indirect
    187	|		   with 16bit displacement
    188fp_disp16:
    189	fp_mode_addr_indirect_disp16
    190	jra	fp_fetchsource
    191
    192	| all other indirect addressing modes will finally end up here
    193fp_extmode0:
    194	fp_mode_addr_indirect_extmode0
    195	jra	fp_fetchsource
    196
    197| all pc relative addressing modes and immediate/absolute modes end up here
    198| the first ones are sent to fp_extmode0 or fp_disp16
    199| and only the latter are handled here
    200fp_extmode1:
    201	fp_decode_addr_reg
    202	jmp	([0f:w,%pc,%d0*4])
    203
    204	.align	4
    2050:
    206	.long	fp_abs_short, fp_abs_long
    207	.long	fp_disp16, fp_extmode0
    208	.long	fp_immediate, fp_ill
    209	.long	fp_ill, fp_ill
    210
    211	| addressing mode: absolute short
    212fp_abs_short:
    213	fp_mode_abs_short
    214	jra	fp_fetchsource
    215
    216	| addressing mode: absolute long
    217fp_abs_long:
    218	fp_mode_abs_long
    219	jra	fp_fetchsource
    220
    221	| addressing mode: immediate data
    222fp_immediate:
    223	printf	PDECODE,"#"
    224	fp_get_pc %a0
    225	move.w	(fp_datasize,%d1.w*2),%d0
    226	addq.w	#1,%d0
    227	and.w	#-2,%d0
    228#ifdef FPU_EMU_DEBUG
    229	movem.l	%d0/%d1,-(%sp)
    230	movel	%a0,%a1
    231	clr.l	%d1
    232	jra	2f
    2331:	getuser.b (%a1)+,%d1,fp_err_ua1,%a1
    234	printf	PDECODE,"%02x",1,%d1
    2352:	dbra	%d0,1b
    236	movem.l	(%sp)+,%d0/%d1
    237#endif
    238	lea	(%a0,%d0.w),%a1
    239	fp_put_pc %a1
    240|	jra	fp_fetchsource
    241
    242fp_fetchsource:
    243	move.l	%a0,%a1
    244	swap	%d1
    245	lea	(FPD_TEMPFP1,FPDATA),%a0
    246	jmp	([0f:w,%pc,%d1.w*4])
    247
    248	.align	4
    2490:	.long	fp_long, fp_single
    250	.long	fp_ext, fp_pack
    251	.long	fp_word, fp_double
    252	.long	fp_byte, fp_ill
    253
    254fp_long:
    255	getuser.l (%a1),%d0,fp_err_ua1,%a1
    256	jsr	fp_conv_long2ext
    257	jra	fp_getdest
    258
    259fp_single:
    260	getuser.l (%a1),%d0,fp_err_ua1,%a1
    261	jsr	fp_conv_single2ext
    262	jra	fp_getdest
    263
    264fp_ext:
    265	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
    266	lsr.l	#8,%d0
    267	lsr.l	#7,%d0
    268	lsr.w	#1,%d0
    269	move.l	%d0,(%a0)+
    270	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
    271	move.l	%d0,(%a0)+
    272	getuser.l (%a1),%d0,fp_err_ua1,%a1
    273	move.l	%d0,(%a0)
    274	subq.l	#8,%a0
    275	jra	fp_getdest
    276
    277fp_pack:
    278	/* not supported yet */
    279	jra	fp_ill
    280
    281fp_word:
    282	getuser.w (%a1),%d0,fp_err_ua1,%a1
    283	ext.l	%d0
    284	jsr	fp_conv_long2ext
    285	jra	fp_getdest
    286
    287fp_double:
    288	jsr	fp_conv_double2ext
    289	jra	fp_getdest
    290
    291fp_byte:
    292	getuser.b (%a1),%d0,fp_err_ua1,%a1
    293	extb.l	%d0
    294	jsr	fp_conv_long2ext
    295|	jra	fp_getdest
    296
    297fp_getdest:
    298	move.l	%a0,%a1
    299	bfextu	%d2{#22,#3},%d0
    300	printf	PDECODE,",fp%d\n",1,%d0
    301	fp_get_fp_reg
    302	movem.l	%a0/%a1,-(%sp)
    303	pea	fp_finalrounding
    304	bfextu	%d2{#25,#7},%d0
    305	jmp	([0f:w,%pc,%d0*4])
    306
    307	.align	4
    3080:
    309	.long	fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz
    310	.long	fp_fsqrt, fp_ill, fp_flognp1, fp_ill
    311	.long	fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill
    312	.long	fp_fasin, fp_fatanh, fp_fsin, fp_ftan
    313	.long	fp_fetox, fp_ftwotox, fp_ftentox, fp_ill
    314	.long	fp_flogn, fp_flog10, fp_flog2, fp_ill
    315	.long	fp_fabs, fp_fcosh, fp_fneg, fp_ill
    316	.long	fp_facos, fp_fcos, fp_fgetexp, fp_fgetman
    317	.long	fp_fdiv, fp_fmod, fp_fadd, fp_fmul
    318	.long	fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul
    319	.long	fp_fsub, fp_ill, fp_ill, fp_ill
    320	.long	fp_ill, fp_ill, fp_ill, fp_ill
    321	.long	fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3
    322	.long	fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7
    323	.long	fp_fcmp, fp_ill, fp_ftst, fp_ill
    324	.long	fp_ill, fp_ill, fp_ill, fp_ill
    325	.long	fp_fsmove, fp_fssqrt, fp_ill, fp_ill
    326	.long	fp_fdmove, fp_fdsqrt, fp_ill, fp_ill
    327	.long	fp_ill, fp_ill, fp_ill, fp_ill
    328	.long	fp_ill, fp_ill, fp_ill, fp_ill
    329	.long	fp_ill, fp_ill, fp_ill, fp_ill
    330	.long	fp_ill, fp_ill, fp_ill, fp_ill
    331	.long	fp_fsabs, fp_ill, fp_fsneg, fp_ill
    332	.long	fp_fdabs, fp_ill, fp_fdneg, fp_ill
    333	.long	fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul
    334	.long	fp_fddiv, fp_ill, fp_fdadd, fp_fdmul
    335	.long	fp_fssub, fp_ill, fp_ill, fp_ill
    336	.long	fp_fdsub, fp_ill, fp_ill, fp_ill
    337	.long	fp_ill, fp_ill, fp_ill, fp_ill
    338	.long	fp_ill, fp_ill, fp_ill, fp_ill
    339	.long	fp_ill, fp_ill, fp_ill, fp_ill
    340	.long	fp_ill, fp_ill, fp_ill, fp_ill
    341
    342	| Instructions follow
    343
    344	| Move an (emulated) ROM constant
    345fp_fmovecr:
    346	bfextu	%d2{#27,#5},%d0
    347	printf	PINSTR,"fp_fmovecr #%d",1,%d0
    348	move.l	%d0,%d1
    349	add.l	%d0,%d0
    350	add.l	%d1,%d0
    351	lea	(fp_constants,%d0*4),%a0
    352	move.l	#0x801cc0ff,%d0
    353	addq.l	#1,%d1
    354	lsl.l	%d1,%d0
    355	jcc	1f
    356	fp_set_sr FPSR_EXC_INEX2			| INEX2 exception
    3571:	moveq	#-128,%d0				| continue with fmove
    358	and.l	%d0,%d2
    359	jra	fp_getdest
    360
    361	.data
    362	.align	4
    363fp_constants:
    364	.long	0x00004000,0xc90fdaa2,0x2168c235	| pi
    365	.extend	0,0,0,0,0,0,0,0,0,0
    366	.long	0x00003ffd,0x9a209a84,0xfbcff798	| log10(2)
    367	.long	0x00004000,0xadf85458,0xa2bb4a9a	| e
    368	.long	0x00003fff,0xb8aa3b29,0x5c17f0bc	| log2(e)
    369	.long	0x00003ffd,0xde5bd8a9,0x37287195	| log10(e)
    370	.long	0x00000000,0x00000000,0x00000000	| 0.0
    371	.long	0x00003ffe,0xb17217f7,0xd1cf79ac	| 1n(2)
    372	.long	0x00004000,0x935d8ddd,0xaaa8ac17	| 1n(10)
    373	| read this as "1.0 * 2^0" - note the high bit in the mantissa
    374	.long	0x00003fff,0x80000000,0x00000000	| 10^0
    375	.long	0x00004002,0xa0000000,0x00000000	| 10^1
    376	.long	0x00004005,0xc8000000,0x00000000	| 10^2
    377	.long	0x0000400c,0x9c400000,0x00000000	| 10^4
    378	.long	0x00004019,0xbebc2000,0x00000000	| 10^8
    379	.long	0x00004034,0x8e1bc9bf,0x04000000	| 10^16
    380	.long	0x00004069,0x9dc5ada8,0x2b70b59e	| 10^32
    381	.long	0x000040d3,0xc2781f49,0xffcfa6d5	| 10^64
    382	.long	0x000041a8,0x93ba47c9,0x80e98ce0	| 10^128
    383	.long	0x00004351,0xaa7eebfb,0x9df9de8e	| 10^256
    384	.long	0x000046a3,0xe319a0ae,0xa60e91c7	| 10^512
    385	.long	0x00004d48,0xc9767586,0x81750c17	| 10^1024
    386	.long	0x00005a92,0x9e8b3b5d,0xc53d5de5	| 10^2048
    387	.long	0x00007525,0xc4605202,0x8a20979b	| 10^4096
    388	.previous
    389
    390fp_fmove_mem2fp:
    391	printf	PINSTR,"fmove %p,%p\n",2,%a0,%a1
    392	move.l	(%a1)+,(%a0)+
    393	move.l	(%a1)+,(%a0)+
    394	move.l	(%a1),(%a0)
    395	subq.l	#8,%a0
    396	rts
    397
    398fpa_fsglmul:
    399	move.l	#fp_finalrounding_single_fast,(%sp)
    400	jra	fp_fsglmul
    401
    402fpa_fsgldiv:
    403	move.l	#fp_finalrounding_single_fast,(%sp)
    404	jra	fp_fsgldiv
    405
    406.macro	fp_dosingleprec instr
    407	printf	PINSTR,"single "
    408	move.l	#fp_finalrounding_single,(%sp)
    409	jra	\instr
    410.endm
    411
    412.macro	fp_dodoubleprec instr
    413	printf	PINSTR,"double "
    414	move.l	#fp_finalrounding_double,(%sp)
    415	jra	\instr
    416.endm
    417
    418fp_fsmove:
    419	fp_dosingleprec fp_fmove_mem2fp
    420
    421fp_fssqrt:
    422	fp_dosingleprec fp_fsqrt
    423
    424fp_fdmove:
    425	fp_dodoubleprec fp_fmove_mem2fp
    426
    427fp_fdsqrt:
    428	fp_dodoubleprec fp_fsqrt
    429
    430fp_fsabs:
    431	fp_dosingleprec fp_fabs
    432
    433fp_fsneg:
    434	fp_dosingleprec fp_fneg
    435
    436fp_fdabs:
    437	fp_dodoubleprec fp_fabs
    438
    439fp_fdneg:
    440	fp_dodoubleprec fp_fneg
    441
    442fp_fsdiv:
    443	fp_dosingleprec fp_fdiv
    444
    445fp_fsadd:
    446	fp_dosingleprec fp_fadd
    447
    448fp_fsmul:
    449	fp_dosingleprec fp_fmul
    450
    451fp_fddiv:
    452	fp_dodoubleprec fp_fdiv
    453
    454fp_fdadd:
    455	fp_dodoubleprec fp_fadd
    456
    457fp_fdmul:
    458	fp_dodoubleprec fp_fmul
    459
    460fp_fssub:
    461	fp_dosingleprec fp_fsub
    462
    463fp_fdsub:
    464	fp_dodoubleprec fp_fsub
    465
    466fp_nonstd:
    467	fp_get_pc %a0
    468	getuser.l (%a0),%d0,fp_err_ua1,%a0
    469	printf	,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
    470	moveq	#-1,%d0
    471	rts
    472
    473	.data
    474	.align	4
    475
    476	| data sizes corresponding to the operand formats
    477fp_datasize:
    478	.word	4, 4, 12, 12, 2, 8, 1, 0