cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

mca_asm.S (27971B)


      1/* SPDX-License-Identifier: GPL-2.0 */
      2/*
      3 * File:	mca_asm.S
      4 * Purpose:	assembly portion of the IA64 MCA handling
      5 *
      6 * Mods by cfleck to integrate into kernel build
      7 *
      8 * 2000-03-15 David Mosberger-Tang <davidm@hpl.hp.com>
      9 *		Added various stop bits to get a clean compile
     10 *
     11 * 2000-03-29 Chuck Fleckenstein <cfleck@co.intel.com>
     12 *		Added code to save INIT handoff state in pt_regs format,
     13 *		switch to temp kstack, switch modes, jump to C INIT handler
     14 *
     15 * 2002-01-04 J.Hall <jenna.s.hall@intel.com>
     16 *		Before entering virtual mode code:
     17 *		 1. Check for TLB CPU error
     18 *		 2. Restore current thread pointer to kr6
     19 *		 3. Move stack ptr 16 bytes to conform to C calling convention
     20 *
     21 * 2004-11-12 Russ Anderson <rja@sgi.com>
     22 *		Added per cpu MCA/INIT stack save areas.
     23 *
     24 * 2005-12-08 Keith Owens <kaos@sgi.com>
     25 *		Use per cpu MCA/INIT stacks for all data.
     26 */
     27#include <linux/threads.h>
     28#include <linux/pgtable.h>
     29
     30#include <asm/asmmacro.h>
     31#include <asm/processor.h>
     32#include <asm/mca_asm.h>
     33#include <asm/mca.h>
     34
     35#include "entry.h"
     36
     37#define GET_IA64_MCA_DATA(reg)						\
     38	GET_THIS_PADDR(reg, ia64_mca_data)				\
     39	;;								\
     40	ld8 reg=[reg]
     41
     42	.global ia64_do_tlb_purge
     43	.global ia64_os_mca_dispatch
     44	.global ia64_os_init_on_kdump
     45	.global ia64_os_init_dispatch_monarch
     46	.global ia64_os_init_dispatch_slave
     47
     48	.text
     49	.align 16
     50
     51//StartMain////////////////////////////////////////////////////////////////////
     52
     53/*
     54 * Just the TLB purge part is moved to a separate function
     55 * so we can re-use the code for cpu hotplug code as well
     56 * Caller should now setup b1, so we can branch once the
     57 * tlb flush is complete.
     58 */
     59
     60ia64_do_tlb_purge:
     61#define O(member)	IA64_CPUINFO_##member##_OFFSET
     62
     63	GET_THIS_PADDR(r2, ia64_cpu_info) // load phys addr of cpu_info into r2
     64	;;
     65	addl r17=O(PTCE_STRIDE),r2
     66	addl r2=O(PTCE_BASE),r2
     67	;;
     68	ld8 r18=[r2],(O(PTCE_COUNT)-O(PTCE_BASE));;	// r18=ptce_base
     69	ld4 r19=[r2],4					// r19=ptce_count[0]
     70	ld4 r21=[r17],4					// r21=ptce_stride[0]
     71	;;
     72	ld4 r20=[r2]					// r20=ptce_count[1]
     73	ld4 r22=[r17]					// r22=ptce_stride[1]
     74	mov r24=0
     75	;;
     76	adds r20=-1,r20
     77	;;
     78#undef O
     79
     802:
     81	cmp.ltu p6,p7=r24,r19
     82(p7)	br.cond.dpnt.few 4f
     83	mov ar.lc=r20
     843:
     85	ptc.e r18
     86	;;
     87	add r18=r22,r18
     88	br.cloop.sptk.few 3b
     89	;;
     90	add r18=r21,r18
     91	add r24=1,r24
     92	;;
     93	br.sptk.few 2b
     944:
     95	srlz.i 			// srlz.i implies srlz.d
     96	;;
     97
     98        // Now purge addresses formerly mapped by TR registers
     99	// 1. Purge ITR&DTR for kernel.
    100	movl r16=KERNEL_START
    101	mov r18=KERNEL_TR_PAGE_SHIFT<<2
    102	;;
    103	ptr.i r16, r18
    104	ptr.d r16, r18
    105	;;
    106	srlz.i
    107	;;
    108	srlz.d
    109	;;
    110	// 3. Purge ITR for PAL code.
    111	GET_THIS_PADDR(r2, ia64_mca_pal_base)
    112	;;
    113	ld8 r16=[r2]
    114	mov r18=IA64_GRANULE_SHIFT<<2
    115	;;
    116	ptr.i r16,r18
    117	;;
    118	srlz.i
    119	;;
    120	// 4. Purge DTR for stack.
    121	mov r16=IA64_KR(CURRENT_STACK)
    122	;;
    123	shl r16=r16,IA64_GRANULE_SHIFT
    124	movl r19=PAGE_OFFSET
    125	;;
    126	add r16=r19,r16
    127	mov r18=IA64_GRANULE_SHIFT<<2
    128	;;
    129	ptr.d r16,r18
    130	;;
    131	srlz.i
    132	;;
    133	// Now branch away to caller.
    134	br.sptk.many b1
    135	;;
    136
    137//EndMain//////////////////////////////////////////////////////////////////////
    138
    139//StartMain////////////////////////////////////////////////////////////////////
    140
    141ia64_os_mca_dispatch:
    142	mov r3=IA64_MCA_CPU_MCA_STACK_OFFSET	// use the MCA stack
    143	LOAD_PHYSICAL(p0,r2,1f)			// return address
    144	mov r19=1				// All MCA events are treated as monarch (for now)
    145	br.sptk ia64_state_save			// save the state that is not in minstate
    1461:
    147
    148	GET_IA64_MCA_DATA(r2)
    149	// Using MCA stack, struct ia64_sal_os_state, variable proc_state_param
    150	;;
    151	add r3=IA64_MCA_CPU_MCA_STACK_OFFSET+MCA_SOS_OFFSET+SOS(PROC_STATE_PARAM), r2
    152	;;
    153	ld8 r18=[r3]				// Get processor state parameter on existing PALE_CHECK.
    154	;;
    155	tbit.nz p6,p7=r18,60
    156(p7)	br.spnt done_tlb_purge_and_reload
    157
    158	// The following code purges TC and TR entries. Then reload all TC entries.
    159	// Purge percpu data TC entries.
    160begin_tlb_purge_and_reload:
    161	movl r18=ia64_reload_tr;;
    162	LOAD_PHYSICAL(p0,r18,ia64_reload_tr);;
    163	mov b1=r18;;
    164	br.sptk.many ia64_do_tlb_purge;;
    165
    166ia64_reload_tr:
    167	// Finally reload the TR registers.
    168	// 1. Reload DTR/ITR registers for kernel.
    169	mov r18=KERNEL_TR_PAGE_SHIFT<<2
    170	movl r17=KERNEL_START
    171	;;
    172	mov cr.itir=r18
    173	mov cr.ifa=r17
    174        mov r16=IA64_TR_KERNEL
    175	mov r19=ip
    176	movl r18=PAGE_KERNEL
    177	;;
    178        dep r17=0,r19,0, KERNEL_TR_PAGE_SHIFT
    179	;;
    180	or r18=r17,r18
    181	;;
    182        itr.i itr[r16]=r18
    183	;;
    184        itr.d dtr[r16]=r18
    185        ;;
    186	srlz.i
    187	srlz.d
    188	;;
    189	// 3. Reload ITR for PAL code.
    190	GET_THIS_PADDR(r2, ia64_mca_pal_pte)
    191	;;
    192	ld8 r18=[r2]			// load PAL PTE
    193	;;
    194	GET_THIS_PADDR(r2, ia64_mca_pal_base)
    195	;;
    196	ld8 r16=[r2]			// load PAL vaddr
    197	mov r19=IA64_GRANULE_SHIFT<<2
    198	;;
    199	mov cr.itir=r19
    200	mov cr.ifa=r16
    201	mov r20=IA64_TR_PALCODE
    202	;;
    203	itr.i itr[r20]=r18
    204	;;
    205	srlz.i
    206	;;
    207	// 4. Reload DTR for stack.
    208	mov r16=IA64_KR(CURRENT_STACK)
    209	;;
    210	shl r16=r16,IA64_GRANULE_SHIFT
    211	movl r19=PAGE_OFFSET
    212	;;
    213	add r18=r19,r16
    214	movl r20=PAGE_KERNEL
    215	;;
    216	add r16=r20,r16
    217	mov r19=IA64_GRANULE_SHIFT<<2
    218	;;
    219	mov cr.itir=r19
    220	mov cr.ifa=r18
    221	mov r20=IA64_TR_CURRENT_STACK
    222	;;
    223	itr.d dtr[r20]=r16
    224	GET_THIS_PADDR(r2, ia64_mca_tr_reload)
    225	mov r18 = 1
    226	;;
    227	srlz.d
    228	;;
    229	st8 [r2] =r18
    230	;;
    231
    232done_tlb_purge_and_reload:
    233
    234	// switch to per cpu MCA stack
    235	mov r3=IA64_MCA_CPU_MCA_STACK_OFFSET	// use the MCA stack
    236	LOAD_PHYSICAL(p0,r2,1f)			// return address
    237	br.sptk ia64_new_stack
    2381:
    239
    240	// everything saved, now we can set the kernel registers
    241	mov r3=IA64_MCA_CPU_MCA_STACK_OFFSET	// use the MCA stack
    242	LOAD_PHYSICAL(p0,r2,1f)			// return address
    243	br.sptk ia64_set_kernel_registers
    2441:
    245
    246	// This must be done in physical mode
    247	GET_IA64_MCA_DATA(r2)
    248	;;
    249	mov r7=r2
    250
    251        // Enter virtual mode from physical mode
    252	VIRTUAL_MODE_ENTER(r2, r3, ia64_os_mca_virtual_begin, r4)
    253
    254	// This code returns to SAL via SOS r2, in general SAL has no unwind
    255	// data.  To get a clean termination when backtracing the C MCA/INIT
    256	// handler, set a dummy return address of 0 in this routine.  That
    257	// requires that ia64_os_mca_virtual_begin be a global function.
    258ENTRY(ia64_os_mca_virtual_begin)
    259	.prologue
    260	.save rp,r0
    261	.body
    262
    263	mov ar.rsc=3				// set eager mode for C handler
    264	mov r2=r7				// see GET_IA64_MCA_DATA above
    265	;;
    266
    267	// Call virtual mode handler
    268	alloc r14=ar.pfs,0,0,3,0
    269	;;
    270	DATA_PA_TO_VA(r2,r7)
    271	;;
    272	add out0=IA64_MCA_CPU_MCA_STACK_OFFSET+MCA_PT_REGS_OFFSET, r2
    273	add out1=IA64_MCA_CPU_MCA_STACK_OFFSET+MCA_SWITCH_STACK_OFFSET, r2
    274	add out2=IA64_MCA_CPU_MCA_STACK_OFFSET+MCA_SOS_OFFSET, r2
    275	br.call.sptk.many    b0=ia64_mca_handler
    276
    277	// Revert back to physical mode before going back to SAL
    278	PHYSICAL_MODE_ENTER(r2, r3, ia64_os_mca_virtual_end, r4)
    279ia64_os_mca_virtual_end:
    280
    281END(ia64_os_mca_virtual_begin)
    282
    283	// switch back to previous stack
    284	alloc r14=ar.pfs,0,0,0,0		// remove the MCA handler frame
    285	mov r3=IA64_MCA_CPU_MCA_STACK_OFFSET	// use the MCA stack
    286	LOAD_PHYSICAL(p0,r2,1f)			// return address
    287	br.sptk ia64_old_stack
    2881:
    289
    290	mov r3=IA64_MCA_CPU_MCA_STACK_OFFSET	// use the MCA stack
    291	LOAD_PHYSICAL(p0,r2,1f)			// return address
    292	br.sptk ia64_state_restore		// restore the SAL state
    2931:
    294
    295	mov		b0=r12			// SAL_CHECK return address
    296
    297	br		b0
    298
    299//EndMain//////////////////////////////////////////////////////////////////////
    300
    301//StartMain////////////////////////////////////////////////////////////////////
    302
    303//
    304// NOP init handler for kdump.  In panic situation, we may receive INIT
    305// while kernel transition.  Since we initialize registers on leave from
    306// current kernel, no longer monarch/slave handlers of current kernel in
    307// virtual mode are called safely.
    308// We can unregister these init handlers from SAL, however then the INIT
    309// will result in warmboot by SAL and we cannot retrieve the crashdump.
    310// Therefore register this NOP function to SAL, to prevent entering virtual
    311// mode and resulting warmboot by SAL.
    312//
    313ia64_os_init_on_kdump:
    314	mov		r8=r0		// IA64_INIT_RESUME
    315	mov             r9=r10		// SAL_GP
    316	mov		r22=r17		// *minstate
    317	;;
    318	mov		r10=r0		// return to same context
    319	mov		b0=r12		// SAL_CHECK return address
    320	br		b0
    321
    322//
    323// SAL to OS entry point for INIT on all processors.  This has been defined for
    324// registration purposes with SAL as a part of ia64_mca_init.  Monarch and
    325// slave INIT have identical processing, except for the value of the
    326// sos->monarch flag in r19.
    327//
    328
    329ia64_os_init_dispatch_monarch:
    330	mov r19=1				// Bow, bow, ye lower middle classes!
    331	br.sptk ia64_os_init_dispatch
    332
    333ia64_os_init_dispatch_slave:
    334	mov r19=0				// <igor>yeth, mathter</igor>
    335
    336ia64_os_init_dispatch:
    337
    338	mov r3=IA64_MCA_CPU_INIT_STACK_OFFSET	// use the INIT stack
    339	LOAD_PHYSICAL(p0,r2,1f)			// return address
    340	br.sptk ia64_state_save			// save the state that is not in minstate
    3411:
    342
    343	// switch to per cpu INIT stack
    344	mov r3=IA64_MCA_CPU_INIT_STACK_OFFSET	// use the INIT stack
    345	LOAD_PHYSICAL(p0,r2,1f)			// return address
    346	br.sptk ia64_new_stack
    3471:
    348
    349	// everything saved, now we can set the kernel registers
    350	mov r3=IA64_MCA_CPU_INIT_STACK_OFFSET	// use the INIT stack
    351	LOAD_PHYSICAL(p0,r2,1f)			// return address
    352	br.sptk ia64_set_kernel_registers
    3531:
    354
    355	// This must be done in physical mode
    356	GET_IA64_MCA_DATA(r2)
    357	;;
    358	mov r7=r2
    359
    360        // Enter virtual mode from physical mode
    361	VIRTUAL_MODE_ENTER(r2, r3, ia64_os_init_virtual_begin, r4)
    362
    363	// This code returns to SAL via SOS r2, in general SAL has no unwind
    364	// data.  To get a clean termination when backtracing the C MCA/INIT
    365	// handler, set a dummy return address of 0 in this routine.  That
    366	// requires that ia64_os_init_virtual_begin be a global function.
    367ENTRY(ia64_os_init_virtual_begin)
    368	.prologue
    369	.save rp,r0
    370	.body
    371
    372	mov ar.rsc=3				// set eager mode for C handler
    373	mov r2=r7				// see GET_IA64_MCA_DATA above
    374	;;
    375
    376	// Call virtual mode handler
    377	alloc r14=ar.pfs,0,0,3,0
    378	;;
    379	DATA_PA_TO_VA(r2,r7)
    380	;;
    381	add out0=IA64_MCA_CPU_INIT_STACK_OFFSET+MCA_PT_REGS_OFFSET, r2
    382	add out1=IA64_MCA_CPU_INIT_STACK_OFFSET+MCA_SWITCH_STACK_OFFSET, r2
    383	add out2=IA64_MCA_CPU_INIT_STACK_OFFSET+MCA_SOS_OFFSET, r2
    384	br.call.sptk.many    b0=ia64_init_handler
    385
    386	// Revert back to physical mode before going back to SAL
    387	PHYSICAL_MODE_ENTER(r2, r3, ia64_os_init_virtual_end, r4)
    388ia64_os_init_virtual_end:
    389
    390END(ia64_os_init_virtual_begin)
    391
    392	mov r3=IA64_MCA_CPU_INIT_STACK_OFFSET	// use the INIT stack
    393	LOAD_PHYSICAL(p0,r2,1f)			// return address
    394	br.sptk ia64_state_restore		// restore the SAL state
    3951:
    396
    397	// switch back to previous stack
    398	alloc r14=ar.pfs,0,0,0,0		// remove the INIT handler frame
    399	mov r3=IA64_MCA_CPU_INIT_STACK_OFFSET	// use the INIT stack
    400	LOAD_PHYSICAL(p0,r2,1f)			// return address
    401	br.sptk ia64_old_stack
    4021:
    403
    404	mov		b0=r12			// SAL_CHECK return address
    405	br		b0
    406
    407//EndMain//////////////////////////////////////////////////////////////////////
    408
    409// common defines for the stubs
    410#define	ms		r4
    411#define	regs		r5
    412#define	temp1		r2	/* careful, it overlaps with input registers */
    413#define	temp2		r3	/* careful, it overlaps with input registers */
    414#define	temp3		r7
    415#define	temp4		r14
    416
    417
    418//++
    419// Name:
    420//	ia64_state_save()
    421//
    422// Stub Description:
    423//
    424//	Save the state that is not in minstate.  This is sensitive to the layout of
    425//	struct ia64_sal_os_state in mca.h.
    426//
    427//	r2 contains the return address, r3 contains either
    428//	IA64_MCA_CPU_MCA_STACK_OFFSET or IA64_MCA_CPU_INIT_STACK_OFFSET.
    429//
    430//	The OS to SAL section of struct ia64_sal_os_state is set to a default
    431//	value of cold boot (MCA) or warm boot (INIT) and return to the same
    432//	context.  ia64_sal_os_state is also used to hold some registers that
    433//	need to be saved and restored across the stack switches.
    434//
    435//	Most input registers to this stub come from PAL/SAL
    436//	r1  os gp, physical
    437//	r8  pal_proc entry point
    438//	r9  sal_proc entry point
    439//	r10 sal gp
    440//	r11 MCA - rendevzous state, INIT - reason code
    441//	r12 sal return address
    442//	r17 pal min_state
    443//	r18 processor state parameter
    444//	r19 monarch flag, set by the caller of this routine
    445//
    446//	In addition to the SAL to OS state, this routine saves all the
    447//	registers that appear in struct pt_regs and struct switch_stack,
    448//	excluding those that are already in the PAL minstate area.  This
    449//	results in a partial pt_regs and switch_stack, the C code copies the
    450//	remaining registers from PAL minstate to pt_regs and switch_stack.  The
    451//	resulting structures contain all the state of the original process when
    452//	MCA/INIT occurred.
    453//
    454//--
    455
    456ia64_state_save:
    457	add regs=MCA_SOS_OFFSET, r3
    458	add ms=MCA_SOS_OFFSET+8, r3
    459	mov b0=r2		// save return address
    460	cmp.eq p1,p2=IA64_MCA_CPU_MCA_STACK_OFFSET, r3
    461	;;
    462	GET_IA64_MCA_DATA(temp2)
    463	;;
    464	add temp1=temp2, regs	// struct ia64_sal_os_state on MCA or INIT stack
    465	add temp2=temp2, ms	// struct ia64_sal_os_state+8 on MCA or INIT stack
    466	;;
    467	mov regs=temp1		// save the start of sos
    468	st8 [temp1]=r1,16	// os_gp
    469	st8 [temp2]=r8,16	// pal_proc
    470	;;
    471	st8 [temp1]=r9,16	// sal_proc
    472	st8 [temp2]=r11,16	// rv_rc
    473	mov r11=cr.iipa
    474	;;
    475	st8 [temp1]=r18		// proc_state_param
    476	st8 [temp2]=r19		// monarch
    477	mov r6=IA64_KR(CURRENT)
    478	add temp1=SOS(SAL_RA), regs
    479	add temp2=SOS(SAL_GP), regs
    480	;;
    481	st8 [temp1]=r12,16	// sal_ra
    482	st8 [temp2]=r10,16	// sal_gp
    483	mov r12=cr.isr
    484	;;
    485	st8 [temp1]=r17,16	// pal_min_state
    486	st8 [temp2]=r6,16	// prev_IA64_KR_CURRENT
    487	mov r6=IA64_KR(CURRENT_STACK)
    488	;;
    489	st8 [temp1]=r6,16	// prev_IA64_KR_CURRENT_STACK
    490	st8 [temp2]=r0,16	// prev_task, starts off as NULL
    491	mov r6=cr.ifa
    492	;;
    493	st8 [temp1]=r12,16	// cr.isr
    494	st8 [temp2]=r6,16	// cr.ifa
    495	mov r12=cr.itir
    496	;;
    497	st8 [temp1]=r12,16	// cr.itir
    498	st8 [temp2]=r11,16	// cr.iipa
    499	mov r12=cr.iim
    500	;;
    501	st8 [temp1]=r12		// cr.iim
    502(p1)	mov r12=IA64_MCA_COLD_BOOT
    503(p2)	mov r12=IA64_INIT_WARM_BOOT
    504	mov r6=cr.iha
    505	add temp1=SOS(OS_STATUS), regs
    506	;;
    507	st8 [temp2]=r6		// cr.iha
    508	add temp2=SOS(CONTEXT), regs
    509	st8 [temp1]=r12		// os_status, default is cold boot
    510	mov r6=IA64_MCA_SAME_CONTEXT
    511	;;
    512	st8 [temp2]=r6		// context, default is same context
    513
    514	// Save the pt_regs data that is not in minstate.  The previous code
    515	// left regs at sos.
    516	add regs=MCA_PT_REGS_OFFSET-MCA_SOS_OFFSET, regs
    517	;;
    518	add temp1=PT(B6), regs
    519	mov temp3=b6
    520	mov temp4=b7
    521	add temp2=PT(B7), regs
    522	;;
    523	st8 [temp1]=temp3,PT(AR_CSD)-PT(B6)		// save b6
    524	st8 [temp2]=temp4,PT(AR_SSD)-PT(B7)		// save b7
    525	mov temp3=ar.csd
    526	mov temp4=ar.ssd
    527	cover						// must be last in group
    528	;;
    529	st8 [temp1]=temp3,PT(AR_UNAT)-PT(AR_CSD)	// save ar.csd
    530	st8 [temp2]=temp4,PT(AR_PFS)-PT(AR_SSD)		// save ar.ssd
    531	mov temp3=ar.unat
    532	mov temp4=ar.pfs
    533	;;
    534	st8 [temp1]=temp3,PT(AR_RNAT)-PT(AR_UNAT)	// save ar.unat
    535	st8 [temp2]=temp4,PT(AR_BSPSTORE)-PT(AR_PFS)	// save ar.pfs
    536	mov temp3=ar.rnat
    537	mov temp4=ar.bspstore
    538	;;
    539	st8 [temp1]=temp3,PT(LOADRS)-PT(AR_RNAT)	// save ar.rnat
    540	st8 [temp2]=temp4,PT(AR_FPSR)-PT(AR_BSPSTORE)	// save ar.bspstore
    541	mov temp3=ar.bsp
    542	;;
    543	sub temp3=temp3, temp4	// ar.bsp - ar.bspstore
    544	mov temp4=ar.fpsr
    545	;;
    546	shl temp3=temp3,16	// compute ar.rsc to be used for "loadrs"
    547	;;
    548	st8 [temp1]=temp3,PT(AR_CCV)-PT(LOADRS)		// save loadrs
    549	st8 [temp2]=temp4,PT(F6)-PT(AR_FPSR)		// save ar.fpsr
    550	mov temp3=ar.ccv
    551	;;
    552	st8 [temp1]=temp3,PT(F7)-PT(AR_CCV)		// save ar.ccv
    553	stf.spill [temp2]=f6,PT(F8)-PT(F6)
    554	;;
    555	stf.spill [temp1]=f7,PT(F9)-PT(F7)
    556	stf.spill [temp2]=f8,PT(F10)-PT(F8)
    557	;;
    558	stf.spill [temp1]=f9,PT(F11)-PT(F9)
    559	stf.spill [temp2]=f10
    560	;;
    561	stf.spill [temp1]=f11
    562
    563	// Save the switch_stack data that is not in minstate nor pt_regs.  The
    564	// previous code left regs at pt_regs.
    565	add regs=MCA_SWITCH_STACK_OFFSET-MCA_PT_REGS_OFFSET, regs
    566	;;
    567	add temp1=SW(F2), regs
    568	add temp2=SW(F3), regs
    569	;;
    570	stf.spill [temp1]=f2,32
    571	stf.spill [temp2]=f3,32
    572	;;
    573	stf.spill [temp1]=f4,32
    574	stf.spill [temp2]=f5,32
    575	;;
    576	stf.spill [temp1]=f12,32
    577	stf.spill [temp2]=f13,32
    578	;;
    579	stf.spill [temp1]=f14,32
    580	stf.spill [temp2]=f15,32
    581	;;
    582	stf.spill [temp1]=f16,32
    583	stf.spill [temp2]=f17,32
    584	;;
    585	stf.spill [temp1]=f18,32
    586	stf.spill [temp2]=f19,32
    587	;;
    588	stf.spill [temp1]=f20,32
    589	stf.spill [temp2]=f21,32
    590	;;
    591	stf.spill [temp1]=f22,32
    592	stf.spill [temp2]=f23,32
    593	;;
    594	stf.spill [temp1]=f24,32
    595	stf.spill [temp2]=f25,32
    596	;;
    597	stf.spill [temp1]=f26,32
    598	stf.spill [temp2]=f27,32
    599	;;
    600	stf.spill [temp1]=f28,32
    601	stf.spill [temp2]=f29,32
    602	;;
    603	stf.spill [temp1]=f30,SW(B2)-SW(F30)
    604	stf.spill [temp2]=f31,SW(B3)-SW(F31)
    605	mov temp3=b2
    606	mov temp4=b3
    607	;;
    608	st8 [temp1]=temp3,16	// save b2
    609	st8 [temp2]=temp4,16	// save b3
    610	mov temp3=b4
    611	mov temp4=b5
    612	;;
    613	st8 [temp1]=temp3,SW(AR_LC)-SW(B4)	// save b4
    614	st8 [temp2]=temp4	// save b5
    615	mov temp3=ar.lc
    616	;;
    617	st8 [temp1]=temp3	// save ar.lc
    618
    619	// FIXME: Some proms are incorrectly accessing the minstate area as
    620	// cached data.  The C code uses region 6, uncached virtual.  Ensure
    621	// that there is no cache data lying around for the first 1K of the
    622	// minstate area.
    623	// Remove this code in September 2006, that gives platforms a year to
    624	// fix their proms and get their customers updated.
    625
    626	add r1=32*1,r17
    627	add r2=32*2,r17
    628	add r3=32*3,r17
    629	add r4=32*4,r17
    630	add r5=32*5,r17
    631	add r6=32*6,r17
    632	add r7=32*7,r17
    633	;;
    634	fc r17
    635	fc r1
    636	fc r2
    637	fc r3
    638	fc r4
    639	fc r5
    640	fc r6
    641	fc r7
    642	add r17=32*8,r17
    643	add r1=32*8,r1
    644	add r2=32*8,r2
    645	add r3=32*8,r3
    646	add r4=32*8,r4
    647	add r5=32*8,r5
    648	add r6=32*8,r6
    649	add r7=32*8,r7
    650	;;
    651	fc r17
    652	fc r1
    653	fc r2
    654	fc r3
    655	fc r4
    656	fc r5
    657	fc r6
    658	fc r7
    659	add r17=32*8,r17
    660	add r1=32*8,r1
    661	add r2=32*8,r2
    662	add r3=32*8,r3
    663	add r4=32*8,r4
    664	add r5=32*8,r5
    665	add r6=32*8,r6
    666	add r7=32*8,r7
    667	;;
    668	fc r17
    669	fc r1
    670	fc r2
    671	fc r3
    672	fc r4
    673	fc r5
    674	fc r6
    675	fc r7
    676	add r17=32*8,r17
    677	add r1=32*8,r1
    678	add r2=32*8,r2
    679	add r3=32*8,r3
    680	add r4=32*8,r4
    681	add r5=32*8,r5
    682	add r6=32*8,r6
    683	add r7=32*8,r7
    684	;;
    685	fc r17
    686	fc r1
    687	fc r2
    688	fc r3
    689	fc r4
    690	fc r5
    691	fc r6
    692	fc r7
    693
    694	br.sptk b0
    695
    696//EndStub//////////////////////////////////////////////////////////////////////
    697
    698
    699//++
    700// Name:
    701//	ia64_state_restore()
    702//
    703// Stub Description:
    704//
    705//	Restore the SAL/OS state.  This is sensitive to the layout of struct
    706//	ia64_sal_os_state in mca.h.
    707//
    708//	r2 contains the return address, r3 contains either
    709//	IA64_MCA_CPU_MCA_STACK_OFFSET or IA64_MCA_CPU_INIT_STACK_OFFSET.
    710//
    711//	In addition to the SAL to OS state, this routine restores all the
    712//	registers that appear in struct pt_regs and struct switch_stack,
    713//	excluding those in the PAL minstate area.
    714//
    715//--
    716
    717ia64_state_restore:
    718	// Restore the switch_stack data that is not in minstate nor pt_regs.
    719	add regs=MCA_SWITCH_STACK_OFFSET, r3
    720	mov b0=r2		// save return address
    721	;;
    722	GET_IA64_MCA_DATA(temp2)
    723	;;
    724	add regs=temp2, regs
    725	;;
    726	add temp1=SW(F2), regs
    727	add temp2=SW(F3), regs
    728	;;
    729	ldf.fill f2=[temp1],32
    730	ldf.fill f3=[temp2],32
    731	;;
    732	ldf.fill f4=[temp1],32
    733	ldf.fill f5=[temp2],32
    734	;;
    735	ldf.fill f12=[temp1],32
    736	ldf.fill f13=[temp2],32
    737	;;
    738	ldf.fill f14=[temp1],32
    739	ldf.fill f15=[temp2],32
    740	;;
    741	ldf.fill f16=[temp1],32
    742	ldf.fill f17=[temp2],32
    743	;;
    744	ldf.fill f18=[temp1],32
    745	ldf.fill f19=[temp2],32
    746	;;
    747	ldf.fill f20=[temp1],32
    748	ldf.fill f21=[temp2],32
    749	;;
    750	ldf.fill f22=[temp1],32
    751	ldf.fill f23=[temp2],32
    752	;;
    753	ldf.fill f24=[temp1],32
    754	ldf.fill f25=[temp2],32
    755	;;
    756	ldf.fill f26=[temp1],32
    757	ldf.fill f27=[temp2],32
    758	;;
    759	ldf.fill f28=[temp1],32
    760	ldf.fill f29=[temp2],32
    761	;;
    762	ldf.fill f30=[temp1],SW(B2)-SW(F30)
    763	ldf.fill f31=[temp2],SW(B3)-SW(F31)
    764	;;
    765	ld8 temp3=[temp1],16	// restore b2
    766	ld8 temp4=[temp2],16	// restore b3
    767	;;
    768	mov b2=temp3
    769	mov b3=temp4
    770	ld8 temp3=[temp1],SW(AR_LC)-SW(B4)	// restore b4
    771	ld8 temp4=[temp2]	// restore b5
    772	;;
    773	mov b4=temp3
    774	mov b5=temp4
    775	ld8 temp3=[temp1]	// restore ar.lc
    776	;;
    777	mov ar.lc=temp3
    778
    779	// Restore the pt_regs data that is not in minstate.  The previous code
    780	// left regs at switch_stack.
    781	add regs=MCA_PT_REGS_OFFSET-MCA_SWITCH_STACK_OFFSET, regs
    782	;;
    783	add temp1=PT(B6), regs
    784	add temp2=PT(B7), regs
    785	;;
    786	ld8 temp3=[temp1],PT(AR_CSD)-PT(B6)		// restore b6
    787	ld8 temp4=[temp2],PT(AR_SSD)-PT(B7)		// restore b7
    788	;;
    789	mov b6=temp3
    790	mov b7=temp4
    791	ld8 temp3=[temp1],PT(AR_UNAT)-PT(AR_CSD)	// restore ar.csd
    792	ld8 temp4=[temp2],PT(AR_PFS)-PT(AR_SSD)		// restore ar.ssd
    793	;;
    794	mov ar.csd=temp3
    795	mov ar.ssd=temp4
    796	ld8 temp3=[temp1]				// restore ar.unat
    797	add temp1=PT(AR_CCV)-PT(AR_UNAT), temp1
    798	ld8 temp4=[temp2],PT(AR_FPSR)-PT(AR_PFS)	// restore ar.pfs
    799	;;
    800	mov ar.unat=temp3
    801	mov ar.pfs=temp4
    802	// ar.rnat, ar.bspstore, loadrs are restore in ia64_old_stack.
    803	ld8 temp3=[temp1],PT(F6)-PT(AR_CCV)		// restore ar.ccv
    804	ld8 temp4=[temp2],PT(F7)-PT(AR_FPSR)		// restore ar.fpsr
    805	;;
    806	mov ar.ccv=temp3
    807	mov ar.fpsr=temp4
    808	ldf.fill f6=[temp1],PT(F8)-PT(F6)
    809	ldf.fill f7=[temp2],PT(F9)-PT(F7)
    810	;;
    811	ldf.fill f8=[temp1],PT(F10)-PT(F8)
    812	ldf.fill f9=[temp2],PT(F11)-PT(F9)
    813	;;
    814	ldf.fill f10=[temp1]
    815	ldf.fill f11=[temp2]
    816
    817	// Restore the SAL to OS state. The previous code left regs at pt_regs.
    818	add regs=MCA_SOS_OFFSET-MCA_PT_REGS_OFFSET, regs
    819	;;
    820	add temp1=SOS(SAL_RA), regs
    821	add temp2=SOS(SAL_GP), regs
    822	;;
    823	ld8 r12=[temp1],16	// sal_ra
    824	ld8 r9=[temp2],16	// sal_gp
    825	;;
    826	ld8 r22=[temp1],16	// pal_min_state, virtual
    827	ld8 r13=[temp2],16	// prev_IA64_KR_CURRENT
    828	;;
    829	ld8 r16=[temp1],16	// prev_IA64_KR_CURRENT_STACK
    830	ld8 r20=[temp2],16	// prev_task
    831	;;
    832	ld8 temp3=[temp1],16	// cr.isr
    833	ld8 temp4=[temp2],16	// cr.ifa
    834	;;
    835	mov cr.isr=temp3
    836	mov cr.ifa=temp4
    837	ld8 temp3=[temp1],16	// cr.itir
    838	ld8 temp4=[temp2],16	// cr.iipa
    839	;;
    840	mov cr.itir=temp3
    841	mov cr.iipa=temp4
    842	ld8 temp3=[temp1]	// cr.iim
    843	ld8 temp4=[temp2]		// cr.iha
    844	add temp1=SOS(OS_STATUS), regs
    845	add temp2=SOS(CONTEXT), regs
    846	;;
    847	mov cr.iim=temp3
    848	mov cr.iha=temp4
    849	dep r22=0,r22,62,1	// pal_min_state, physical, uncached
    850	mov IA64_KR(CURRENT)=r13
    851	ld8 r8=[temp1]		// os_status
    852	ld8 r10=[temp2]		// context
    853
    854	/* Wire IA64_TR_CURRENT_STACK to the stack that we are resuming to.  To
    855	 * avoid any dependencies on the algorithm in ia64_switch_to(), just
    856	 * purge any existing CURRENT_STACK mapping and insert the new one.
    857	 *
    858	 * r16 contains prev_IA64_KR_CURRENT_STACK, r13 contains
    859	 * prev_IA64_KR_CURRENT, these values may have been changed by the C
    860	 * code.  Do not use r8, r9, r10, r22, they contain values ready for
    861	 * the return to SAL.
    862	 */
    863
    864	mov r15=IA64_KR(CURRENT_STACK)		// physical granule mapped by IA64_TR_CURRENT_STACK
    865	;;
    866	shl r15=r15,IA64_GRANULE_SHIFT
    867	;;
    868	dep r15=-1,r15,61,3			// virtual granule
    869	mov r18=IA64_GRANULE_SHIFT<<2		// for cr.itir.ps
    870	;;
    871	ptr.d r15,r18
    872	;;
    873	srlz.d
    874
    875	extr.u r19=r13,61,3			// r13 = prev_IA64_KR_CURRENT
    876	shl r20=r16,IA64_GRANULE_SHIFT		// r16 = prev_IA64_KR_CURRENT_STACK
    877	movl r21=PAGE_KERNEL			// page properties
    878	;;
    879	mov IA64_KR(CURRENT_STACK)=r16
    880	cmp.ne p6,p0=RGN_KERNEL,r19		// new stack is in the kernel region?
    881	or r21=r20,r21				// construct PA | page properties
    882(p6)	br.spnt 1f				// the dreaded cpu 0 idle task in region 5:(
    883	;;
    884	mov cr.itir=r18
    885	mov cr.ifa=r13
    886	mov r20=IA64_TR_CURRENT_STACK
    887	;;
    888	itr.d dtr[r20]=r21
    889	;;
    890	srlz.d
    8911:
    892
    893	br.sptk b0
    894
    895//EndStub//////////////////////////////////////////////////////////////////////
    896
    897
    898//++
    899// Name:
    900//	ia64_new_stack()
    901//
    902// Stub Description:
    903//
    904//	Switch to the MCA/INIT stack.
    905//
    906//	r2 contains the return address, r3 contains either
    907//	IA64_MCA_CPU_MCA_STACK_OFFSET or IA64_MCA_CPU_INIT_STACK_OFFSET.
    908//
    909//	On entry RBS is still on the original stack, this routine switches RBS
    910//	to use the MCA/INIT stack.
    911//
    912//	On entry, sos->pal_min_state is physical, on exit it is virtual.
    913//
    914//--
    915
    916ia64_new_stack:
    917	add regs=MCA_PT_REGS_OFFSET, r3
    918	add temp2=MCA_SOS_OFFSET+SOS(PAL_MIN_STATE), r3
    919	mov b0=r2			// save return address
    920	GET_IA64_MCA_DATA(temp1)
    921	invala
    922	;;
    923	add temp2=temp2, temp1		// struct ia64_sal_os_state.pal_min_state on MCA or INIT stack
    924	add regs=regs, temp1		// struct pt_regs on MCA or INIT stack
    925	;;
    926	// Address of minstate area provided by PAL is physical, uncacheable.
    927	// Convert to Linux virtual address in region 6 for C code.
    928	ld8 ms=[temp2]			// pal_min_state, physical
    929	;;
    930	dep temp1=-1,ms,62,2		// set region 6
    931	mov temp3=IA64_RBS_OFFSET-MCA_PT_REGS_OFFSET
    932	;;
    933	st8 [temp2]=temp1		// pal_min_state, virtual
    934
    935	add temp4=temp3, regs		// start of bspstore on new stack
    936	;;
    937	mov ar.bspstore=temp4		// switch RBS to MCA/INIT stack
    938	;;
    939	flushrs				// must be first in group
    940	br.sptk b0
    941
    942//EndStub//////////////////////////////////////////////////////////////////////
    943
    944
    945//++
    946// Name:
    947//	ia64_old_stack()
    948//
    949// Stub Description:
    950//
    951//	Switch to the old stack.
    952//
    953//	r2 contains the return address, r3 contains either
    954//	IA64_MCA_CPU_MCA_STACK_OFFSET or IA64_MCA_CPU_INIT_STACK_OFFSET.
    955//
    956//	On entry, pal_min_state is virtual, on exit it is physical.
    957//
    958//	On entry RBS is on the MCA/INIT stack, this routine switches RBS
    959//	back to the previous stack.
    960//
    961//	The psr is set to all zeroes.  SAL return requires either all zeroes or
    962//	just psr.mc set.  Leaving psr.mc off allows INIT to be issued if this
    963//	code does not perform correctly.
    964//
    965//	The dirty registers at the time of the event were flushed to the
    966//	MCA/INIT stack in ia64_pt_regs_save().  Restore the dirty registers
    967//	before reverting to the previous bspstore.
    968//--
    969
    970ia64_old_stack:
    971	add regs=MCA_PT_REGS_OFFSET, r3
    972	mov b0=r2			// save return address
    973	GET_IA64_MCA_DATA(temp2)
    974	LOAD_PHYSICAL(p0,temp1,1f)
    975	;;
    976	mov cr.ipsr=r0
    977	mov cr.ifs=r0
    978	mov cr.iip=temp1
    979	;;
    980	invala
    981	rfi
    9821:
    983
    984	add regs=regs, temp2		// struct pt_regs on MCA or INIT stack
    985	;;
    986	add temp1=PT(LOADRS), regs
    987	;;
    988	ld8 temp2=[temp1],PT(AR_BSPSTORE)-PT(LOADRS)	// restore loadrs
    989	;;
    990	ld8 temp3=[temp1],PT(AR_RNAT)-PT(AR_BSPSTORE)	// restore ar.bspstore
    991	mov ar.rsc=temp2
    992	;;
    993	loadrs
    994	ld8 temp4=[temp1]		// restore ar.rnat
    995	;;
    996	mov ar.bspstore=temp3		// back to old stack
    997	;;
    998	mov ar.rnat=temp4
    999	;;
   1000
   1001	br.sptk b0
   1002
   1003//EndStub//////////////////////////////////////////////////////////////////////
   1004
   1005
   1006//++
   1007// Name:
   1008//	ia64_set_kernel_registers()
   1009//
   1010// Stub Description:
   1011//
   1012//	Set the registers that are required by the C code in order to run on an
   1013//	MCA/INIT stack.
   1014//
   1015//	r2 contains the return address, r3 contains either
   1016//	IA64_MCA_CPU_MCA_STACK_OFFSET or IA64_MCA_CPU_INIT_STACK_OFFSET.
   1017//
   1018//--
   1019
   1020ia64_set_kernel_registers:
   1021	add temp3=MCA_SP_OFFSET, r3
   1022	mov b0=r2		// save return address
   1023	GET_IA64_MCA_DATA(temp1)
   1024	;;
   1025	add r12=temp1, temp3	// kernel stack pointer on MCA/INIT stack
   1026	add r13=temp1, r3	// set current to start of MCA/INIT stack
   1027	add r20=temp1, r3	// physical start of MCA/INIT stack
   1028	;;
   1029	DATA_PA_TO_VA(r12,temp2)
   1030	DATA_PA_TO_VA(r13,temp3)
   1031	;;
   1032	mov IA64_KR(CURRENT)=r13
   1033
   1034	/* Wire IA64_TR_CURRENT_STACK to the MCA/INIT handler stack.  To avoid
   1035	 * any dependencies on the algorithm in ia64_switch_to(), just purge
   1036	 * any existing CURRENT_STACK mapping and insert the new one.
   1037	 */
   1038
   1039	mov r16=IA64_KR(CURRENT_STACK)		// physical granule mapped by IA64_TR_CURRENT_STACK
   1040	;;
   1041	shl r16=r16,IA64_GRANULE_SHIFT
   1042	;;
   1043	dep r16=-1,r16,61,3			// virtual granule
   1044	mov r18=IA64_GRANULE_SHIFT<<2		// for cr.itir.ps
   1045	;;
   1046	ptr.d r16,r18
   1047	;;
   1048	srlz.d
   1049
   1050	shr.u r16=r20,IA64_GRANULE_SHIFT	// r20 = physical start of MCA/INIT stack
   1051	movl r21=PAGE_KERNEL			// page properties
   1052	;;
   1053	mov IA64_KR(CURRENT_STACK)=r16
   1054	or r21=r20,r21				// construct PA | page properties
   1055	;;
   1056	mov cr.itir=r18
   1057	mov cr.ifa=r13
   1058	mov r20=IA64_TR_CURRENT_STACK
   1059
   1060	movl r17=FPSR_DEFAULT
   1061	;;
   1062	mov.m ar.fpsr=r17			// set ar.fpsr to kernel default value
   1063	;;
   1064	itr.d dtr[r20]=r21
   1065	;;
   1066	srlz.d
   1067
   1068	br.sptk b0
   1069
   1070//EndStub//////////////////////////////////////////////////////////////////////
   1071
   1072#undef	ms
   1073#undef	regs
   1074#undef	temp1
   1075#undef	temp2
   1076#undef	temp3
   1077#undef	temp4
   1078
   1079
   1080// Support function for mca.c, it is here to avoid using inline asm.  Given the
   1081// address of an rnat slot, if that address is below the current ar.bspstore
   1082// then return the contents of that slot, otherwise return the contents of
   1083// ar.rnat.
   1084GLOBAL_ENTRY(ia64_get_rnat)
   1085	alloc r14=ar.pfs,1,0,0,0
   1086	mov ar.rsc=0
   1087	;;
   1088	mov r14=ar.bspstore
   1089	;;
   1090	cmp.lt p6,p7=in0,r14
   1091	;;
   1092(p6)	ld8 r8=[in0]
   1093(p7)	mov r8=ar.rnat
   1094	mov ar.rsc=3
   1095	br.ret.sptk.many rp
   1096END(ia64_get_rnat)
   1097
   1098
   1099// void ia64_set_psr_mc(void)
   1100//
   1101// Set psr.mc bit to mask MCA/INIT.
   1102GLOBAL_ENTRY(ia64_set_psr_mc)
   1103	rsm psr.i | psr.ic		// disable interrupts
   1104	;;
   1105	srlz.d
   1106	;;
   1107	mov r14 = psr			// get psr{36:35,31:0}
   1108	movl r15 = 1f
   1109	;;
   1110	dep r14 = -1, r14, PSR_MC, 1	// set psr.mc
   1111	;;
   1112	dep r14 = -1, r14, PSR_IC, 1	// set psr.ic
   1113	;;
   1114	dep r14 = -1, r14, PSR_BN, 1	// keep bank1 in use
   1115	;;
   1116	mov cr.ipsr = r14
   1117	mov cr.ifs = r0
   1118	mov cr.iip = r15
   1119	;;
   1120	rfi
   11211:
   1122	br.ret.sptk.many rp
   1123END(ia64_set_psr_mc)