/* Copyright (C) 1999-2015 Free Software Foundation, Inc. Contributed by David Mosberger-Tang <davidm@hpl.hp.com>. The GNU C Library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. The GNU C Library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with the GNU C Library; if not, see <http://www.gnu.org/licenses/>. */ #include <sysdep.h> #include <features.h> LEAF(__ia64_flush_rbs) flushrs mov r9 = ar.rsc // 12 cyc latency ;; mov r8 = ar.bsp // 12 cyc latency ;; and r16 = ~0x3, r9 // clear ar.rsc.mode ;; mov ar.rsc = r16 // put RSE into enforced-lazy mode ;; mov r10 = ar.rnat // 5 cyc latency ret END(__ia64_flush_rbs) # define pPos p6 /* is rotate count positive? */ # define pNeg p7 /* is rotate count negative? */ /* __ia64_longjmp(__jmp_buf buf, int val, long rnat, long rsc) */ LEAF(__ia64_longjmp) alloc r8=ar.pfs,4,0,0,0 add r2=0x98,in0 // r2 <- &jmpbuf.orig_jmp_buf_addr add r3=0x88,in0 // r3 <- &jmpbuf.ar_bsp ;; ld8 r8=[r2] // r8 <- orig_jmp_buf_addr ld8 r23=[r3],8 // r23 <- jmpbuf.ar_bsp mov r2=in0 ;; // // Note: we need to redo the "flushrs" here even though it's // already been done by __ia64_flush_rbs. It is needed to // ensure that ar.bspstore == ar.bsp. // flushrs // flush dirty regs to backing store ld8 r25=[r3] // r25 <- jmpbuf.ar_unat sub r8=r8,in0 // r8 <- &orig_jmpbuf - &jmpbuf ;; add r3=8,in0 // r3 <- &jmpbuf.r1 extr.u r8=r8,3,6 // r8 <- (&orig_jmpbuf - &jmpbuf)/8 & 0x3f ;; cmp.lt pNeg,pPos=r8,r0 ;; (pPos) mov r16=r8 (pNeg) add r16=64,r8 (pPos) sub r17=64,r8 (pNeg) sub r17=r0,r8 ;; shr.u r8=r25,r16 shl r9=r25,r17 ;; or r25=r8,r9 ;; mov ar.unat=r25 // setup ar.unat (NaT bits for r1, r4-r7, and r12) ;; ld8.fill.nta sp=[r2],16 // r12 (sp) ld8.fill.nta gp=[r3],32 // r1 (gp) dep r11=-1,r23,3,6 // r11 <- ia64_rse_rnat_addr(jmpbuf.ar_bsp) ;; ld8.nta r16=[r2],16 // caller's unat // ld8.nta r17=[r3],16 // fpsr ;; ld8.fill.nta r4=[r2],16 // r4 ld8.fill.nta r5=[r3],16 // r5 (gp) ;; ld8.fill.nta r6=[r2],16 // r6 ld8.fill.nta r7=[r3],16 // r7 ;; mov ar.unat=r16 // restore caller's unat // mov ar.fpsr=r17 // restore fpsr ;; ld8.nta r16=[r2],16 // b0 ld8.nta r17=[r3],16 // b1 ;; mov ar.bspstore=r23 // restore ar.bspstore ld8.nta r18=[r2],16 // b2 ;; mov ar.rnat=in2 // restore ar.rnat ld8.nta r19=[r3],16 // b3 ;; ld8.nta r20=[r2],16 // b4 ld8.nta r21=[r3],16 // b5 #ifdef PTR_DEMANGLE PTR_DEMANGLE (r16, r24) #endif ;; ld8.nta r11=[r2],16 // ar.pfs ld8.nta r22=[r3],56 // ar.lc ;; ld8.nta r24=[r2],32 // pr mov ar.rsc=in3 // restore ar.rsc mov b0=r16 ;; ldf.fill.nta f2=[r2],32 ldf.fill.nta f3=[r3],32 mov b1=r17 ;; ldf.fill.nta f4=[r2],32 ldf.fill.nta f5=[r3],32 mov b2=r18 ;; ldf.fill.nta f16=[r2],32 ldf.fill.nta f17=[r3],32 mov b3=r19 ;; ldf.fill.nta f18=[r2],32 ldf.fill.nta f19=[r3],32 mov b4=r20 ;; ldf.fill.nta f20=[r2],32 ldf.fill.nta f21=[r3],32 mov b5=r21 ;; ldf.fill.nta f22=[r2],32 ldf.fill.nta f23=[r3],32 mov ar.lc=r22 ;; ldf.fill.nta f24=[r2],32 ldf.fill.nta f25=[r3],32 cmp.eq p8,p9=0,in1 ;; ldf.fill.nta f26=[r2],32 ldf.fill.nta f27=[r3],32 mov ar.pfs=r11 ;; ldf.fill.nta f28=[r2],32 ldf.fill.nta f29=[r3],32 (p8) mov r8=1 ;; ldf.fill.nta f30=[r2] ldf.fill.nta f31=[r3] (p9) mov r8=in1 invala // virt. -> phys. regnum mapping may change mov pr=r24,-1 ret END(__ia64_longjmp)