_setjmp.S revision 85229
182936Sdfr// $FreeBSD: head/lib/libc/ia64/gen/_setjmp.S 85229 2001-10-20 15:19:08Z dfr $
282936Sdfr//
382936Sdfr// Copyright (c) 1999, 2000
482936Sdfr// Intel Corporation.
582936Sdfr// All rights reserved.
682936Sdfr//
782936Sdfr// Redistribution and use in source and binary forms, with or without
882936Sdfr// modification, are permitted provided that the following conditions
982936Sdfr// are met:
1082936Sdfr//
1182936Sdfr// 1. Redistributions of source code must retain the above copyright
1282936Sdfr//    notice, this list of conditions and the following disclaimer.
1382936Sdfr//
1482936Sdfr// 2. Redistributions in binary form must reproduce the above copyright
1582936Sdfr//   notice, this list of conditions and the following disclaimer in the
1682936Sdfr//    documentation and/or other materials provided with the distribution.
1782936Sdfr//
1882936Sdfr// 3. All advertising materials mentioning features or use of this software
1982936Sdfr//    must display the following acknowledgement:
2082936Sdfr//
2182936Sdfr//    This product includes software developed by Intel Corporation and
2282936Sdfr//    its contributors.
2382936Sdfr//
2482936Sdfr// 4. Neither the name of Intel Corporation or its contributors may be
2582936Sdfr//    used to endorse or promote products derived from this software
2682936Sdfr//    without specific prior written permission.
2782936Sdfr//
2882936Sdfr// THIS SOFTWARE IS PROVIDED BY INTEL CORPORATION AND CONTRIBUTORS ``AS IS''
2982936Sdfr// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
3082936Sdfr// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
3182936Sdfr// ARE DISCLAIMED.  IN NO EVENT SHALL INTEL CORPORATION OR CONTRIBUTORS BE
3282936Sdfr// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
3382936Sdfr// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
3482936Sdfr// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
3582936Sdfr// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
3682936Sdfr// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
3782936Sdfr// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
3882936Sdfr// THE POSSIBILITY OF SUCH DAMAGE.
3982936Sdfr//
4082936Sdfr//
4167117Sdfr
4282936Sdfr//
4382936Sdfr// Module Name:
4482936Sdfr//
4582936Sdfr//  setjmp.s
4682936Sdfr//
4782936Sdfr// Abstract:
4882936Sdfr//
4982936Sdfr//  Contains an implementation of setjmp and longjmp for the
5082936Sdfr//  IA-64 architecture.
5167117Sdfr
5282936Sdfr    .file   "setjmp.s"
5367117Sdfr
5482936Sdfr#define     LOCORE
5582936Sdfr#include    <machine/asm.h>
5682936Sdfr#include    <machine/setjmp.h>
5767117Sdfr
// int _setjmp(struct jmp_buffer *)
//
//  Set up a non-local goto.
//
// Description:
//
//  _setjmp stores the current preserved register state in the
//  jmp_buffer and returns zero.  The state written is: user ar.unat,
//  the NaT bits of the spilled general registers, ar.pfs, ar.bsp, pr,
//  ar.lc, r4-r7, sp, f2-f5, f16-f31, ar.fpsr and b0-b5.  A later
//  _longjmp on the same buffer restores that state and returns a
//  second time to the same location.
//
// On entry, r32 contains the pointer to the jmp_buffer.
//
// Registers written here: r2, r3, r10, r11, r14, r15, r16 (temporaries),
// r32 (adjusted buffer pointer) and r8 (return value).  ar.unat is
// modified by the spills and put back to its entry value before return.
//

ENTRY(_setjmp, 1)
    //
    //  Make sure buffer is aligned at 16byte boundary.
    //  The pointer is rounded down and then advanced by 16, so it always
    //  moves to the NEXT boundary, even when it was already aligned.
    //  ___longjmp applies the identical adjustment.
    //
    add     r10 = -0x10, r0 ;;      // r10 = mask that clears the lower 4 bits
    and     r32 = r32, r10 ;;
    add     r32 = 0x10, r32 ;;      // move to next 16 byte boundary

    add     r10 = J_PREDS, r32      // skip Unats & pfs save area
    add     r11 = J_BSP, r32
    //
    //  save immediate context
    //
    mov     r2 = ar.bsp             // save backing store pointer
    mov     r3 = pr                 // save predicates
    ;;
    //
    // flushrs must be the first instruction of its instruction group
    // (results are architecturally undefined otherwise), so the stop
    // above is written out explicitly instead of being left to the
    // assembler.
    //
    flushrs
    ;;
    //
    // save user Unat register
    //
    mov     r16 = ar.lc             // save loop count register
    mov     r14 = ar.unat           // save user Unat register

    st8     [r10] = r3, J_LC-J_PREDS
    st8     [r11] = r2, J_R4-J_BSP
    ;;
    st8     [r10] = r16, J_R5-J_LC
    st8     [r32] = r14, J_NATS     // Note: user Unat is stored at the
                                    // beginning of the save area; r32
                                    // then advances by J_NATS
    mov     r15 = ar.pfs
    ;;
    //
    //  save preserved general registers & NaT's
    //  (r11 and r10 alternate through the buffer slots; each spill is in
    //  its own instruction group)
    //
    st8.spill   [r11] = r4, J_R6-J_R4
    ;;
    st8.spill   [r10] = r5, J_R7-J_R5
    ;;
    st8.spill   [r11] = r6, J_SP-J_R6
    ;;
    st8.spill   [r10] = r7, J_F3-J_R7
    ;;
    st8.spill   [r11] = sp, J_F2-J_SP
    ;;
    //
    // save spilled Unat and pfs registers
    //
    mov     r2 = ar.unat            // Unat as left by the spills above
    ;;
    st8     [r32] = r2, J_PFS-J_NATS    // save unat for spilled regs
    ;;
    st8     [r32] = r15             // save pfs
    //
    //  save floating registers (r11: even slots, r10: odd slots)
    //
    stf.spill   [r11] = f2, J_F4-J_F2
    stf.spill   [r10] = f3, J_F5-J_F3
    ;;
    stf.spill   [r11] = f4, J_F16-J_F4
    stf.spill   [r10] = f5, J_F17-J_F5
    ;;
    stf.spill   [r11] = f16, J_F18-J_F16
    stf.spill   [r10] = f17, J_F19-J_F17
    ;;
    stf.spill   [r11] = f18, J_F20-J_F18
    stf.spill   [r10] = f19, J_F21-J_F19
    ;;
    stf.spill   [r11] = f20, J_F22-J_F20
    stf.spill   [r10] = f21, J_F23-J_F21
    ;;
    stf.spill   [r11] = f22, J_F24-J_F22
    stf.spill   [r10] = f23, J_F25-J_F23
    ;;
    stf.spill   [r11] = f24, J_F26-J_F24
    stf.spill   [r10] = f25, J_F27-J_F25
    ;;
    stf.spill   [r11] = f26, J_F28-J_F26
    stf.spill   [r10] = f27, J_F29-J_F27
    ;;
    stf.spill   [r11] = f28, J_F30-J_F28
    stf.spill   [r10] = f29, J_F31-J_F29
    ;;
    stf.spill   [r11] = f30, J_FPSR-J_F30   // r11 -> fpsr slot
    stf.spill   [r10] = f31, J_B0-J_F31     // r10 -> b0 slot
    //
    // save FPSR register & branch registers
    //
    mov     r2 = ar.fpsr            // save fpsr register
    mov     r3 = b0
    ;;
    st8     [r11] = r2, J_B1-J_FPSR
    st8     [r10] = r3, J_B2-J_B0
    mov     r2 = b1
    mov     r3 = b2
    ;;
    st8     [r11] = r2, J_B3-J_B1
    st8     [r10] = r3, J_B4-J_B2
    mov     r2 = b3
    mov     r3 = b4
    ;;
    st8     [r11] = r2, J_B5-J_B3
    st8     [r10] = r3
    mov     r2 = b5
    ;;
    st8     [r11] = r2
    ;;
    //
    // return
    //
    mov     r8 = r0                 // return 0 from setjmp
    mov     ar.unat = r14           // restore the user Unat read on entry
    br.ret.sptk b0

END(_setjmp)
18567117Sdfr
18667117Sdfr
//
// void _longjmp(struct jmp_buffer *, int val)
//
//  Perform a non-local goto.
//
// Description:
//
//  _longjmp reloads the register state that a previous _setjmp stored
//  in the jmp_buffer and returns through the b0 saved there.  This has
//  the effect of unwinding the stack and returning for a second time
//  from that _setjmp.  The value seen by the _setjmp caller is val,
//  except that a val of 0 is replaced by 1 so that the second return
//  can always be told apart from the first.
//
// On entry, r32 contains the pointer to the jmp_buffer and r33 holds val.
//
// Temporaries used: r2, r3, r10, r11, r14-r19, r21, p6-p9.
//

	WEAK_ALIAS(_longjmp,___longjmp)
ENTRY(___longjmp, 2)
    //
    //  Make sure buffer is aligned at 16byte boundary
    //  (same adjustment as _setjmp: always moves to the next boundary)
    //
    add     r10 = -0x10, r0 ;;      // r10 = mask that clears the lower 4 bits
    and     r32 = r32, r10 ;;
    add     r32 = 0x10, r32 ;;      // move to next 16 byte boundary

    //
    // Set up the return value now, before the register stack is
    // switched.  val is an int, so only its low 32 bits are tested;
    // when they are zero r8 is forced to 1 in the next instruction
    // group.  p6/p7 are reused further down and every predicate is
    // reloaded from the buffer before returning.
    //
    mov     r8 = r33                // return value
    cmp4.eq p6, p7 = r0, r33        // p6 = (val == 0)

    //
    //  get immediate context
    //
    mov     r14 = ar.rsc            // get user RSC conf
    add     r10 = J_PFS, r32        // get address of pfs
    add     r11 = J_NATS, r32
    ;;
(p6)    mov     r8 = 1              // longjmp(buf, 0) must yield 1
    ld8     r15 = [r10], J_BSP-J_PFS    // get pfs
    ld8     r2 = [r11], J_LC-J_NATS     // get unat for spilled regs
    ;;
    mov     ar.unat = r2            // needed by the ld8.fill's below
    ;;
    ld8     r16 = [r10], J_PREDS-J_BSP  // get backing store pointer
    mov     ar.rsc = r0             // put RSE in enforced lazy
    mov     ar.pfs = r15
    ;;

    //
    // When returning from longjmp, BSPSTORE and BSP need to be the same
    // and all registers allocated after the setjmp must be discarded.
    // The RNAT value that belongs to the restored BSPSTORE must be
    // re-established as well: it is taken from the backing store when
    // its collection slot lies below the current BSPSTORE, otherwise
    // the current ar.rnat is used.
    //
    mov     r17 = ar.bspstore       // get current BSPSTORE
    ;;
    cmp.ltu p6,p7 = r17, r16        // is it below the BSP saved by setjmp?
(p6)    br.spnt.few .flush_rse
    mov     r19 = ar.rnat           // get current RNAT
    ;;
    loadrs                          // invalidate dirty regs
    br.sptk.many    .restore_rnat   // restore RNAT

.flush_rse:
    flushrs
    ;;
    mov     r19 = ar.rnat           // get current RNAT
    mov     r17 = r16               // treat saved BSP as current BSPSTORE
    // NOTE(review): with r17 == r16 the comparison below can never
    // select the in-memory RNAT collection on this path - confirm this
    // is intended when the flush moved BSPSTORE past that collection.
    ;;
.restore_rnat:
    //
    // check if RNAT is saved between saved BSP and curr BSPSTORE
    //
    mov     r18 = 0x3f
    ;;
    dep     r18 = r18,r16,3,6       // get RNAT address (bits 3..8 set)
    ;;
    cmp.ltu p8,p9 = r18, r17        // RNAT saved on RSE
    ;;
(p8)    ld8     r19 = [r18]         // get RNAT from RSE
    ;;
    mov     ar.bspstore = r16       // set new BSPSTORE
    ;;
    mov     ar.rnat = r19           // restore RNAT
    mov     ar.rsc = r14            // restore RSC conf


    ld8     r3 = [r11], J_R4-J_LC       // get lc register
    ld8     r2 = [r10], J_R5-J_PREDS    // get predicates
    ;;
    mov     pr = r2, -1             // reload all predicates
    mov     ar.lc = r3
    //
    //  restore preserved general registers & NaT's
    //
    ld8.fill    r4 = [r11], J_R6-J_R4
    ;;
    ld8.fill    r5 = [r10], J_R7-J_R5
    ld8.fill    r6 = [r11], J_SP-J_R6
    ;;
    ld8.fill    r7 = [r10], J_F2-J_R7
    ld8.fill    sp = [r11], J_F3-J_SP
    ;;
    //
    //  restore floating registers (r10: even slots, r11: odd slots)
    //
    ldf.fill    f2 = [r10], J_F4-J_F2
    ldf.fill    f3 = [r11], J_F5-J_F3
    ;;
    ldf.fill    f4 = [r10], J_F16-J_F4
    ldf.fill    f5 = [r11], J_F17-J_F5
    ;;
    ldf.fill    f16 = [r10], J_F18-J_F16
    ldf.fill    f17 = [r11], J_F19-J_F17
    ;;
    ldf.fill    f18 = [r10], J_F20-J_F18
    ldf.fill    f19 = [r11], J_F21-J_F19
    ;;
    ldf.fill    f20 = [r10], J_F22-J_F20
    ldf.fill    f21 = [r11], J_F23-J_F21
    ;;
    ldf.fill    f22 = [r10], J_F24-J_F22
    ldf.fill    f23 = [r11], J_F25-J_F23
    ;;
    ldf.fill    f24 = [r10], J_F26-J_F24
    ldf.fill    f25 = [r11], J_F27-J_F25
    ;;
    ldf.fill    f26 = [r10], J_F28-J_F26
    ldf.fill    f27 = [r11], J_F29-J_F27
    ;;
    ldf.fill    f28 = [r10], J_F30-J_F28
    ldf.fill    f29 = [r11], J_F31-J_F29
    ;;
    ldf.fill    f30 = [r10], J_FPSR-J_F30   // r10 -> fpsr slot
    ldf.fill    f31 = [r11], J_B0-J_F31 ;;  // r11 -> b0 slot

    //
    // restore branch registers and fpsr
    //
    ld8     r16 = [r10], J_B1-J_FPSR    // get fpsr
    ld8     r17 = [r11], J_B2-J_B0      // get return pointer
    ;;
    mov     ar.fpsr = r16
    mov     b0 = r17
    ld8     r2 = [r10], J_B3-J_B1
    ld8     r3 = [r11], J_B4-J_B2
    ;;
    mov     b1 = r2
    mov     b2 = r3
    ld8     r2 = [r10], J_B5-J_B3
    ld8     r3 = [r11]
    ;;
    mov     b3 = r2
    mov     b4 = r3
    ld8     r2 = [r10]
    ld8     r21 = [r32]             // get user unat (start of save area)
    ;;
    mov     b5 = r2
    mov     ar.unat = r21

    //
    // invalidate ALAT
    //
    invala ;;

    br.ret.sptk b0                  // return to the _setjmp call site

END(___longjmp)
351