Merge branch 'x86-fpu-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git...
[linux-2.6] / arch / ia64 / kernel / minstate.h
1
2 #include <asm/cache.h>
3
4 #include "entry.h"
5 #include "paravirt_inst.h"
6
7 #ifdef CONFIG_VIRT_CPU_ACCOUNTING
/*
 * Accounting hooks expanded near the end of IA64_NATIVE_DO_SAVE_MIN.
 * Both instructions are predicated on pUStk.  When
 * CONFIG_VIRT_CPU_ACCOUNTING is not defined both macros expand to nothing.
 *
 *      ACCOUNT_GET_STAMP:  reads ar.itc into r20
 *      ACCOUNT_SYS_ENTER:  br.call to account_sys_enter, followed by a stop
 *
 * NOTE(review): account_sys_enter is not visible here; presumably it
 * consumes the r20 value read by ACCOUNT_GET_STAMP -- confirm.
 */
8 /* read ar.itc in advance, and use it before leaving bank 0 */
9 #define ACCOUNT_GET_STAMP                               \
10 (pUStk) mov.m r20=ar.itc;       /* r20 = ar.itc (only when pUStk is set) */
11 #define ACCOUNT_SYS_ENTER                               \
12 (pUStk) br.call.spnt rp=account_sys_enter       /* return link goes into rp */ \
13         ;;
14 #else
/* accounting disabled: the hooks emit no instructions */
15 #define ACCOUNT_GET_STAMP
16 #define ACCOUNT_SYS_ENTER
17 #endif
18
/*
 * Declare the ".data.patch.rse" section (flag "a" = allocatable) and switch
 * straight back to the section that was active before.  Nothing is emitted
 * here; RSE_WORKAROUND adds entries to this section with .xdata4.
 */
19 .section ".data.patch.rse", "a"
20 .previous
21
22 /*
23  * DO_SAVE_MIN switches to the kernel stacks (if necessary) and saves
24  * the minimum state necessary that allows us to turn psr.ic back
25  * on.
26  *
 * Macro arguments (each is pasted verbatim into the instruction stream):
 *      __COVER:    emitted at the end of the first instruction group
 *                  (COVER or nothing in the wrappers defined in this file)
 *      SAVE_IFS:   must leave in r30 the value that is stored as cr.ifs
 *      EXTRA:      optional instruction(s) emitted just before r1 is loaded
 *                  with __gp
 *      WORKAROUND: optional code emitted after b0 has been copied to r29 and
 *                  before the pt_regs stores (RSE_WORKAROUND or nothing in
 *                  the wrappers defined in this file)
 *
27  * Assumed state upon entry:
28  *      psr.ic: off
29  *      r31:    contains saved predicates (pr)
30  *
31  * Upon exit, the state is as follows:
32  *      psr.ic: off
33  *       r2 = points to &pt_regs.r16
34  *       r8 = contents of ar.ccv
35  *       r9 = contents of ar.csd
36  *      r10 = contents of ar.ssd
37  *      r11 = FPSR_DEFAULT
38  *      r12 = kernel sp (kernel virtual address)
39  *      r13 = points to current task_struct (kernel virtual address)
40  *      p15 = TRUE if psr.i is set in cr.ipsr
41  *      predicate registers (other than p2, p3, and p15), b6, r3, r14, r15:
42  *              preserved
43  *
 * NOTE(review): the body also writes pSys/pNonSys, and RSE_WORKAROUND (when
 * passed as WORKAROUND) writes p1, p6 and p7; check this against the
 * "preserved" list above.
 *
 * Throughout the body r1 is used as the base address of the pt_regs area
 * being filled in, and r16/r17 as two interleaved store pointers into it.
 *
44  * Note that psr.ic is NOT turned on by this macro.  This is so that
45  * we can pass interruption state as arguments to a handler.
46  */
47 #define IA64_NATIVE_DO_SAVE_MIN(__COVER,SAVE_IFS,EXTRA,WORKAROUND)                              \
48         mov r16=IA64_KR(CURRENT);       /* M: r16 = current task pointer */                     \
49         mov r27=ar.rsc;                 /* M: r27 = ar.rsc, stored to pt_regs below */          \
50         mov r20=r1;                     /* A: r20 = original r1, spilled to pt_regs below */    \
51         mov r25=ar.unat;                /* M: r25 = ar.unat, stored to pt_regs below */         \
52         MOV_FROM_IPSR(p0,r29);          /* M: r29 = cr.ipsr */                                  \
53         mov r26=ar.pfs;                 /* I: r26 = ar.pfs, stored to pt_regs below */          \
54         MOV_FROM_IIP(r28);                      /* M: r28 = cr.iip */                           \
55         mov r21=ar.fpsr;                /* M: r21 = ar.fpsr, spilled to pt_regs below */        \
56         __COVER;                                /* B;; (or nothing) */                          \
57         ;;                                                                                      \
58         adds r16=IA64_TASK_THREAD_ON_USTACK_OFFSET,r16; /* r16 = &current->thread.on_ustack */  \
59         ;;                                                                                      \
60         ld1 r17=[r16];                          /* load current->thread.on_ustack flag */       \
61         st1 [r16]=r0;                           /* clear current->thread.on_ustack flag */      \
62         adds r1=-IA64_TASK_THREAD_ON_USTACK_OFFSET,r16  /* r1 = current (offset removed again) */ \
63         /* switch from user to kernel RBS: */                                                   \
64         ;;                                                                                      \
65         invala;                         /* M */                                                 \
66         SAVE_IFS;                       /* caller-supplied: sets r30, stored as cr.ifs below */ \
67         cmp.eq pKStk,pUStk=r0,r17;      /* are we in kernel mode already? (on_ustack == 0 -> pKStk) */ \
68         ;;                                                                                      \
69 (pUStk) mov ar.rsc=0;           /* set enforced lazy mode, pl 0, little-endian, loadrs=0 */     \
70         ;;                                                                                      \
71 (pUStk) mov.m r24=ar.rnat;                              /* r24 = ar.rnat, stored to pt_regs below */ \
72 (pUStk) addl r22=IA64_RBS_OFFSET,r1;                    /* compute base of RBS */               \
73 (pKStk) mov r1=sp;                                      /* get sp  */                           \
74         ;;                                                                                      \
75 (pUStk) lfetch.fault.excl.nt1 [r22];                    /* prefetch the base of the RBS */      \
76 (pUStk) addl r1=IA64_STK_OFFSET-IA64_PT_REGS_SIZE,r1;   /* compute base of memory stack */      \
77 (pUStk) mov r23=ar.bspstore;                            /* save ar.bspstore */                  \
78         ;;                                                                                      \
79 (pUStk) mov ar.bspstore=r22;                            /* switch to kernel RBS */              \
80 (pKStk) addl r1=-IA64_PT_REGS_SIZE,r1;                  /* if in kernel mode, use sp (r12) */   \
81         ;;                                                                                      \
82 (pUStk) mov r18=ar.bsp;                                 /* r18 = ar.bsp after the switch */     \
83 (pUStk) mov ar.rsc=0x3;         /* set eager mode, pl 0, little-endian, loadrs=0 */             \
84         adds r17=2*L1_CACHE_BYTES,r1;           /* really: biggest cache-line size */           \
85         adds r16=PT(CR_IPSR),r1;                /* r16 = address of the cr.ipsr slot */         \
86         ;;                                                                                      \
87         lfetch.fault.excl.nt1 [r17],L1_CACHE_BYTES;     /* prefetch ahead in the pt_regs area */ \
88         st8 [r16]=r29;          /* save cr.ipsr */                                              \
89         ;;                                                                                      \
90         lfetch.fault.excl.nt1 [r17];                    /* prefetch the following line */       \
91         tbit.nz p15,p0=r29,IA64_PSR_I_BIT;      /* p15 = psr.i bit of the saved cr.ipsr */      \
92         mov r29=b0                              /* r29 = b0, stored to pt_regs below */         \
93         ;;                                                                                      \
94         WORKAROUND;                             /* caller-supplied; may be empty */             \
95         adds r16=PT(R8),r1;     /* initialize first base pointer */                             \
96         adds r17=PT(R9),r1;     /* initialize second base pointer */                            \
97 (pKStk) mov r18=r0;             /* make sure r18 isn't NaT */                                   \
98         ;;                                                                                      \
99 .mem.offset 0,0; st8.spill [r16]=r8,16;         /* save r8 */                                   \
100 .mem.offset 8,0; st8.spill [r17]=r9,16;         /* save r9 */                                   \
101         ;;                                                                                      \
102 .mem.offset 0,0; st8.spill [r16]=r10,24;        /* save r10; +24 steps over one extra 8-byte slot */ \
103 .mem.offset 8,0; st8.spill [r17]=r11,24;        /* save r11; same +24 step */                   \
104         ;;                                                                                      \
105         st8 [r16]=r28,16;       /* save cr.iip */                                               \
106         st8 [r17]=r30,16;       /* save cr.ifs */                                               \
107 (pUStk) sub r18=r18,r22;        /* r18=RSE.ndirty*8 */                                          \
108         mov r8=ar.ccv;          /* exit state: r8 = ar.ccv (old r8 spilled above) */            \
109         mov r9=ar.csd;          /* exit state: r9 = ar.csd */                                   \
110         mov r10=ar.ssd;         /* exit state: r10 = ar.ssd */                                  \
111         movl r11=FPSR_DEFAULT;   /* L-unit */                                                   \
112         ;;                                                                                      \
113         st8 [r16]=r25,16;       /* save ar.unat */                                              \
114         st8 [r17]=r26,16;       /* save ar.pfs */                                               \
115         shl r18=r18,16;         /* compute ar.rsc to be used for "loadrs" */                    \
116         ;;                                                                                      \
117         st8 [r16]=r27,16;       /* save ar.rsc */                                               \
118 (pUStk) st8 [r17]=r24,16;       /* save ar.rnat */                                              \
119 (pKStk) adds r17=16,r17;        /* skip over ar_rnat field */                                   \
120         ;;                      /* avoid RAW on r16 & r17 */                                    \
121 (pUStk) st8 [r16]=r23,16;       /* save ar.bspstore */                                          \
122         st8 [r17]=r31,16;       /* save predicates */                                           \
123 (pKStk) adds r16=16,r16;        /* skip over ar_bspstore field */                               \
124         ;;                                                                                      \
125         st8 [r16]=r29,16;       /* save b0 */                                                   \
126         st8 [r17]=r18,16;       /* save ar.rsc value for "loadrs" */                            \
127         cmp.eq pNonSys,pSys=r0,r0       /* initialize pSys=0, pNonSys=1 */                      \
128         ;;                                                                                      \
129 .mem.offset 0,0; st8.spill [r16]=r20,16;        /* save original r1 */                          \
130 .mem.offset 8,0; st8.spill [r17]=r12,16;        /* save original r12 (sp) */                    \
131         adds r12=-16,r1;        /* switch to kernel memory stack (with 16 bytes of scratch) */  \
132         ;;                                                                                      \
133 .mem.offset 0,0; st8.spill [r16]=r13,16;        /* save original r13 */                         \
134 .mem.offset 8,0; st8.spill [r17]=r21,16;        /* save ar.fpsr */                              \
135         mov r13=IA64_KR(CURRENT);       /* establish `current' */                               \
136         ;;                                                                                      \
137 .mem.offset 0,0; st8.spill [r16]=r15,16;        /* save r15 */                                  \
138 .mem.offset 8,0; st8.spill [r17]=r14,16;        /* save r14 */                                  \
139         ;;                                                                                      \
140 .mem.offset 0,0; st8.spill [r16]=r2,16;         /* save r2 (overwritten just below) */          \
141 .mem.offset 8,0; st8.spill [r17]=r3,16;         /* save r3 */                                   \
142         ACCOUNT_GET_STAMP       /* may overwrite r20; the original r1 it held is already saved */ \
143         adds r2=IA64_PT_REGS_R16_OFFSET,r1;     /* exit state: r2 = &pt_regs.r16 */             \
144         ;;                                                                                      \
145         EXTRA;                  /* caller-supplied; may be empty */                             \
146         movl r1=__gp;           /* establish kernel global pointer */                           \
147         ;;                                                                                      \
148         ACCOUNT_SYS_ENTER       /* may be empty; otherwise a pUStk-predicated br.call */        \
149         bsw.1;                  /* switch back to bank 1 (must be last in insn group) */        \
150         ;;
151
152 /*
153  * SAVE_REST saves the remainder of pt_regs (with psr.ic on).
154  *
155  * Assumed state upon entry:
156  *      psr.ic: on
157  *      r2:     points to &pt_regs.r16
158  *      r3:     points to &pt_regs.r17
159  *      r8:     contents of ar.ccv
160  *      r9:     contents of ar.csd
161  *      r10:    contents of ar.ssd
162  *      r11:    FPSR_DEFAULT
163  *
 * What is stored, in order: r16-r31 (spilled in pairs, r2 walking the
 * even-numbered and r3 the odd-numbered registers), ar.ccv (from r8),
 * f6-f11, b6, b7, ar.csd (from r9) and ar.ssd (from r10).  ar.fpsr is
 * loaded from r11.
 *
 * Modified: r2, r3, r18, r19, r24, r25 and ar.fpsr.  r18, r19, r24 and r25
 * are only reused after their incoming values have been spilled.
 *
164  * Registers r14 and r15 are guaranteed not to be touched by SAVE_REST.
165  */
166 #define SAVE_REST                               \
167 .mem.offset 0,0; st8.spill [r2]=r16,16;         \
168 .mem.offset 8,0; st8.spill [r3]=r17,16;         \
169         ;;                                      \
170 .mem.offset 0,0; st8.spill [r2]=r18,16;         \
171 .mem.offset 8,0; st8.spill [r3]=r19,16;         \
172         ;;                                      \
173 .mem.offset 0,0; st8.spill [r2]=r20,16;         \
174 .mem.offset 8,0; st8.spill [r3]=r21,16;         \
175         mov r18=b6;             /* r18 = b6 (old r18 already spilled) */ \
176         ;;                                      \
177 .mem.offset 0,0; st8.spill [r2]=r22,16;         \
178 .mem.offset 8,0; st8.spill [r3]=r23,16;         \
179         mov r19=b7;             /* r19 = b7 (old r19 already spilled) */ \
180         ;;                                      \
181 .mem.offset 0,0; st8.spill [r2]=r24,16;         \
182 .mem.offset 8,0; st8.spill [r3]=r25,16;         \
183         ;;                                      \
184 .mem.offset 0,0; st8.spill [r2]=r26,16;         \
185 .mem.offset 8,0; st8.spill [r3]=r27,16;         \
186         ;;                                      \
187 .mem.offset 0,0; st8.spill [r2]=r28,16;         \
188 .mem.offset 8,0; st8.spill [r3]=r29,16;         \
189         ;;                                      \
190 .mem.offset 0,0; st8.spill [r2]=r30,16;         \
191 .mem.offset 8,0; st8.spill [r3]=r31,32;         /* +32: r3 moves on to the f7 slot */ \
192         ;;                                      \
193         mov ar.fpsr=r11;        /* M-unit: ar.fpsr = FPSR_DEFAULT */ \
194         st8 [r2]=r8,8;          /* ar.ccv; +8: r2 moves on to the f6 slot */ \
195         adds r24=PT(B6)-PT(F7),r3;      /* r24 = &pt_regs.b6 (r3 is at f7 here) */ \
196         ;;                                      \
197         stf.spill [r2]=f6,32;                   \
198         stf.spill [r3]=f7,32;                   \
199         ;;                                      \
200         stf.spill [r2]=f8,32;                   \
201         stf.spill [r3]=f9,32;                   \
202         ;;                                      \
203         stf.spill [r2]=f10;                     \
204         stf.spill [r3]=f11;                     \
205         adds r25=PT(B7)-PT(F11),r3;     /* r25 = &pt_regs.b7 (r3 is at f11 here) */ \
206         ;;                                      \
207         st8 [r24]=r18,16;       /* b6 */        \
208         st8 [r25]=r19,16;       /* b7 */        \
209         ;;                                      \
210         st8 [r24]=r9;           /* ar.csd */    \
211         st8 [r25]=r10;          /* ar.ssd */    \
212         ;;
213
/*
 * RSE_WORKAROUND is passed as the WORKAROUND argument of DO_SAVE_MIN (see
 * SAVE_MIN_WITH_COVER) and relies on the register assignments that
 * IA64_NATIVE_DO_SAVE_MIN has made by the point where WORKAROUND expands:
 *      r18 = ar.bsp read after switching to the kernel RBS (pUStk only)
 *      r22 = base of the kernel RBS (pUStk only)
 *      r26 = saved ar.pfs
 *      r27 = saved ar.rsc
 *      b0  = already copied to r29, so b0 may be reused here
 *
 * Control flow:
 *   - pKStk set: branch straight to the final label, nothing else runs.
 *   - otherwise r16 = r18 - r22 is compared (unsigned) against 0x310 when
 *     bits 3..8 of r18 are <= 33, or against 0x308 when they are larger.
 *     If r16 does not exceed that limit, branch to the final label.
 *   - else: write r26 with bits 62..63 cleared to ar.pfs, clear bits 16..29
 *     of r27, "return" through b0 to local label 2, then set ar.rsc to 0,
 *     execute flushrs, reload ar.bspstore from r22 and re-read ar.bsp
 *     into r18.
 *
 * Modified: r16, r17, p1, p6, p7; on the last path also b0, ar.pfs, ar.rsc,
 * ar.bspstore, r18 and r27.
 *
 * NOTE(review): the hardware problem being worked around and the origin of
 * the constants 33 / 0x310 / 0x308 are not visible in this file -- confirm
 * against the commit that introduced the macro.
 */
214 #define RSE_WORKAROUND                          \
215 (pUStk) extr.u r17=r18,3,6;             /* r17 = bits 3..8 of r18 */ \
216 (pUStk) sub r16=r18,r22;                /* r16 = r18 - r22 */ \
217 [1:](pKStk)     br.cond.sptk.many 1f;   /* tagged "1" so the entry below can refer to it */ \
218         .xdata4 ".data.patch.rse",1b-.  /* record offset of that branch; presumably for run-time patching -- confirm */ \
219         ;;                                      \
220         cmp.ge p6,p7 = 33,r17;          /* p6 = (33 >= r17), p7 = the opposite */ \
221         ;;                                      \
222 (p6)    mov r17=0x310;                  /* limit used when r17 <= 33 */ \
223 (p7)    mov r17=0x308;                  /* limit used when r17 > 33 */ \
224         ;;                                      \
225         cmp.leu p1,p0=r16,r17;          /* p1 = (r16 <= limit), unsigned */ \
226 (p1)    br.cond.sptk.many 1f;           /* within the limit: nothing more to do */ \
227         dep.z r17=r26,0,62;             /* r17 = saved ar.pfs with bits 62..63 cleared */ \
228         movl r16=2f;                    /* r16 = address of local label 2 */ \
229         ;;                                      \
230         mov ar.pfs=r17;                         \
231         dep r27=r0,r27,16,14;           /* clear bits 16..29 of the saved ar.rsc (presumably loadrs) */ \
232         mov b0=r16;                             \
233         ;;                                      \
234         br.ret.sptk b0;                 /* return-type branch; lands on label 2 */ \
235         ;;                                      \
236 2:                                              \
237         mov ar.rsc=r0                           \
238         ;;                                      \
239         flushrs;                                \
240         ;;                                      \
241         mov ar.bspstore=r22                     \
242         ;;                                      \
243         mov r18=ar.bsp;                 /* refresh r18 after the flush */ \
244         ;;                                      \
245 1:                                              \
246         .pred.rel "mutex", pKStk, pUStk /* tell the assembler the two predicates are mutually exclusive */
247
/*
 * Convenience wrappers around
 * DO_SAVE_MIN(__COVER, SAVE_IFS, EXTRA, WORKAROUND).
 *
 *   SAVE_MIN_WITH_COVER:     COVER, r30 = cr.ifs, no EXTRA, RSE_WORKAROUND
 *   SAVE_MIN_WITH_COVER_R19: same, plus EXTRA copies r19 into r15
 *   SAVE_MIN:                no COVER, r30 = r0, no EXTRA, no workaround
 *
 * NOTE(review): DO_SAVE_MIN and COVER are not defined in this file;
 * presumably DO_SAVE_MIN maps to IA64_NATIVE_DO_SAVE_MIN (or a
 * paravirtualized variant) via paravirt_inst.h -- confirm.
 */
248 #define SAVE_MIN_WITH_COVER     DO_SAVE_MIN(COVER, mov r30=cr.ifs, , RSE_WORKAROUND)
249 #define SAVE_MIN_WITH_COVER_R19 DO_SAVE_MIN(COVER, mov r30=cr.ifs, mov r15=r19, RSE_WORKAROUND)
250 #define SAVE_MIN                        DO_SAVE_MIN(     , mov r30=r0, , )