2 * linux/arch/arm/kernel/entry-armv.S
4 * Copyright (C) 1996,1997,1998 Russell King.
5 * ARM700 fix by Matthew Godbolt (linux-user@willothewisp.demon.co.uk)
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
11 * Low-level vector interface routines
13 * Note: there is a StrongARM bug in the STMIA rn, {regs}^ instruction that causes
14 * it to save wrong values... Be aware!
16 #include <linux/config.h>
19 #include <asm/vfpmacros.h>
20 #include <asm/hardware.h> /* should be moved into entry-macro.S */
21 #include <asm/arch/irqs.h> /* should be moved into entry-macro.S */
22 #include <asm/arch/entry-macro.S>
24 #include "entry-header.S"
27 * Interrupt handling. Preserves r7, r8, r9
30 1: get_irqnr_and_base r0, r6, r5, lr
33 @ routine called with r0 = irq number, r1 = struct pt_regs *
42 * this macro assumes that irqstat (r6) and base (r5) are
43 * preserved from get_irqnr_and_base above
45 test_for_ipi r0, r6, r5, lr
54 * Invalid mode handlers
56 .macro inv_entry, reason
57 sub sp, sp, #S_FRAME_SIZE
63 inv_entry BAD_PREFETCH
75 inv_entry BAD_UNDEFINSTR
78 @ XXX fall through to common_invalid
82 @ common_invalid - generic code for failed exception (re-entrant version of handlers)
88 add r0, sp, #S_PC @ here for interlock avoidance
89 mov r7, #-1 @ "" "" "" ""
90 str r4, [sp] @ save preserved r0
91 stmia r0, {r5 - r7} @ lr_<exception>,
92 @ cpsr_<exception>, "old_r0"
102 sub sp, sp, #S_FRAME_SIZE
106 add r5, sp, #S_SP @ here for interlock avoidance
107 mov r4, #-1 @ "" "" "" ""
108 add r0, sp, #S_FRAME_SIZE @ "" "" "" ""
109 str r1, [sp] @ save the "real" r0 copied
110 @ from the exception stack
115 @ We are now ready to fill in the remaining blanks on the stack:
119 @ r2 - lr_<exception>, already fixed up for correct return/restart
120 @ r3 - spsr_<exception>
121 @ r4 - orig_r0 (see pt_regs definition in ptrace.h)
131 @ get ready to re-enable interrupts if appropriate
135 biceq r9, r9, #PSR_I_BIT
138 @ Call the processor-specific abort handler:
140 @ r2 - aborted context pc
141 @ r3 - aborted context cpsr
143 @ The abort handler must return the aborted address in r0, and
144 @ the fault status register in r1. r9 must be preserved.
155 @ set desired IRQ state, then call main handler
162 @ IRQs off again before pulling preserved data off the stack
167 @ restore SPSR and restart the instruction
171 ldmia sp, {r0 - pc}^ @ load r0 - pc, cpsr
177 #ifdef CONFIG_PREEMPT
179 ldr r8, [tsk, #TI_PREEMPT] @ get preempt count
180 add r7, r8, #1 @ increment it
181 str r7, [tsk, #TI_PREEMPT]
185 #ifdef CONFIG_PREEMPT
186 ldr r0, [tsk, #TI_FLAGS] @ get flags
187 tst r0, #_TIF_NEED_RESCHED
190 ldr r0, [tsk, #TI_PREEMPT] @ read preempt value
191 str r8, [tsk, #TI_PREEMPT] @ restore preempt count
193 strne r0, [r0, -r0] @ bug()
195 ldr r0, [sp, #S_PSR] @ irqs are already disabled
197 ldmia sp, {r0 - pc}^ @ load r0 - pc, cpsr
201 #ifdef CONFIG_PREEMPT
203 teq r8, #0 @ was preempt count = 0
204 ldreq r6, .LCirq_stat
206 ldr r0, [r6, #4] @ local_irq_count
207 ldr r1, [r6, #8] @ local_bh_count
210 mov r7, #0 @ preempt_schedule_irq
211 str r7, [tsk, #TI_PREEMPT] @ expects preempt_count == 0
212 1: bl preempt_schedule_irq @ irq en/disable is done inside
213 ldr r0, [tsk, #TI_FLAGS] @ get new tasks TI_FLAGS
214 tst r0, #_TIF_NEED_RESCHED
215 beq preempt_return @ go again
224 @ call emulation code, which returns using r9 if it has emulated
225 @ the instruction, or the more conventional lr if we are to treat
226 @ this as a real undefined instruction
234 mov r0, sp @ struct pt_regs *regs
238 @ IRQs off again before pulling preserved data off the stack
243 @ restore SPSR and restart the instruction
245 ldr lr, [sp, #S_PSR] @ Get SVC cpsr
247 ldmia sp, {r0 - pc}^ @ Restore SVC registers
254 @ re-enable interrupts if appropriate
258 biceq r9, r9, #PSR_I_BIT
262 @ set args, then call main handler
264 @ r0 - address of faulting instruction
265 @ r1 - pointer to registers on stack
267 mov r0, r2 @ address (pc)
269 bl do_PrefetchAbort @ call abort handler
272 @ IRQs off again before pulling preserved data off the stack
277 @ restore SPSR and restart the instruction
281 ldmia sp, {r0 - pc}^ @ load r0 - pc, cpsr
292 #ifdef CONFIG_PREEMPT
301 sub sp, sp, #S_FRAME_SIZE
305 add r0, sp, #S_PC @ here for interlock avoidance
306 mov r4, #-1 @ "" "" "" ""
308 str r1, [sp] @ save the "real" r0 copied
309 @ from the exception stack
311 #if __LINUX_ARM_ARCH__ < 6 && !defined(CONFIG_NEEDS_SYSCALL_FOR_CMPXCHG)
312 @ make sure our user space atomic helper is aborted
314 bichs r3, r3, #PSR_Z_BIT
318 @ We are now ready to fill in the remaining blanks on the stack:
320 @ r2 - lr_<exception>, already fixed up for correct return/restart
321 @ r3 - spsr_<exception>
322 @ r4 - orig_r0 (see pt_regs definition in ptrace.h)
324 @ Also, separately save sp_usr and lr_usr
330 @ Enable the alignment trap while in kernel mode
335 @ Clear FP to mark the first stack frame
345 @ Call the processor-specific abort handler:
347 @ r2 - aborted context pc
348 @ r3 - aborted context cpsr
350 @ The abort handler must return the aborted address in r0, and
351 @ the fault status register in r1.
362 @ IRQs on, then call the main handler
366 adr lr, ret_from_exception
374 #ifdef CONFIG_PREEMPT
375 ldr r8, [tsk, #TI_PREEMPT] @ get preempt count
376 add r7, r8, #1 @ increment it
377 str r7, [tsk, #TI_PREEMPT]
381 #ifdef CONFIG_PREEMPT
382 ldr r0, [tsk, #TI_PREEMPT]
383 str r8, [tsk, #TI_PREEMPT]
397 tst r3, #PSR_T_BIT @ Thumb mode?
398 bne fpundefinstr @ ignore FP
402 @ fall through to the emulation code, which returns using r9 if
403 @ it has emulated the instruction, or the more conventional lr
404 @ if we are to treat this as a real undefined instruction
409 adr r9, ret_from_exception
412 @ fallthrough to call_fpe
416 * The out of line fixup for the ldrt above.
418 .section .fixup, "ax"
421 .section __ex_table,"a"
426 * Check whether the instruction is a co-processor instruction.
427 * If yes, we need to call the relevant co-processor handler.
429 * Note that we don't do a full check here for the co-processor
430 * instructions; all instructions with bit 27 set are well
431 * defined. The only instructions that should fault are the
432 * co-processor instructions. However, we have to watch out
433 * for the ARM6/ARM7 SWI bug.
435 * Emulators may wish to make use of the following registers:
436 * r0 = instruction opcode.
438 * r10 = this threads thread_info structure.
441 tst r0, #0x08000000 @ only CDP/CPRT/LDC/STC have bit 27
442 #if defined(CONFIG_CPU_ARM610) || defined(CONFIG_CPU_ARM710)
443 and r8, r0, #0x0f000000 @ mask out op-code bits
444 teqne r8, #0x0f000000 @ SWI (ARM6/7 bug)?
447 get_thread_info r10 @ get current thread
448 and r8, r0, #0x00000f00 @ mask out CP number
450 add r6, r10, #TI_USED_CP
451 strb r7, [r6, r8, lsr #8] @ set appropriate used_cp[]
453 @ Test if we need to give access to iWMMXt coprocessors
454 ldr r5, [r10, #TI_FLAGS]
455 rsbs r7, r8, #(1 << 8) @ CP 0 or 1 only
456 movcss r7, r5, lsr #(TIF_USING_IWMMXT + 1)
457 bcs iwmmxt_task_enable
460 add pc, pc, r8, lsr #6
464 b do_fpe @ CP#1 (FPE)
465 b do_fpe @ CP#2 (FPE)
474 b do_vfp @ CP#10 (VFP)
475 b do_vfp @ CP#11 (VFP)
477 mov pc, lr @ CP#10 (VFP)
478 mov pc, lr @ CP#11 (VFP)
482 mov pc, lr @ CP#14 (Debug)
483 mov pc, lr @ CP#15 (Control)
487 add r10, r10, #TI_FPSTATE @ r10 = workspace
488 ldr pc, [r4] @ Call FP module USR entry point
491 * The FP module is called with these registers set:
494 * r9 = normal "successful" return address
496 * lr = unrecognised FP instruction return address
506 adr lr, ret_from_exception
513 enable_irq @ Enable interrupts
514 mov r0, r2 @ address (pc)
516 bl do_PrefetchAbort @ call abort handler
519 * This is the return code to user mode for abort handlers
521 ENTRY(ret_from_exception)
527 * Register switch for ARMv3 and ARMv4 processors
528 * r0 = previous task_struct, r1 = previous thread_info, r2 = next thread_info
529 * previous and next are guaranteed not to be the same.
532 add ip, r1, #TI_CPU_SAVE
533 ldr r3, [r2, #TI_TP_VALUE]
534 stmia ip!, {r4 - sl, fp, sp, lr} @ Store most regs on stack
535 ldr r6, [r2, #TI_CPU_DOMAIN]!
536 #if __LINUX_ARM_ARCH__ >= 6
537 #ifdef CONFIG_CPU_MPCORE
540 strex r3, r4, [ip] @ Clear exclusive monitor
543 #if defined(CONFIG_CPU_XSCALE) && !defined(CONFIG_IWMMXT)
547 #if defined(CONFIG_HAS_TLS_REG)
548 mcr p15, 0, r3, c13, c0, 3 @ set TLS register
549 #elif !defined(CONFIG_TLS_REG_EMUL)
551 str r3, [r4, #-15] @ TLS val at 0xffff0ff0
553 mcr p15, 0, r6, c3, c0, 0 @ Set domain register
555 @ Always disable VFP so we can lazily save/restore the old
556 @ state. This occurs in the context of the previous thread.
558 bic r4, r4, #FPEXC_ENABLE
561 #if defined(CONFIG_IWMMXT)
562 bl iwmmxt_task_switch
563 #elif defined(CONFIG_CPU_XSCALE)
564 add r4, r2, #40 @ cpu_context_save->extra
568 ldmib r2, {r4 - sl, fp, sp, pc} @ Load all regs saved previously
575 * These are segment of kernel provided user code reachable from user space
576 * at a fixed address in kernel memory. This is used to provide user space
577 * with some operations which require kernel help because of unimplemented
578 * native feature and/or instructions in many ARM CPUs. The idea is for
579 * this code to be executed directly in user mode for best efficiency but
580 * which is too intimate with the kernel counter part to be left to user
581 * libraries. In fact this code might even differ from one CPU to another
582 * depending on the available instruction set and restrictions like on
583 * SMP systems. In other words, the kernel reserves the right to change
584 * this code as needed without warning. Only the entry points and their
585 * results are guaranteed to be stable.
587 * Each segment is 32-byte aligned and will be moved to the top of the high
588 * vector page. New segments (if ever needed) must be added in front of
589 * existing ones. This mechanism should be used only for things that are
590 * really small and justified, and not be abused freely.
592 * User space is expected to implement those things inline when optimizing
593 * for a processor that has the necessary native support, but only if such
594 * resulting binaries are already to be incompatible with earlier ARM
595 * processors due to the use of unsupported instructions other than what
596 * is provided here. In other words don't make binaries unable to run on
597 * earlier processors just for the sake of not using these kernel helpers
598 * if your compiled code is not going to use the new instructions for other
603 .globl __kuser_helper_start
604 __kuser_helper_start:
607 * Reference prototype:
609 * int __kernel_cmpxchg(int oldval, int newval, int *ptr)
616 * lr = return address
620 * r0 = returned value (zero or non-zero)
621 * C flag = set if r0 == 0, clear if r0 != 0
627 * Definition and user space usage example:
629 * typedef int (__kernel_cmpxchg_t)(int oldval, int newval, int *ptr);
630 * #define __kernel_cmpxchg (*(__kernel_cmpxchg_t *)0xffff0fc0)
632 * Atomically store newval in *ptr if *ptr is equal to oldval for user space.
633 * Return zero if *ptr was changed or non-zero if no exchange happened.
634 * The C flag is also set if *ptr was changed to allow for assembly
635 * optimization in the calling code.
637 * For example, a user space atomic_add implementation could look like this:
639 * #define atomic_add(ptr, val) \
640 * ({ register unsigned int *__ptr asm("r2") = (ptr); \
641 * register unsigned int __result asm("r1"); \
643 * "1: @ atomic_add\n\t" \
644 * "ldr r0, [r2]\n\t" \
645 * "mov r3, #0xffff0fff\n\t" \
646 * "add lr, pc, #4\n\t" \
647 * "add r1, r0, %2\n\t" \
648 * "add pc, r3, #(0xffff0fc0 - 0xffff0fff)\n\t" \
650 * : "=&r" (__result) \
651 * : "r" (__ptr), "rIL" (val) \
652 * : "r0","r3","ip","lr","cc","memory" ); \
656 __kuser_cmpxchg: @ 0xffff0fc0
658 #if defined(CONFIG_NEEDS_SYSCALL_FOR_CMPXCHG)
661 * Poor you. No fast solution possible...
662 * The kernel itself must perform the operation.
663 * A special ghost syscall is used for that (see traps.c).
668 #elif __LINUX_ARM_ARCH__ < 6
671 * Theory of operation:
673 * We set the Z flag before loading oldval. If ever an exception
674 * occurs we can not be sure the loaded value will still be the same
675 * when the exception returns, therefore the user exception handler
676 * will clear the Z flag whenever the interrupted user code was
677 * actually from the kernel address space (see the usr_entry macro).
679 * The post-increment on the str is used to prevent a race with an
680 * exception happening just after the str instruction which would
681 * clear the Z flag although the exchange was done.
683 teq ip, ip @ set Z flag
684 ldr ip, [r2] @ load current val
685 add r3, r2, #1 @ prepare store ptr
686 teqeq ip, r0 @ compare with oldval if still allowed
687 streq r1, [r3, #-1]! @ store newval if still allowed
688 subs r0, r2, r3 @ if r2 == r3 the str occured
704 * Reference prototype:
706 * int __kernel_get_tls(void)
710 * lr = return address
718 * the Z flag might be lost
720 * Definition and user space usage example:
722 * typedef int (__kernel_get_tls_t)(void);
723 * #define __kernel_get_tls (*(__kernel_get_tls_t *)0xffff0fe0)
725 * Get the TLS value as previously set via the __ARM_NR_set_tls syscall.
727 * This could be used as follows:
729 * #define __kernel_get_tls() \
730 * ({ register unsigned int __val asm("r0"); \
731 * asm( "mov r0, #0xffff0fff; mov lr, pc; sub pc, r0, #31" \
732 * : "=r" (__val) : : "lr","cc" ); \
736 __kuser_get_tls: @ 0xffff0fe0
738 #if !defined(CONFIG_HAS_TLS_REG) && !defined(CONFIG_TLS_REG_EMUL)
740 ldr r0, [pc, #(16 - 8)] @ TLS stored at 0xffff0ff0
745 mrc p15, 0, r0, c13, c0, 3 @ read TLS register
751 .word 0 @ pad up to __kuser_helper_version
755 * Reference declaration:
757 * extern unsigned int __kernel_helper_version;
759 * Definition and user space usage example:
761 * #define __kernel_helper_version (*(unsigned int *)0xffff0ffc)
763 * User space may read this to determine the curent number of helpers
767 __kuser_helper_version: @ 0xffff0ffc
768 .word ((__kuser_helper_end - __kuser_helper_start) >> 5)
770 .globl __kuser_helper_end
777 * This code is copied to 0xffff0200 so we can use branches in the
778 * vectors, rather than ldr's. Note that this code must not
779 * exceed 0x300 bytes.
781 * Common stub entry macro:
782 * Enter in IRQ mode, spsr = SVC/USR CPSR, lr = SVC/USR PC
784 * SP points to a minimal amount of processor-private memory, the address
785 * of which is copied into r0 for the mode specific abort handler.
787 .macro vector_stub, name, correction=0
792 sub lr, lr, #\correction
796 @ Save r0, lr_<exception> (parent PC) and spsr_<exception>
799 stmia sp, {r0, lr} @ save r0, lr
801 str lr, [sp, #8] @ save spsr
804 @ Prepare for SVC32 mode. IRQs remain disabled.
807 bic r0, r0, #MODE_MASK
808 orr r0, r0, #SVC_MODE
812 @ the branch table must immediately follow this code
816 ldr lr, [pc, lr, lsl #2]
817 movs pc, lr @ branch to handler in SVC mode
823 * Interrupt dispatcher
827 .long __irq_usr @ 0 (USR_26 / USR_32)
828 .long __irq_invalid @ 1 (FIQ_26 / FIQ_32)
829 .long __irq_invalid @ 2 (IRQ_26 / IRQ_32)
830 .long __irq_svc @ 3 (SVC_26 / SVC_32)
831 .long __irq_invalid @ 4
832 .long __irq_invalid @ 5
833 .long __irq_invalid @ 6
834 .long __irq_invalid @ 7
835 .long __irq_invalid @ 8
836 .long __irq_invalid @ 9
837 .long __irq_invalid @ a
838 .long __irq_invalid @ b
839 .long __irq_invalid @ c
840 .long __irq_invalid @ d
841 .long __irq_invalid @ e
842 .long __irq_invalid @ f
845 * Data abort dispatcher
846 * Enter in ABT mode, spsr = USR CPSR, lr = USR PC
850 .long __dabt_usr @ 0 (USR_26 / USR_32)
851 .long __dabt_invalid @ 1 (FIQ_26 / FIQ_32)
852 .long __dabt_invalid @ 2 (IRQ_26 / IRQ_32)
853 .long __dabt_svc @ 3 (SVC_26 / SVC_32)
854 .long __dabt_invalid @ 4
855 .long __dabt_invalid @ 5
856 .long __dabt_invalid @ 6
857 .long __dabt_invalid @ 7
858 .long __dabt_invalid @ 8
859 .long __dabt_invalid @ 9
860 .long __dabt_invalid @ a
861 .long __dabt_invalid @ b
862 .long __dabt_invalid @ c
863 .long __dabt_invalid @ d
864 .long __dabt_invalid @ e
865 .long __dabt_invalid @ f
868 * Prefetch abort dispatcher
869 * Enter in ABT mode, spsr = USR CPSR, lr = USR PC
873 .long __pabt_usr @ 0 (USR_26 / USR_32)
874 .long __pabt_invalid @ 1 (FIQ_26 / FIQ_32)
875 .long __pabt_invalid @ 2 (IRQ_26 / IRQ_32)
876 .long __pabt_svc @ 3 (SVC_26 / SVC_32)
877 .long __pabt_invalid @ 4
878 .long __pabt_invalid @ 5
879 .long __pabt_invalid @ 6
880 .long __pabt_invalid @ 7
881 .long __pabt_invalid @ 8
882 .long __pabt_invalid @ 9
883 .long __pabt_invalid @ a
884 .long __pabt_invalid @ b
885 .long __pabt_invalid @ c
886 .long __pabt_invalid @ d
887 .long __pabt_invalid @ e
888 .long __pabt_invalid @ f
891 * Undef instr entry dispatcher
892 * Enter in UND mode, spsr = SVC/USR CPSR, lr = SVC/USR PC
896 .long __und_usr @ 0 (USR_26 / USR_32)
897 .long __und_invalid @ 1 (FIQ_26 / FIQ_32)
898 .long __und_invalid @ 2 (IRQ_26 / IRQ_32)
899 .long __und_svc @ 3 (SVC_26 / SVC_32)
900 .long __und_invalid @ 4
901 .long __und_invalid @ 5
902 .long __und_invalid @ 6
903 .long __und_invalid @ 7
904 .long __und_invalid @ 8
905 .long __und_invalid @ 9
906 .long __und_invalid @ a
907 .long __und_invalid @ b
908 .long __und_invalid @ c
909 .long __und_invalid @ d
910 .long __und_invalid @ e
911 .long __und_invalid @ f
915 /*=============================================================================
917 *-----------------------------------------------------------------------------
918 * Enter in FIQ mode, spsr = ANY CPSR, lr = ANY PC
919 * MUST PRESERVE SVC SPSR, but need to switch to SVC mode to show our msg.
920 * Basically to switch modes, we *HAVE* to clobber one register... brain
921 * damage alert! I don't think that we can execute any code in here in any
922 * other mode than FIQ... Ok you can switch to another mode, but you can't
923 * get out of that mode without clobbering one register.
929 /*=============================================================================
930 * Address exception handler
931 *-----------------------------------------------------------------------------
932 * These aren't too critical.
933 * (they're not supposed to happen, and won't happen in 32-bit data mode).
940 * We group all the following data together to optimise
941 * for CPUs with separate I & D caches.
951 .equ stubs_offset, __vectors_start + 0x200 - __stubs_start
953 .globl __vectors_start
956 b vector_und + stubs_offset
957 ldr pc, .LCvswi + stubs_offset
958 b vector_pabt + stubs_offset
959 b vector_dabt + stubs_offset
960 b vector_addrexcptn + stubs_offset
961 b vector_irq + stubs_offset
962 b vector_fiq + stubs_offset
970 .globl cr_no_alignment