Commit 9a2533c3 authored by Linus Torvalds's avatar Linus Torvalds

Merge branch 'fixes' of git://git.linaro.org/people/rmk/linux-arm

Pull ARM fixes from Russell King:
 "This fixes various issues found during July"

* 'fixes' of git://git.linaro.org/people/rmk/linux-arm:
  ARM: 7479/1: mm: avoid NULL dereference when flushing gate_vma with VIVT caches
  ARM: Fix undefined instruction exception handling
  ARM: 7480/1: only call smp_send_stop() on SMP
  ARM: 7478/1: errata: extend workaround for erratum #720789
  ARM: 7477/1: vfp: Always save VFP state in vfp_pm_suspend on UP
  ARM: 7476/1: vfp: only clear vfp state for current cpu in vfp_pm_suspend
  ARM: 7468/1: ftrace: Trace function entry before updating index
  ARM: 7467/1: mutex: use generic xchg-based implementation for ARMv6+
  ARM: 7466/1: disable interrupt before spinning endlessly
  ARM: 7465/1: Handle >4GB memory sizes in device tree and mem=size@start option
parents d4fdc325 b74253f7
...@@ -215,7 +215,9 @@ static inline void vivt_flush_cache_mm(struct mm_struct *mm) ...@@ -215,7 +215,9 @@ static inline void vivt_flush_cache_mm(struct mm_struct *mm)
static inline void static inline void
vivt_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned long end) vivt_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned long end)
{ {
if (cpumask_test_cpu(smp_processor_id(), mm_cpumask(vma->vm_mm))) struct mm_struct *mm = vma->vm_mm;
if (!mm || cpumask_test_cpu(smp_processor_id(), mm_cpumask(mm)))
__cpuc_flush_user_range(start & PAGE_MASK, PAGE_ALIGN(end), __cpuc_flush_user_range(start & PAGE_MASK, PAGE_ALIGN(end),
vma->vm_flags); vma->vm_flags);
} }
...@@ -223,7 +225,9 @@ vivt_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned ...@@ -223,7 +225,9 @@ vivt_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned
static inline void static inline void
vivt_flush_cache_page(struct vm_area_struct *vma, unsigned long user_addr, unsigned long pfn) vivt_flush_cache_page(struct vm_area_struct *vma, unsigned long user_addr, unsigned long pfn)
{ {
if (cpumask_test_cpu(smp_processor_id(), mm_cpumask(vma->vm_mm))) { struct mm_struct *mm = vma->vm_mm;
if (!mm || cpumask_test_cpu(smp_processor_id(), mm_cpumask(mm))) {
unsigned long addr = user_addr & PAGE_MASK; unsigned long addr = user_addr & PAGE_MASK;
__cpuc_flush_user_range(addr, addr + PAGE_SIZE, vma->vm_flags); __cpuc_flush_user_range(addr, addr + PAGE_SIZE, vma->vm_flags);
} }
......
...@@ -7,121 +7,10 @@ ...@@ -7,121 +7,10 @@
*/ */
#ifndef _ASM_MUTEX_H #ifndef _ASM_MUTEX_H
#define _ASM_MUTEX_H #define _ASM_MUTEX_H
#if __LINUX_ARM_ARCH__ < 6
/* On pre-ARMv6 hardware the swp based implementation is the most efficient. */
# include <asm-generic/mutex-xchg.h>
#else
/* /*
* Attempting to lock a mutex on ARMv6+ can be done with a bastardized * On pre-ARMv6 hardware this results in a swp-based implementation,
* atomic decrement (it is not a reliable atomic decrement but it satisfies * which is the most efficient. For ARMv6+, we emit a pair of exclusive
* the defined semantics for our purpose, while being smaller and faster * accesses instead.
* than a real atomic decrement or atomic swap. The idea is to attempt
* decrementing the lock value only once. If once decremented it isn't zero,
* or if its store-back fails due to a dispute on the exclusive store, we
* simply bail out immediately through the slow path where the lock will be
* reattempted until it succeeds.
*/ */
static inline void #include <asm-generic/mutex-xchg.h>
__mutex_fastpath_lock(atomic_t *count, void (*fail_fn)(atomic_t *))
{
int __ex_flag, __res;
__asm__ (
"ldrex %0, [%2] \n\t"
"sub %0, %0, #1 \n\t"
"strex %1, %0, [%2] "
: "=&r" (__res), "=&r" (__ex_flag)
: "r" (&(count)->counter)
: "cc","memory" );
__res |= __ex_flag;
if (unlikely(__res != 0))
fail_fn(count);
}
static inline int
__mutex_fastpath_lock_retval(atomic_t *count, int (*fail_fn)(atomic_t *))
{
int __ex_flag, __res;
__asm__ (
"ldrex %0, [%2] \n\t"
"sub %0, %0, #1 \n\t"
"strex %1, %0, [%2] "
: "=&r" (__res), "=&r" (__ex_flag)
: "r" (&(count)->counter)
: "cc","memory" );
__res |= __ex_flag;
if (unlikely(__res != 0))
__res = fail_fn(count);
return __res;
}
/*
* Same trick is used for the unlock fast path. However the original value,
* rather than the result, is used to test for success in order to have
* better generated assembly.
*/
static inline void
__mutex_fastpath_unlock(atomic_t *count, void (*fail_fn)(atomic_t *))
{
int __ex_flag, __res, __orig;
__asm__ (
"ldrex %0, [%3] \n\t"
"add %1, %0, #1 \n\t"
"strex %2, %1, [%3] "
: "=&r" (__orig), "=&r" (__res), "=&r" (__ex_flag)
: "r" (&(count)->counter)
: "cc","memory" );
__orig |= __ex_flag;
if (unlikely(__orig != 0))
fail_fn(count);
}
/*
* If the unlock was done on a contended lock, or if the unlock simply fails
* then the mutex remains locked.
*/
#define __mutex_slowpath_needs_to_unlock() 1
/*
* For __mutex_fastpath_trylock we use another construct which could be
* described as a "single value cmpxchg".
*
* This provides the needed trylock semantics like cmpxchg would, but it is
* lighter and less generic than a true cmpxchg implementation.
*/
static inline int
__mutex_fastpath_trylock(atomic_t *count, int (*fail_fn)(atomic_t *))
{
int __ex_flag, __res, __orig;
__asm__ (
"1: ldrex %0, [%3] \n\t"
"subs %1, %0, #1 \n\t"
"strexeq %2, %1, [%3] \n\t"
"movlt %0, #0 \n\t"
"cmpeq %2, #0 \n\t"
"bgt 1b "
: "=&r" (__orig), "=&r" (__res), "=&r" (__ex_flag)
: "r" (&count->counter)
: "cc", "memory" );
return __orig;
}
#endif
#endif #endif
...@@ -196,7 +196,7 @@ static const struct tagtable __tagtable_##fn __tag = { tag, fn } ...@@ -196,7 +196,7 @@ static const struct tagtable __tagtable_##fn __tag = { tag, fn }
struct membank { struct membank {
phys_addr_t start; phys_addr_t start;
unsigned long size; phys_addr_t size;
unsigned int highmem; unsigned int highmem;
}; };
...@@ -217,7 +217,7 @@ extern struct meminfo meminfo; ...@@ -217,7 +217,7 @@ extern struct meminfo meminfo;
#define bank_phys_end(bank) ((bank)->start + (bank)->size) #define bank_phys_end(bank) ((bank)->start + (bank)->size)
#define bank_phys_size(bank) (bank)->size #define bank_phys_size(bank) (bank)->size
extern int arm_add_memory(phys_addr_t start, unsigned long size); extern int arm_add_memory(phys_addr_t start, phys_addr_t size);
extern void early_print(const char *str, ...); extern void early_print(const char *str, ...);
extern void dump_machine_table(void); extern void dump_machine_table(void);
......
...@@ -244,6 +244,19 @@ svc_preempt: ...@@ -244,6 +244,19 @@ svc_preempt:
b 1b b 1b
#endif #endif
__und_fault:
@ Correct the PC such that it is pointing at the instruction
@ which caused the fault. If the faulting instruction was ARM
@ the PC will be pointing at the next instruction, and have to
@ subtract 4. Otherwise, it is Thumb, and the PC will be
@ pointing at the second half of the Thumb instruction. We
@ have to subtract 2.
ldr r2, [r0, #S_PC]
sub r2, r2, r1
str r2, [r0, #S_PC]
b do_undefinstr
ENDPROC(__und_fault)
.align 5 .align 5
__und_svc: __und_svc:
#ifdef CONFIG_KPROBES #ifdef CONFIG_KPROBES
...@@ -261,25 +274,32 @@ __und_svc: ...@@ -261,25 +274,32 @@ __und_svc:
@ @
@ r0 - instruction @ r0 - instruction
@ @
#ifndef CONFIG_THUMB2_KERNEL #ifndef CONFIG_THUMB2_KERNEL
ldr r0, [r4, #-4] ldr r0, [r4, #-4]
#else #else
mov r1, #2
ldrh r0, [r4, #-2] @ Thumb instruction at LR - 2 ldrh r0, [r4, #-2] @ Thumb instruction at LR - 2
cmp r0, #0xe800 @ 32-bit instruction if xx >= 0 cmp r0, #0xe800 @ 32-bit instruction if xx >= 0
ldrhhs r9, [r4] @ bottom 16 bits blo __und_svc_fault
orrhs r0, r9, r0, lsl #16 ldrh r9, [r4] @ bottom 16 bits
add r4, r4, #2
str r4, [sp, #S_PC]
orr r0, r9, r0, lsl #16
#endif #endif
adr r9, BSYM(1f) adr r9, BSYM(__und_svc_finish)
mov r2, r4 mov r2, r4
bl call_fpe bl call_fpe
mov r1, #4 @ PC correction to apply
__und_svc_fault:
mov r0, sp @ struct pt_regs *regs mov r0, sp @ struct pt_regs *regs
bl do_undefinstr bl __und_fault
@ @
@ IRQs off again before pulling preserved data off the stack @ IRQs off again before pulling preserved data off the stack
@ @
1: disable_irq_notrace __und_svc_finish:
disable_irq_notrace
@ @
@ restore SPSR and restart the instruction @ restore SPSR and restart the instruction
...@@ -423,25 +443,33 @@ __und_usr: ...@@ -423,25 +443,33 @@ __und_usr:
mov r2, r4 mov r2, r4
mov r3, r5 mov r3, r5
@ r2 = regs->ARM_pc, which is either 2 or 4 bytes ahead of the
@ faulting instruction depending on Thumb mode.
@ r3 = regs->ARM_cpsr
@ @
@ fall through to the emulation code, which returns using r9 if @ The emulation code returns using r9 if it has emulated the
@ it has emulated the instruction, or the more conventional lr @ instruction, or the more conventional lr if we are to treat
@ if we are to treat this as a real undefined instruction @ this as a real undefined instruction
@
@ r0 - instruction
@ @
adr r9, BSYM(ret_from_exception) adr r9, BSYM(ret_from_exception)
adr lr, BSYM(__und_usr_unknown)
tst r3, #PSR_T_BIT @ Thumb mode? tst r3, #PSR_T_BIT @ Thumb mode?
itet eq @ explicit IT needed for the 1f label bne __und_usr_thumb
subeq r4, r2, #4 @ ARM instr at LR - 4 sub r4, r2, #4 @ ARM instr at LR - 4
subne r4, r2, #2 @ Thumb instr at LR - 2 1: ldrt r0, [r4]
1: ldreqt r0, [r4]
#ifdef CONFIG_CPU_ENDIAN_BE8 #ifdef CONFIG_CPU_ENDIAN_BE8
reveq r0, r0 @ little endian instruction rev r0, r0 @ little endian instruction
#endif #endif
beq call_fpe @ r0 = 32-bit ARM instruction which caused the exception
@ r2 = PC value for the following instruction (:= regs->ARM_pc)
@ r4 = PC value for the faulting instruction
@ lr = 32-bit undefined instruction function
adr lr, BSYM(__und_usr_fault_32)
b call_fpe
__und_usr_thumb:
@ Thumb instruction @ Thumb instruction
sub r4, r2, #2 @ First half of thumb instr at LR - 2
#if CONFIG_ARM_THUMB && __LINUX_ARM_ARCH__ >= 6 && CONFIG_CPU_V7 #if CONFIG_ARM_THUMB && __LINUX_ARM_ARCH__ >= 6 && CONFIG_CPU_V7
/* /*
* Thumb-2 instruction handling. Note that because pre-v6 and >= v6 platforms * Thumb-2 instruction handling. Note that because pre-v6 and >= v6 platforms
...@@ -455,7 +483,7 @@ __und_usr: ...@@ -455,7 +483,7 @@ __und_usr:
ldr r5, .LCcpu_architecture ldr r5, .LCcpu_architecture
ldr r5, [r5] ldr r5, [r5]
cmp r5, #CPU_ARCH_ARMv7 cmp r5, #CPU_ARCH_ARMv7
blo __und_usr_unknown blo __und_usr_fault_16 @ 16bit undefined instruction
/* /*
* The following code won't get run unless the running CPU really is v7, so * The following code won't get run unless the running CPU really is v7, so
* coding round the lack of ldrht on older arches is pointless. Temporarily * coding round the lack of ldrht on older arches is pointless. Temporarily
...@@ -463,15 +491,18 @@ __und_usr: ...@@ -463,15 +491,18 @@ __und_usr:
*/ */
.arch armv6t2 .arch armv6t2
#endif #endif
2: 2: ldrht r5, [r4]
ARM( ldrht r5, [r4], #2 )
THUMB( ldrht r5, [r4] )
THUMB( add r4, r4, #2 )
cmp r5, #0xe800 @ 32bit instruction if xx != 0 cmp r5, #0xe800 @ 32bit instruction if xx != 0
blo __und_usr_unknown blo __und_usr_fault_16 @ 16bit undefined instruction
3: ldrht r0, [r4] 3: ldrht r0, [r2]
add r2, r2, #2 @ r2 is PC + 2, make it PC + 4 add r2, r2, #2 @ r2 is PC + 2, make it PC + 4
str r2, [sp, #S_PC] @ it's a 2x16bit instr, update
orr r0, r0, r5, lsl #16 orr r0, r0, r5, lsl #16
adr lr, BSYM(__und_usr_fault_32)
@ r0 = the two 16-bit Thumb instructions which caused the exception
@ r2 = PC value for the following Thumb instruction (:= regs->ARM_pc)
@ r4 = PC value for the first 16-bit Thumb instruction
@ lr = 32bit undefined instruction function
#if __LINUX_ARM_ARCH__ < 7 #if __LINUX_ARM_ARCH__ < 7
/* If the target arch was overridden, change it back: */ /* If the target arch was overridden, change it back: */
...@@ -482,17 +513,13 @@ __und_usr: ...@@ -482,17 +513,13 @@ __und_usr:
#endif #endif
#endif /* __LINUX_ARM_ARCH__ < 7 */ #endif /* __LINUX_ARM_ARCH__ < 7 */
#else /* !(CONFIG_ARM_THUMB && __LINUX_ARM_ARCH__ >= 6 && CONFIG_CPU_V7) */ #else /* !(CONFIG_ARM_THUMB && __LINUX_ARM_ARCH__ >= 6 && CONFIG_CPU_V7) */
b __und_usr_unknown b __und_usr_fault_16
#endif #endif
UNWIND(.fnend ) UNWIND(.fnend)
ENDPROC(__und_usr) ENDPROC(__und_usr)
@
@ fallthrough to call_fpe
@
/* /*
* The out of line fixup for the ldrt above. * The out of line fixup for the ldrt instructions above.
*/ */
.pushsection .fixup, "ax" .pushsection .fixup, "ax"
.align 2 .align 2
...@@ -524,11 +551,12 @@ ENDPROC(__und_usr) ...@@ -524,11 +551,12 @@ ENDPROC(__und_usr)
* NEON handler code. * NEON handler code.
* *
* Emulators may wish to make use of the following registers: * Emulators may wish to make use of the following registers:
* r0 = instruction opcode. * r0 = instruction opcode (32-bit ARM or two 16-bit Thumb)
* r2 = PC+4 * r2 = PC value to resume execution after successful emulation
* r9 = normal "successful" return address * r9 = normal "successful" return address
* r10 = this threads thread_info structure. * r10 = this threads thread_info structure
* lr = unrecognised instruction return address * lr = unrecognised instruction return address
* IRQs disabled, FIQs enabled.
*/ */
@ @
@ Fall-through from Thumb-2 __und_usr @ Fall-through from Thumb-2 __und_usr
...@@ -659,12 +687,17 @@ ENTRY(no_fp) ...@@ -659,12 +687,17 @@ ENTRY(no_fp)
mov pc, lr mov pc, lr
ENDPROC(no_fp) ENDPROC(no_fp)
__und_usr_unknown: __und_usr_fault_32:
enable_irq mov r1, #4
b 1f
__und_usr_fault_16:
mov r1, #2
1: enable_irq
mov r0, sp mov r0, sp
adr lr, BSYM(ret_from_exception) adr lr, BSYM(ret_from_exception)
b do_undefinstr b __und_fault
ENDPROC(__und_usr_unknown) ENDPROC(__und_usr_fault_32)
ENDPROC(__und_usr_fault_16)
.align 5 .align 5
__pabt_usr: __pabt_usr:
......
...@@ -179,19 +179,20 @@ void prepare_ftrace_return(unsigned long *parent, unsigned long self_addr, ...@@ -179,19 +179,20 @@ void prepare_ftrace_return(unsigned long *parent, unsigned long self_addr,
old = *parent; old = *parent;
*parent = return_hooker; *parent = return_hooker;
err = ftrace_push_return_trace(old, self_addr, &trace.depth,
frame_pointer);
if (err == -EBUSY) {
*parent = old;
return;
}
trace.func = self_addr; trace.func = self_addr;
trace.depth = current->curr_ret_stack + 1;
/* Only trace if the calling function expects to */ /* Only trace if the calling function expects to */
if (!ftrace_graph_entry(&trace)) { if (!ftrace_graph_entry(&trace)) {
current->curr_ret_stack--;
*parent = old; *parent = old;
return;
}
err = ftrace_push_return_trace(old, self_addr, &trace.depth,
frame_pointer);
if (err == -EBUSY) {
*parent = old;
return;
} }
} }
......
...@@ -247,6 +247,7 @@ void machine_shutdown(void) ...@@ -247,6 +247,7 @@ void machine_shutdown(void)
void machine_halt(void) void machine_halt(void)
{ {
machine_shutdown(); machine_shutdown();
local_irq_disable();
while (1); while (1);
} }
...@@ -268,6 +269,7 @@ void machine_restart(char *cmd) ...@@ -268,6 +269,7 @@ void machine_restart(char *cmd)
/* Whoops - the platform was unable to reboot. Tell the user! */ /* Whoops - the platform was unable to reboot. Tell the user! */
printk("Reboot failed -- System halted\n"); printk("Reboot failed -- System halted\n");
local_irq_disable();
while (1); while (1);
} }
......
...@@ -508,7 +508,7 @@ void __init dump_machine_table(void) ...@@ -508,7 +508,7 @@ void __init dump_machine_table(void)
/* can't use cpu_relax() here as it may require MMU setup */; /* can't use cpu_relax() here as it may require MMU setup */;
} }
int __init arm_add_memory(phys_addr_t start, unsigned long size) int __init arm_add_memory(phys_addr_t start, phys_addr_t size)
{ {
struct membank *bank = &meminfo.bank[meminfo.nr_banks]; struct membank *bank = &meminfo.bank[meminfo.nr_banks];
...@@ -538,7 +538,7 @@ int __init arm_add_memory(phys_addr_t start, unsigned long size) ...@@ -538,7 +538,7 @@ int __init arm_add_memory(phys_addr_t start, unsigned long size)
} }
#endif #endif
bank->size = size & PAGE_MASK; bank->size = size & ~(phys_addr_t)(PAGE_SIZE - 1);
/* /*
* Check whether this memory region has non-zero size or * Check whether this memory region has non-zero size or
...@@ -558,7 +558,7 @@ int __init arm_add_memory(phys_addr_t start, unsigned long size) ...@@ -558,7 +558,7 @@ int __init arm_add_memory(phys_addr_t start, unsigned long size)
static int __init early_mem(char *p) static int __init early_mem(char *p)
{ {
static int usermem __initdata = 0; static int usermem __initdata = 0;
unsigned long size; phys_addr_t size;
phys_addr_t start; phys_addr_t start;
char *endp; char *endp;
......
...@@ -563,7 +563,8 @@ void smp_send_stop(void) ...@@ -563,7 +563,8 @@ void smp_send_stop(void)
cpumask_copy(&mask, cpu_online_mask); cpumask_copy(&mask, cpu_online_mask);
cpumask_clear_cpu(smp_processor_id(), &mask); cpumask_clear_cpu(smp_processor_id(), &mask);
smp_cross_call(&mask, IPI_CPU_STOP); if (!cpumask_empty(&mask))
smp_cross_call(&mask, IPI_CPU_STOP);
/* Wait up to one second for other CPUs to stop */ /* Wait up to one second for other CPUs to stop */
timeout = USEC_PER_SEC; timeout = USEC_PER_SEC;
......
...@@ -402,18 +402,10 @@ static int call_undef_hook(struct pt_regs *regs, unsigned int instr) ...@@ -402,18 +402,10 @@ static int call_undef_hook(struct pt_regs *regs, unsigned int instr)
asmlinkage void __exception do_undefinstr(struct pt_regs *regs) asmlinkage void __exception do_undefinstr(struct pt_regs *regs)
{ {
unsigned int correction = thumb_mode(regs) ? 2 : 4;
unsigned int instr; unsigned int instr;
siginfo_t info; siginfo_t info;
void __user *pc; void __user *pc;
/*
* According to the ARM ARM, PC is 2 or 4 bytes ahead,
* depending whether we're in Thumb mode or not.
* Correct this offset.
*/
regs->ARM_pc -= correction;
pc = (void __user *)instruction_pointer(regs); pc = (void __user *)instruction_pointer(regs);
if (processor_mode(regs) == SVC_MODE) { if (processor_mode(regs) == SVC_MODE) {
......
...@@ -38,11 +38,19 @@ ENTRY(v7wbi_flush_user_tlb_range) ...@@ -38,11 +38,19 @@ ENTRY(v7wbi_flush_user_tlb_range)
dsb dsb
mov r0, r0, lsr #PAGE_SHIFT @ align address mov r0, r0, lsr #PAGE_SHIFT @ align address
mov r1, r1, lsr #PAGE_SHIFT mov r1, r1, lsr #PAGE_SHIFT
#ifdef CONFIG_ARM_ERRATA_720789
mov r3, #0
#else
asid r3, r3 @ mask ASID asid r3, r3 @ mask ASID
#endif
orr r0, r3, r0, lsl #PAGE_SHIFT @ Create initial MVA orr r0, r3, r0, lsl #PAGE_SHIFT @ Create initial MVA
mov r1, r1, lsl #PAGE_SHIFT mov r1, r1, lsl #PAGE_SHIFT
1: 1:
#ifdef CONFIG_ARM_ERRATA_720789
ALT_SMP(mcr p15, 0, r0, c8, c3, 3) @ TLB invalidate U MVA all ASID (shareable)
#else
ALT_SMP(mcr p15, 0, r0, c8, c3, 1) @ TLB invalidate U MVA (shareable) ALT_SMP(mcr p15, 0, r0, c8, c3, 1) @ TLB invalidate U MVA (shareable)
#endif
ALT_UP(mcr p15, 0, r0, c8, c7, 1) @ TLB invalidate U MVA ALT_UP(mcr p15, 0, r0, c8, c7, 1) @ TLB invalidate U MVA
add r0, r0, #PAGE_SZ add r0, r0, #PAGE_SZ
...@@ -67,7 +75,11 @@ ENTRY(v7wbi_flush_kern_tlb_range) ...@@ -67,7 +75,11 @@ ENTRY(v7wbi_flush_kern_tlb_range)
mov r0, r0, lsl #PAGE_SHIFT mov r0, r0, lsl #PAGE_SHIFT
mov r1, r1, lsl #PAGE_SHIFT mov r1, r1, lsl #PAGE_SHIFT
1: 1:
#ifdef CONFIG_ARM_ERRATA_720789
ALT_SMP(mcr p15, 0, r0, c8, c3, 3) @ TLB invalidate U MVA all ASID (shareable)
#else
ALT_SMP(mcr p15, 0, r0, c8, c3, 1) @ TLB invalidate U MVA (shareable) ALT_SMP(mcr p15, 0, r0, c8, c3, 1) @ TLB invalidate U MVA (shareable)
#endif
ALT_UP(mcr p15, 0, r0, c8, c7, 1) @ TLB invalidate U MVA ALT_UP(mcr p15, 0, r0, c8, c7, 1) @ TLB invalidate U MVA
add r0, r0, #PAGE_SZ add r0, r0, #PAGE_SZ
cmp r0, r1 cmp r0, r1
......
...@@ -7,18 +7,20 @@ ...@@ -7,18 +7,20 @@
* This program is free software; you can redistribute it and/or modify * This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License version 2 as * it under the terms of the GNU General Public License version 2 as
* published by the Free Software Foundation. * published by the Free Software Foundation.
*
* Basic entry code, called from the kernel's undefined instruction trap.
* r0 = faulted instruction
* r5 = faulted PC+4
* r9 = successful return
* r10 = thread_info structure
* lr = failure return
*/ */
#include <asm/thread_info.h> #include <asm/thread_info.h>
#include <asm/vfpmacros.h> #include <asm/vfpmacros.h>
#include "../kernel/entry-header.S" #include "../kernel/entry-header.S"
@ VFP entry point.
@
@ r0 = instruction opcode (32-bit ARM or two 16-bit Thumb)
@ r2 = PC value to resume execution after successful emulation
@ r9 = normal "successful" return address
@ r10 = this threads thread_info structure
@ lr = unrecognised instruction return address
@ IRQs disabled.
@
ENTRY(do_vfp) ENTRY(do_vfp)
#ifdef CONFIG_PREEMPT #ifdef CONFIG_PREEMPT
ldr r4, [r10, #TI_PREEMPT] @ get preempt count ldr r4, [r10, #TI_PREEMPT] @ get preempt count
......
...@@ -62,13 +62,13 @@ ...@@ -62,13 +62,13 @@
@ VFP hardware support entry point. @ VFP hardware support entry point.
@ @
@ r0 = faulted instruction @ r0 = instruction opcode (32-bit ARM or two 16-bit Thumb)
@ r2 = faulted PC+4 @ r2 = PC value to resume execution after successful emulation
@ r9 = successful return @ r9 = normal "successful" return address
@ r10 = vfp_state union @ r10 = vfp_state union
@ r11 = CPU number @ r11 = CPU number
@ lr = failure return @ lr = unrecognised instruction return address
@ IRQs enabled.
ENTRY(vfp_support_entry) ENTRY(vfp_support_entry)
DBGSTR3 "instr %08x pc %08x state %p", r0, r2, r10 DBGSTR3 "instr %08x pc %08x state %p", r0, r2, r10
...@@ -162,9 +162,12 @@ vfp_hw_state_valid: ...@@ -162,9 +162,12 @@ vfp_hw_state_valid:
@ exception before retrying branch @ exception before retrying branch
@ out before setting an FPEXC that @ out before setting an FPEXC that
@ stops us reading stuff @ stops us reading stuff
VFPFMXR FPEXC, r1 @ restore FPEXC last VFPFMXR FPEXC, r1 @ Restore FPEXC last
sub r2, r2, #4 sub r2, r2, #4 @ Retry current instruction - if Thumb
str r2, [sp, #S_PC] @ retry the instruction str r2, [sp, #S_PC] @ mode it's two 16-bit instructions,
@ else it's one 32-bit instruction, so
@ always subtract 4 from the following
@ instruction address.
#ifdef CONFIG_PREEMPT #ifdef CONFIG_PREEMPT
get_thread_info r10 get_thread_info r10
ldr r4, [r10, #TI_PREEMPT] @ get preempt count ldr r4, [r10, #TI_PREEMPT] @ get preempt count
......
...@@ -457,10 +457,16 @@ static int vfp_pm_suspend(void) ...@@ -457,10 +457,16 @@ static int vfp_pm_suspend(void)
/* disable, just in case */ /* disable, just in case */
fmxr(FPEXC, fmrx(FPEXC) & ~FPEXC_EN); fmxr(FPEXC, fmrx(FPEXC) & ~FPEXC_EN);
} else if (vfp_current_hw_state[ti->cpu]) {
#ifndef CONFIG_SMP
fmxr(FPEXC, fpexc | FPEXC_EN);
vfp_save_state(vfp_current_hw_state[ti->cpu], fpexc);
fmxr(FPEXC, fpexc);
#endif
} }
/* clear any information we had about last context state */ /* clear any information we had about last context state */
memset(vfp_current_hw_state, 0, sizeof(vfp_current_hw_state)); vfp_current_hw_state[ti->cpu] = NULL;
return 0; return 0;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment