Commit 2196c6f1, authored by Vasant Hegde, committed by Benjamin Herrenschmidt

powerpc/powernv: Return secondary CPUs to firmware before FW update

Firmware update on PowerNV platform takes several minutes. During
this time one CPU is stuck in FW and the kernel complains about "soft
lockups".

This patch returns all secondary CPUs to firmware before starting
firmware update process.

[ Reworked a bit and cleaned up -- BenH ]
Signed-off-by: Vasant Hegde <hegdevasant@linux.vnet.ibm.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
parent 654837e8
...@@ -916,6 +916,7 @@ extern void opal_get_rtc_time(struct rtc_time *tm); ...@@ -916,6 +916,7 @@ extern void opal_get_rtc_time(struct rtc_time *tm);
extern unsigned long opal_get_boot_time(void); extern unsigned long opal_get_boot_time(void);
extern void opal_nvram_init(void); extern void opal_nvram_init(void);
extern void opal_flash_init(void); extern void opal_flash_init(void);
extern void opal_flash_term_callback(void);
extern int opal_elog_init(void); extern int opal_elog_init(void);
extern void opal_platform_dump_init(void); extern void opal_platform_dump_init(void);
extern void opal_sys_param_init(void); extern void opal_sys_param_init(void);
......
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#include <linux/mm.h> #include <linux/mm.h>
#include <linux/vmalloc.h> #include <linux/vmalloc.h>
#include <linux/pagemap.h> #include <linux/pagemap.h>
#include <linux/delay.h>
#include <asm/opal.h> #include <asm/opal.h>
...@@ -290,11 +291,6 @@ static int opal_flash_update(int op) ...@@ -290,11 +291,6 @@ static int opal_flash_update(int op)
/* First entry address */ /* First entry address */
addr = __pa(list); addr = __pa(list);
pr_alert("FLASH: Image is %u bytes\n", image_data.size);
pr_alert("FLASH: Image update requested\n");
pr_alert("FLASH: Image will be updated during system reboot\n");
pr_alert("FLASH: This will take several minutes. Do not power off!\n");
flash: flash:
rc = opal_update_flash(addr); rc = opal_update_flash(addr);
...@@ -302,6 +298,47 @@ static int opal_flash_update(int op) ...@@ -302,6 +298,47 @@ static int opal_flash_update(int op)
return rc; return rc;
} }
/*
 * Cross-call handler used ahead of a firmware update: hands the CPU it
 * runs on back to OPAL.
 *
 * @info: unused; present only to match the cross-call handler signature.
 *
 * A CPU that is not marked online is left untouched.
 */
static void flash_return_cpu(void *info)
{
	if (cpu_online(smp_processor_id())) {
		/* Hard disable interrupts on this CPU before leaving the kernel */
		hard_irq_disable();

		/* Give this CPU back to OPAL */
		opal_return_cpu();
	}
}
/*
 * Announce a pending firmware flash and return the secondary CPUs to OPAL.
 *
 * This gets called just before the system reboots or powers off (see
 * pnv_prepare_going_down()). It is a no-op unless update_flash_data.status
 * is FLASH_IMG_READY.
 *
 * When an update is pending, every other online CPU is asked to run
 * flash_return_cpu() and interrupts are hard disabled on the calling CPU
 * before returning.
 */
void opal_flash_term_callback(void)
{
	struct cpumask mask;

	if (update_flash_data.status != FLASH_IMG_READY)
		return;

	pr_alert("FLASH: Flashing new firmware\n");
	pr_alert("FLASH: Image is %u bytes\n", image_data.size);
	pr_alert("FLASH: Performing flash and reboot/shutdown\n");
	pr_alert("FLASH: This will take several minutes. Do not power off!\n");

	/*
	 * Small delay to help getting the above message out.
	 *
	 * The caller has already done local_irq_disable(), so we must not
	 * sleep here: busy-wait with mdelay() instead of msleep().
	 */
	mdelay(500);

	/*
	 * Return secondary CPUs to firmware: target every online CPU except
	 * the one we are running on.
	 *
	 * NOTE(review): smp_call_function_many() is documented as not to be
	 * called with interrupts disabled, yet the caller disables them
	 * before invoking us -- confirm this is acceptable on this path or
	 * reorder the caller.
	 */
	cpumask_copy(&mask, cpu_online_mask);
	cpumask_clear_cpu(smp_processor_id(), &mask);
	if (!cpumask_empty(&mask))
		smp_call_function_many(&mask, flash_return_cpu, NULL, false);

	/* Hard disable interrupts */
	hard_irq_disable();
}
/* /*
* Show candidate image status * Show candidate image status
*/ */
......
...@@ -98,11 +98,32 @@ static void pnv_show_cpuinfo(struct seq_file *m) ...@@ -98,11 +98,32 @@ static void pnv_show_cpuinfo(struct seq_file *m)
of_node_put(root); of_node_put(root);
} }
/*
 * Common preparation shared by pnv_restart() and pnv_power_off(), run
 * before the reboot/power-down request is issued to OPAL.
 *
 * The order of the three steps below matters: notifiers are disabled
 * first, then interrupts are soft disabled, and only then is the flash
 * termination callback invoked.
 */
static void pnv_prepare_going_down(void)
{
/*
 * Disable all notifiers from OPAL; we can't
 * service interrupts anymore anyway.
 */
opal_notifier_disable();
/* Soft disable interrupts */
local_irq_disable();
/*
 * Return secondary CPUs to firmware if a flash update
 * is pending, otherwise we will get all sorts of error
 * messages about CPUs being stuck etc. When an update is
 * pending this also has the side effect of hard disabling
 * interrupts, so past this point the kernel is effectively
 * dead.
 */
opal_flash_term_callback();
}
static void __noreturn pnv_restart(char *cmd) static void __noreturn pnv_restart(char *cmd)
{ {
long rc = OPAL_BUSY; long rc = OPAL_BUSY;
opal_notifier_disable(); pnv_prepare_going_down();
while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) { while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
rc = opal_cec_reboot(); rc = opal_cec_reboot();
...@@ -119,7 +140,7 @@ static void __noreturn pnv_power_off(void) ...@@ -119,7 +140,7 @@ static void __noreturn pnv_power_off(void)
{ {
long rc = OPAL_BUSY; long rc = OPAL_BUSY;
opal_notifier_disable(); pnv_prepare_going_down();
while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) { while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
rc = opal_cec_power_down(0); rc = opal_cec_power_down(0);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment