Commit ec0f8d3f authored by Huacai Chen, committed by Ralf Baechle

MIPS: Loongson: Allow booting from any core

Offer a logical->physical core id mapping so that some physical cores
can be reserved via a mask. This allows booting from any core when core-0
has problems. Since the maximum number of cores supported by Loongson-3
is 16, the 32-bit cpu_startup_core_id can be split into a 16-bit
cpu_startup_core_id and a 16-bit reserved_cores_mask for compatibility.
Signed-off-by: Huacai Chen <chenhc@lemote.com>
Cc: John Crispin <john@phrozen.org>
Cc: Steven J. Hill <Steven.Hill@imgtec.com>
Cc: linux-mips@linux-mips.org
Cc: Fuxin Zhang <zhangfx@lemote.com>
Cc: Zhangjin Wu <wuzhangjin@gmail.com>
Patchwork: https://patchwork.linux-mips.org/patch/8323/
Signed-off-by: Ralf Baechle <ralf@linux-mips.org>
parent f490682a
...@@ -42,7 +42,8 @@ struct efi_cpuinfo_loongson { ...@@ -42,7 +42,8 @@ struct efi_cpuinfo_loongson {
u32 processor_id; /* PRID, e.g. 6305, 6306 */ u32 processor_id; /* PRID, e.g. 6305, 6306 */
u32 cputype; /* Loongson_3A/3B, etc. */ u32 cputype; /* Loongson_3A/3B, etc. */
u32 total_node; /* num of total numa nodes */ u32 total_node; /* num of total numa nodes */
u32 cpu_startup_core_id; /* Core id */ u16 cpu_startup_core_id; /* Boot core id */
u16 reserved_cores_mask;
u32 cpu_clock_freq; /* cpu_clock */ u32 cpu_clock_freq; /* cpu_clock */
u32 nr_cpus; u32 nr_cpus;
} __packed; } __packed;
...@@ -149,6 +150,8 @@ struct loongson_system_configuration { ...@@ -149,6 +150,8 @@ struct loongson_system_configuration {
u32 nr_nodes; u32 nr_nodes;
int cores_per_node; int cores_per_node;
int cores_per_package; int cores_per_package;
u16 boot_cpu_id;
u16 reserved_cpus_mask;
enum loongson_cpu_type cputype; enum loongson_cpu_type cputype;
u64 ht_control_base; u64 ht_control_base;
u64 pci_mem_start_addr; u64 pci_mem_start_addr;
......
...@@ -32,8 +32,7 @@ ...@@ -32,8 +32,7 @@
#define LOONGSON_INT_ROUTER_LPC LOONGSON_INT_ROUTER_ENTRY(0x0a) #define LOONGSON_INT_ROUTER_LPC LOONGSON_INT_ROUTER_ENTRY(0x0a)
#define LOONGSON_INT_ROUTER_HT1(n) LOONGSON_INT_ROUTER_ENTRY(n + 0x18) #define LOONGSON_INT_ROUTER_HT1(n) LOONGSON_INT_ROUTER_ENTRY(n + 0x18)
#define LOONGSON_INT_CORE0_INT0 0x11 /* route to int 0 of core 0 */ #define LOONGSON_INT_COREx_INTy(x, y) (1<<(x) | 1<<(y+4)) /* route to int y of core x */
#define LOONGSON_INT_CORE0_INT1 0x21 /* route to int 1 of core 0 */
#endif #endif
......
...@@ -3,7 +3,7 @@ ...@@ -3,7 +3,7 @@
#ifdef CONFIG_NUMA #ifdef CONFIG_NUMA
#define cpu_to_node(cpu) ((cpu) >> 2) #define cpu_to_node(cpu) (cpu_logical_map(cpu) >> 2)
#define parent_node(node) (node) #define parent_node(node) (node)
#define cpumask_of_node(node) (&__node_data[(node)]->cpumask) #define cpumask_of_node(node) (&__node_data[(node)]->cpumask)
......
...@@ -119,6 +119,8 @@ void __init prom_init_env(void) ...@@ -119,6 +119,8 @@ void __init prom_init_env(void)
} }
loongson_sysconf.nr_cpus = ecpu->nr_cpus; loongson_sysconf.nr_cpus = ecpu->nr_cpus;
loongson_sysconf.boot_cpu_id = ecpu->cpu_startup_core_id;
loongson_sysconf.reserved_cpus_mask = ecpu->reserved_cores_mask;
if (ecpu->nr_cpus > NR_CPUS || ecpu->nr_cpus == 0) if (ecpu->nr_cpus > NR_CPUS || ecpu->nr_cpus == 0)
loongson_sysconf.nr_cpus = NR_CPUS; loongson_sysconf.nr_cpus = NR_CPUS;
loongson_sysconf.nr_nodes = (loongson_sysconf.nr_cpus + loongson_sysconf.nr_nodes = (loongson_sysconf.nr_cpus +
......
...@@ -55,8 +55,8 @@ static inline void mask_loongson_irq(struct irq_data *d) ...@@ -55,8 +55,8 @@ static inline void mask_loongson_irq(struct irq_data *d)
/* Workaround: UART IRQ may deliver to any core */ /* Workaround: UART IRQ may deliver to any core */
if (d->irq == LOONGSON_UART_IRQ) { if (d->irq == LOONGSON_UART_IRQ) {
int cpu = smp_processor_id(); int cpu = smp_processor_id();
int node_id = cpu / loongson_sysconf.cores_per_node; int node_id = cpu_logical_map(cpu) / loongson_sysconf.cores_per_node;
int core_id = cpu % loongson_sysconf.cores_per_node; int core_id = cpu_logical_map(cpu) % loongson_sysconf.cores_per_node;
u64 intenclr_addr = smp_group[node_id] | u64 intenclr_addr = smp_group[node_id] |
(u64)(&LOONGSON_INT_ROUTER_INTENCLR); (u64)(&LOONGSON_INT_ROUTER_INTENCLR);
u64 introuter_lpc_addr = smp_group[node_id] | u64 introuter_lpc_addr = smp_group[node_id] |
...@@ -72,8 +72,8 @@ static inline void unmask_loongson_irq(struct irq_data *d) ...@@ -72,8 +72,8 @@ static inline void unmask_loongson_irq(struct irq_data *d)
/* Workaround: UART IRQ may deliver to any core */ /* Workaround: UART IRQ may deliver to any core */
if (d->irq == LOONGSON_UART_IRQ) { if (d->irq == LOONGSON_UART_IRQ) {
int cpu = smp_processor_id(); int cpu = smp_processor_id();
int node_id = cpu / loongson_sysconf.cores_per_node; int node_id = cpu_logical_map(cpu) / loongson_sysconf.cores_per_node;
int core_id = cpu % loongson_sysconf.cores_per_node; int core_id = cpu_logical_map(cpu) % loongson_sysconf.cores_per_node;
u64 intenset_addr = smp_group[node_id] | u64 intenset_addr = smp_group[node_id] |
(u64)(&LOONGSON_INT_ROUTER_INTENSET); (u64)(&LOONGSON_INT_ROUTER_INTENSET);
u64 introuter_lpc_addr = smp_group[node_id] | u64 introuter_lpc_addr = smp_group[node_id] |
...@@ -102,10 +102,12 @@ void irq_router_init(void) ...@@ -102,10 +102,12 @@ void irq_router_init(void)
int i; int i;
/* route LPC int to cpu core0 int 0 */ /* route LPC int to cpu core0 int 0 */
LOONGSON_INT_ROUTER_LPC = LOONGSON_INT_CORE0_INT0; LOONGSON_INT_ROUTER_LPC =
LOONGSON_INT_COREx_INTy(loongson_sysconf.boot_cpu_id, 0);
/* route HT1 int0 ~ int7 to cpu core0 INT1*/ /* route HT1 int0 ~ int7 to cpu core0 INT1*/
for (i = 0; i < 8; i++) for (i = 0; i < 8; i++)
LOONGSON_INT_ROUTER_HT1(i) = LOONGSON_INT_CORE0_INT1; LOONGSON_INT_ROUTER_HT1(i) =
LOONGSON_INT_COREx_INTy(loongson_sysconf.boot_cpu_id, 1);
/* enable HT1 interrupt */ /* enable HT1 interrupt */
LOONGSON_HT1_INTN_EN(0) = 0xffffffff; LOONGSON_HT1_INTN_EN(0) = 0xffffffff;
/* enable router interrupt intenset */ /* enable router interrupt intenset */
......
...@@ -224,7 +224,7 @@ static void __init node_mem_init(unsigned int node) ...@@ -224,7 +224,7 @@ static void __init node_mem_init(unsigned int node)
static __init void prom_meminit(void) static __init void prom_meminit(void)
{ {
unsigned int node, cpu; unsigned int node, cpu, active_cpu = 0;
cpu_node_probe(); cpu_node_probe();
init_topology_matrix(); init_topology_matrix();
...@@ -240,8 +240,14 @@ static __init void prom_meminit(void) ...@@ -240,8 +240,14 @@ static __init void prom_meminit(void)
node = cpu / loongson_sysconf.cores_per_node; node = cpu / loongson_sysconf.cores_per_node;
if (node >= num_online_nodes()) if (node >= num_online_nodes())
node = 0; node = 0;
pr_info("NUMA: set cpumask cpu %d on node %d\n", cpu, node);
cpu_set(cpu, __node_data[(node)]->cpumask); if (loongson_sysconf.reserved_cpus_mask & (1<<cpu))
continue;
cpu_set(active_cpu, __node_data[(node)]->cpumask);
pr_info("NUMA: set cpumask cpu %d on node %d\n", active_cpu, node);
active_cpu++;
} }
} }
......
...@@ -239,7 +239,7 @@ static void ipi_mailbox_buf_init(void) ...@@ -239,7 +239,7 @@ static void ipi_mailbox_buf_init(void)
*/ */
static void loongson3_send_ipi_single(int cpu, unsigned int action) static void loongson3_send_ipi_single(int cpu, unsigned int action)
{ {
loongson3_ipi_write32((u32)action, ipi_set0_regs[cpu]); loongson3_ipi_write32((u32)action, ipi_set0_regs[cpu_logical_map(cpu)]);
} }
static void static void
...@@ -248,7 +248,7 @@ loongson3_send_ipi_mask(const struct cpumask *mask, unsigned int action) ...@@ -248,7 +248,7 @@ loongson3_send_ipi_mask(const struct cpumask *mask, unsigned int action)
unsigned int i; unsigned int i;
for_each_cpu(i, mask) for_each_cpu(i, mask)
loongson3_ipi_write32((u32)action, ipi_set0_regs[i]); loongson3_ipi_write32((u32)action, ipi_set0_regs[cpu_logical_map(i)]);
} }
void loongson3_ipi_interrupt(struct pt_regs *regs) void loongson3_ipi_interrupt(struct pt_regs *regs)
...@@ -257,10 +257,10 @@ void loongson3_ipi_interrupt(struct pt_regs *regs) ...@@ -257,10 +257,10 @@ void loongson3_ipi_interrupt(struct pt_regs *regs)
unsigned int action, c0count; unsigned int action, c0count;
/* Load the ipi register to figure out what we're supposed to do */ /* Load the ipi register to figure out what we're supposed to do */
action = loongson3_ipi_read32(ipi_status0_regs[cpu]); action = loongson3_ipi_read32(ipi_status0_regs[cpu_logical_map(cpu)]);
/* Clear the ipi register to clear the interrupt */ /* Clear the ipi register to clear the interrupt */
loongson3_ipi_write32((u32)action, ipi_clear0_regs[cpu]); loongson3_ipi_write32((u32)action, ipi_clear0_regs[cpu_logical_map(cpu)]);
if (action & SMP_RESCHEDULE_YOURSELF) if (action & SMP_RESCHEDULE_YOURSELF)
scheduler_ipi(); scheduler_ipi();
...@@ -291,12 +291,14 @@ static void loongson3_init_secondary(void) ...@@ -291,12 +291,14 @@ static void loongson3_init_secondary(void)
/* Set interrupt mask, but don't enable */ /* Set interrupt mask, but don't enable */
change_c0_status(ST0_IM, imask); change_c0_status(ST0_IM, imask);
for (i = 0; i < loongson_sysconf.nr_cpus; i++) for (i = 0; i < num_possible_cpus(); i++)
loongson3_ipi_write32(0xffffffff, ipi_en0_regs[i]); loongson3_ipi_write32(0xffffffff, ipi_en0_regs[cpu_logical_map(i)]);
cpu_data[cpu].package = cpu / loongson_sysconf.cores_per_package;
cpu_data[cpu].core = cpu % loongson_sysconf.cores_per_package;
per_cpu(cpu_state, cpu) = CPU_ONLINE; per_cpu(cpu_state, cpu) = CPU_ONLINE;
cpu_data[cpu].core =
cpu_logical_map(cpu) % loongson_sysconf.cores_per_package;
cpu_data[cpu].package =
cpu_logical_map(cpu) / loongson_sysconf.cores_per_package;
i = 0; i = 0;
__this_cpu_write(core0_c0count, 0); __this_cpu_write(core0_c0count, 0);
...@@ -314,37 +316,50 @@ static void loongson3_init_secondary(void) ...@@ -314,37 +316,50 @@ static void loongson3_init_secondary(void)
static void loongson3_smp_finish(void) static void loongson3_smp_finish(void)
{ {
int cpu = smp_processor_id();
write_c0_compare(read_c0_count() + mips_hpt_frequency/HZ); write_c0_compare(read_c0_count() + mips_hpt_frequency/HZ);
local_irq_enable(); local_irq_enable();
loongson3_ipi_write64(0, loongson3_ipi_write64(0,
(void *)(ipi_mailbox_buf[smp_processor_id()]+0x0)); (void *)(ipi_mailbox_buf[cpu_logical_map(cpu)]+0x0));
pr_info("CPU#%d finished, CP0_ST=%x\n", pr_info("CPU#%d finished, CP0_ST=%x\n",
smp_processor_id(), read_c0_status()); smp_processor_id(), read_c0_status());
} }
static void __init loongson3_smp_setup(void) static void __init loongson3_smp_setup(void)
{ {
int i, num; int i = 0, num = 0; /* i: physical id, num: logical id */
init_cpu_possible(cpu_none_mask); init_cpu_possible(cpu_none_mask);
set_cpu_possible(0, true);
__cpu_number_map[0] = 0;
__cpu_logical_map[0] = 0;
/* For unified kernel, NR_CPUS is the maximum possible value, /* For unified kernel, NR_CPUS is the maximum possible value,
* loongson_sysconf.nr_cpus is the really present value */ * loongson_sysconf.nr_cpus is the really present value */
for (i = 1, num = 0; i < loongson_sysconf.nr_cpus; i++) { while (i < loongson_sysconf.nr_cpus) {
set_cpu_possible(i, true); if (loongson_sysconf.reserved_cpus_mask & (1<<i)) {
__cpu_number_map[i] = ++num; /* Reserved physical CPU cores */
__cpu_number_map[i] = -1;
} else {
__cpu_number_map[i] = num;
__cpu_logical_map[num] = i; __cpu_logical_map[num] = i;
set_cpu_possible(num, true);
num++;
}
i++;
} }
pr_info("Detected %i available CPU(s)\n", num);
while (num < loongson_sysconf.nr_cpus) {
__cpu_logical_map[num] = -1;
num++;
}
ipi_set0_regs_init(); ipi_set0_regs_init();
ipi_clear0_regs_init(); ipi_clear0_regs_init();
ipi_status0_regs_init(); ipi_status0_regs_init();
ipi_en0_regs_init(); ipi_en0_regs_init();
ipi_mailbox_buf_init(); ipi_mailbox_buf_init();
pr_info("Detected %i available secondary CPU(s)\n", num); cpu_data[0].core = cpu_logical_map(0) % loongson_sysconf.cores_per_package;
cpu_data[0].package = cpu_logical_map(0) / loongson_sysconf.cores_per_package;
} }
static void __init loongson3_prepare_cpus(unsigned int max_cpus) static void __init loongson3_prepare_cpus(unsigned int max_cpus)
...@@ -371,10 +386,14 @@ static void loongson3_boot_secondary(int cpu, struct task_struct *idle) ...@@ -371,10 +386,14 @@ static void loongson3_boot_secondary(int cpu, struct task_struct *idle)
pr_debug("CPU#%d, func_pc=%lx, sp=%lx, gp=%lx\n", pr_debug("CPU#%d, func_pc=%lx, sp=%lx, gp=%lx\n",
cpu, startargs[0], startargs[1], startargs[2]); cpu, startargs[0], startargs[1], startargs[2]);
loongson3_ipi_write64(startargs[3], (void *)(ipi_mailbox_buf[cpu]+0x18)); loongson3_ipi_write64(startargs[3],
loongson3_ipi_write64(startargs[2], (void *)(ipi_mailbox_buf[cpu]+0x10)); (void *)(ipi_mailbox_buf[cpu_logical_map(cpu)]+0x18));
loongson3_ipi_write64(startargs[1], (void *)(ipi_mailbox_buf[cpu]+0x8)); loongson3_ipi_write64(startargs[2],
loongson3_ipi_write64(startargs[0], (void *)(ipi_mailbox_buf[cpu]+0x0)); (void *)(ipi_mailbox_buf[cpu_logical_map(cpu)]+0x10));
loongson3_ipi_write64(startargs[1],
(void *)(ipi_mailbox_buf[cpu_logical_map(cpu)]+0x8));
loongson3_ipi_write64(startargs[0],
(void *)(ipi_mailbox_buf[cpu_logical_map(cpu)]+0x0));
} }
#ifdef CONFIG_HOTPLUG_CPU #ifdef CONFIG_HOTPLUG_CPU
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment