162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * SMP support for pSeries machines. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Dave Engebretsen, Peter Bergner, and 662306a36Sopenharmony_ci * Mike Corrigan {engebret|bergner|mikec}@us.ibm.com 762306a36Sopenharmony_ci * 862306a36Sopenharmony_ci * Plus various changes from other IBM teams... 962306a36Sopenharmony_ci */ 1062306a36Sopenharmony_ci 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include <linux/kernel.h> 1362306a36Sopenharmony_ci#include <linux/sched.h> 1462306a36Sopenharmony_ci#include <linux/smp.h> 1562306a36Sopenharmony_ci#include <linux/interrupt.h> 1662306a36Sopenharmony_ci#include <linux/delay.h> 1762306a36Sopenharmony_ci#include <linux/init.h> 1862306a36Sopenharmony_ci#include <linux/spinlock.h> 1962306a36Sopenharmony_ci#include <linux/cache.h> 2062306a36Sopenharmony_ci#include <linux/err.h> 2162306a36Sopenharmony_ci#include <linux/device.h> 2262306a36Sopenharmony_ci#include <linux/cpu.h> 2362306a36Sopenharmony_ci#include <linux/pgtable.h> 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci#include <asm/ptrace.h> 2662306a36Sopenharmony_ci#include <linux/atomic.h> 2762306a36Sopenharmony_ci#include <asm/irq.h> 2862306a36Sopenharmony_ci#include <asm/page.h> 2962306a36Sopenharmony_ci#include <asm/io.h> 3062306a36Sopenharmony_ci#include <asm/smp.h> 3162306a36Sopenharmony_ci#include <asm/paca.h> 3262306a36Sopenharmony_ci#include <asm/machdep.h> 3362306a36Sopenharmony_ci#include <asm/cputable.h> 3462306a36Sopenharmony_ci#include <asm/firmware.h> 3562306a36Sopenharmony_ci#include <asm/rtas.h> 3662306a36Sopenharmony_ci#include <asm/vdso_datapage.h> 3762306a36Sopenharmony_ci#include <asm/cputhreads.h> 3862306a36Sopenharmony_ci#include <asm/xics.h> 3962306a36Sopenharmony_ci#include <asm/xive.h> 4062306a36Sopenharmony_ci#include <asm/dbell.h> 4162306a36Sopenharmony_ci#include <asm/plpar_wrappers.h> 4262306a36Sopenharmony_ci#include <asm/code-patching.h> 4362306a36Sopenharmony_ci#include <asm/svm.h> 4462306a36Sopenharmony_ci#include <asm/kvm_guest.h> 4562306a36Sopenharmony_ci 4662306a36Sopenharmony_ci#include "pseries.h" 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci/* 4962306a36Sopenharmony_ci * The Primary thread of each non-boot processor was started from the OF client 5062306a36Sopenharmony_ci * interface by prom_hold_cpus and is spinning on secondary_hold_spinloop. 5162306a36Sopenharmony_ci */ 5262306a36Sopenharmony_cistatic cpumask_var_t of_spin_mask; 5362306a36Sopenharmony_ci 5462306a36Sopenharmony_ci/* Query where a cpu is now. Return codes #defined in plpar_wrappers.h */ 5562306a36Sopenharmony_ciint smp_query_cpu_stopped(unsigned int pcpu) 5662306a36Sopenharmony_ci{ 5762306a36Sopenharmony_ci int cpu_status, status; 5862306a36Sopenharmony_ci int qcss_tok = rtas_function_token(RTAS_FN_QUERY_CPU_STOPPED_STATE); 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ci if (qcss_tok == RTAS_UNKNOWN_SERVICE) { 6162306a36Sopenharmony_ci printk_once(KERN_INFO 6262306a36Sopenharmony_ci "Firmware doesn't support query-cpu-stopped-state\n"); 6362306a36Sopenharmony_ci return QCSS_HARDWARE_ERROR; 6462306a36Sopenharmony_ci } 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_ci status = rtas_call(qcss_tok, 1, 2, &cpu_status, pcpu); 6762306a36Sopenharmony_ci if (status != 0) { 6862306a36Sopenharmony_ci printk(KERN_ERR 6962306a36Sopenharmony_ci "RTAS query-cpu-stopped-state failed: %i\n", status); 7062306a36Sopenharmony_ci return status; 7162306a36Sopenharmony_ci } 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci return cpu_status; 7462306a36Sopenharmony_ci} 7562306a36Sopenharmony_ci 7662306a36Sopenharmony_ci/** 7762306a36Sopenharmony_ci * smp_startup_cpu() - start the given cpu 7862306a36Sopenharmony_ci * 7962306a36Sopenharmony_ci * At boot time, there is nothing to do for primary threads which were 8062306a36Sopenharmony_ci * started from Open Firmware. For anything else, call RTAS with the 8162306a36Sopenharmony_ci * appropriate start location. 8262306a36Sopenharmony_ci * 8362306a36Sopenharmony_ci * Returns: 8462306a36Sopenharmony_ci * 0 - failure 8562306a36Sopenharmony_ci * 1 - success 8662306a36Sopenharmony_ci */ 8762306a36Sopenharmony_cistatic inline int smp_startup_cpu(unsigned int lcpu) 8862306a36Sopenharmony_ci{ 8962306a36Sopenharmony_ci int status; 9062306a36Sopenharmony_ci unsigned long start_here = 9162306a36Sopenharmony_ci __pa(ppc_function_entry(generic_secondary_smp_init)); 9262306a36Sopenharmony_ci unsigned int pcpu; 9362306a36Sopenharmony_ci int start_cpu; 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci if (cpumask_test_cpu(lcpu, of_spin_mask)) 9662306a36Sopenharmony_ci /* Already started by OF and sitting in spin loop */ 9762306a36Sopenharmony_ci return 1; 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci pcpu = get_hard_smp_processor_id(lcpu); 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_ci /* Check to see if the CPU out of FW already for kexec */ 10262306a36Sopenharmony_ci if (smp_query_cpu_stopped(pcpu) == QCSS_NOT_STOPPED){ 10362306a36Sopenharmony_ci cpumask_set_cpu(lcpu, of_spin_mask); 10462306a36Sopenharmony_ci return 1; 10562306a36Sopenharmony_ci } 10662306a36Sopenharmony_ci 10762306a36Sopenharmony_ci /* 10862306a36Sopenharmony_ci * If the RTAS start-cpu token does not exist then presume the 10962306a36Sopenharmony_ci * cpu is already spinning. 11062306a36Sopenharmony_ci */ 11162306a36Sopenharmony_ci start_cpu = rtas_function_token(RTAS_FN_START_CPU); 11262306a36Sopenharmony_ci if (start_cpu == RTAS_UNKNOWN_SERVICE) 11362306a36Sopenharmony_ci return 1; 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_ci status = rtas_call(start_cpu, 3, 1, NULL, pcpu, start_here, pcpu); 11662306a36Sopenharmony_ci if (status != 0) { 11762306a36Sopenharmony_ci printk(KERN_ERR "start-cpu failed: %i\n", status); 11862306a36Sopenharmony_ci return 0; 11962306a36Sopenharmony_ci } 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_ci return 1; 12262306a36Sopenharmony_ci} 12362306a36Sopenharmony_ci 12462306a36Sopenharmony_cistatic void smp_setup_cpu(int cpu) 12562306a36Sopenharmony_ci{ 12662306a36Sopenharmony_ci if (xive_enabled()) 12762306a36Sopenharmony_ci xive_smp_setup_cpu(); 12862306a36Sopenharmony_ci else if (cpu != boot_cpuid) 12962306a36Sopenharmony_ci xics_setup_cpu(); 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci if (firmware_has_feature(FW_FEATURE_SPLPAR)) 13262306a36Sopenharmony_ci vpa_init(cpu); 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_ci cpumask_clear_cpu(cpu, of_spin_mask); 13562306a36Sopenharmony_ci} 13662306a36Sopenharmony_ci 13762306a36Sopenharmony_cistatic int smp_pSeries_kick_cpu(int nr) 13862306a36Sopenharmony_ci{ 13962306a36Sopenharmony_ci if (nr < 0 || nr >= nr_cpu_ids) 14062306a36Sopenharmony_ci return -EINVAL; 14162306a36Sopenharmony_ci 14262306a36Sopenharmony_ci if (!smp_startup_cpu(nr)) 14362306a36Sopenharmony_ci return -ENOENT; 14462306a36Sopenharmony_ci 14562306a36Sopenharmony_ci /* 14662306a36Sopenharmony_ci * The processor is currently spinning, waiting for the 14762306a36Sopenharmony_ci * cpu_start field to become non-zero After we set cpu_start, 14862306a36Sopenharmony_ci * the processor will continue on to secondary_start 14962306a36Sopenharmony_ci */ 15062306a36Sopenharmony_ci paca_ptrs[nr]->cpu_start = 1; 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci return 0; 15362306a36Sopenharmony_ci} 15462306a36Sopenharmony_ci 15562306a36Sopenharmony_cistatic int pseries_smp_prepare_cpu(int cpu) 15662306a36Sopenharmony_ci{ 15762306a36Sopenharmony_ci if (xive_enabled()) 15862306a36Sopenharmony_ci return xive_smp_prepare_cpu(cpu); 15962306a36Sopenharmony_ci return 0; 16062306a36Sopenharmony_ci} 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci/* Cause IPI as setup by the interrupt controller (xics or xive) */ 16362306a36Sopenharmony_cistatic void (*ic_cause_ipi)(int cpu) __ro_after_init; 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci/* Use msgsndp doorbells target is a sibling, else use interrupt controller */ 16662306a36Sopenharmony_cistatic void dbell_or_ic_cause_ipi(int cpu) 16762306a36Sopenharmony_ci{ 16862306a36Sopenharmony_ci if (doorbell_try_core_ipi(cpu)) 16962306a36Sopenharmony_ci return; 17062306a36Sopenharmony_ci 17162306a36Sopenharmony_ci ic_cause_ipi(cpu); 17262306a36Sopenharmony_ci} 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_cistatic int pseries_cause_nmi_ipi(int cpu) 17562306a36Sopenharmony_ci{ 17662306a36Sopenharmony_ci int hwcpu; 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci if (cpu == NMI_IPI_ALL_OTHERS) { 17962306a36Sopenharmony_ci hwcpu = H_SIGNAL_SYS_RESET_ALL_OTHERS; 18062306a36Sopenharmony_ci } else { 18162306a36Sopenharmony_ci if (cpu < 0) { 18262306a36Sopenharmony_ci WARN_ONCE(true, "incorrect cpu parameter %d", cpu); 18362306a36Sopenharmony_ci return 0; 18462306a36Sopenharmony_ci } 18562306a36Sopenharmony_ci 18662306a36Sopenharmony_ci hwcpu = get_hard_smp_processor_id(cpu); 18762306a36Sopenharmony_ci } 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci if (plpar_signal_sys_reset(hwcpu) == H_SUCCESS) 19062306a36Sopenharmony_ci return 1; 19162306a36Sopenharmony_ci 19262306a36Sopenharmony_ci return 0; 19362306a36Sopenharmony_ci} 19462306a36Sopenharmony_ci 19562306a36Sopenharmony_cistatic __init void pSeries_smp_probe(void) 19662306a36Sopenharmony_ci{ 19762306a36Sopenharmony_ci if (xive_enabled()) 19862306a36Sopenharmony_ci xive_smp_probe(); 19962306a36Sopenharmony_ci else 20062306a36Sopenharmony_ci xics_smp_probe(); 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ci /* No doorbell facility, must use the interrupt controller for IPIs */ 20362306a36Sopenharmony_ci if (!cpu_has_feature(CPU_FTR_DBELL)) 20462306a36Sopenharmony_ci return; 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_ci /* Doorbells can only be used for IPIs between SMT siblings */ 20762306a36Sopenharmony_ci if (!cpu_has_feature(CPU_FTR_SMT)) 20862306a36Sopenharmony_ci return; 20962306a36Sopenharmony_ci 21062306a36Sopenharmony_ci check_kvm_guest(); 21162306a36Sopenharmony_ci 21262306a36Sopenharmony_ci if (is_kvm_guest()) { 21362306a36Sopenharmony_ci /* 21462306a36Sopenharmony_ci * KVM emulates doorbells by disabling FSCR[MSGP] so msgsndp 21562306a36Sopenharmony_ci * faults to the hypervisor which then reads the instruction 21662306a36Sopenharmony_ci * from guest memory, which tends to be slower than using XIVE. 21762306a36Sopenharmony_ci */ 21862306a36Sopenharmony_ci if (xive_enabled()) 21962306a36Sopenharmony_ci return; 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci /* 22262306a36Sopenharmony_ci * XICS hcalls aren't as fast, so we can use msgsndp (which 22362306a36Sopenharmony_ci * also helps exercise KVM emulation), however KVM can't 22462306a36Sopenharmony_ci * emulate secure guests because it can't read the instruction 22562306a36Sopenharmony_ci * out of their memory. 22662306a36Sopenharmony_ci */ 22762306a36Sopenharmony_ci if (is_secure_guest()) 22862306a36Sopenharmony_ci return; 22962306a36Sopenharmony_ci } 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci /* 23262306a36Sopenharmony_ci * Under PowerVM, FSCR[MSGP] is enabled as guest vCPU siblings are 23362306a36Sopenharmony_ci * gang scheduled on the same physical core, so doorbells are always 23462306a36Sopenharmony_ci * faster than the interrupt controller, and they can be used by 23562306a36Sopenharmony_ci * secure guests. 23662306a36Sopenharmony_ci */ 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_ci ic_cause_ipi = smp_ops->cause_ipi; 23962306a36Sopenharmony_ci smp_ops->cause_ipi = dbell_or_ic_cause_ipi; 24062306a36Sopenharmony_ci} 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_cistatic struct smp_ops_t pseries_smp_ops = { 24362306a36Sopenharmony_ci .message_pass = NULL, /* Use smp_muxed_ipi_message_pass */ 24462306a36Sopenharmony_ci .cause_ipi = NULL, /* Filled at runtime by pSeries_smp_probe() */ 24562306a36Sopenharmony_ci .cause_nmi_ipi = pseries_cause_nmi_ipi, 24662306a36Sopenharmony_ci .probe = pSeries_smp_probe, 24762306a36Sopenharmony_ci .prepare_cpu = pseries_smp_prepare_cpu, 24862306a36Sopenharmony_ci .kick_cpu = smp_pSeries_kick_cpu, 24962306a36Sopenharmony_ci .setup_cpu = smp_setup_cpu, 25062306a36Sopenharmony_ci .cpu_bootable = smp_generic_cpu_bootable, 25162306a36Sopenharmony_ci}; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci/* This is called very early */ 25462306a36Sopenharmony_civoid __init smp_init_pseries(void) 25562306a36Sopenharmony_ci{ 25662306a36Sopenharmony_ci int i; 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_ci pr_debug(" -> smp_init_pSeries()\n"); 25962306a36Sopenharmony_ci smp_ops = &pseries_smp_ops; 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci alloc_bootmem_cpumask_var(&of_spin_mask); 26262306a36Sopenharmony_ci 26362306a36Sopenharmony_ci /* 26462306a36Sopenharmony_ci * Mark threads which are still spinning in hold loops 26562306a36Sopenharmony_ci * 26662306a36Sopenharmony_ci * We know prom_init will not have started them if RTAS supports 26762306a36Sopenharmony_ci * query-cpu-stopped-state. 26862306a36Sopenharmony_ci */ 26962306a36Sopenharmony_ci if (rtas_function_token(RTAS_FN_QUERY_CPU_STOPPED_STATE) == RTAS_UNKNOWN_SERVICE) { 27062306a36Sopenharmony_ci if (cpu_has_feature(CPU_FTR_SMT)) { 27162306a36Sopenharmony_ci for_each_present_cpu(i) { 27262306a36Sopenharmony_ci if (cpu_thread_in_core(i) == 0) 27362306a36Sopenharmony_ci cpumask_set_cpu(i, of_spin_mask); 27462306a36Sopenharmony_ci } 27562306a36Sopenharmony_ci } else 27662306a36Sopenharmony_ci cpumask_copy(of_spin_mask, cpu_present_mask); 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci cpumask_clear_cpu(boot_cpuid, of_spin_mask); 27962306a36Sopenharmony_ci } 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_ci pr_debug(" <- smp_init_pSeries()\n"); 28262306a36Sopenharmony_ci} 283