18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci * PowerNV setup code.
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Copyright 2011 IBM Corp.
68c2ecf20Sopenharmony_ci */
78c2ecf20Sopenharmony_ci
88c2ecf20Sopenharmony_ci#undef DEBUG
98c2ecf20Sopenharmony_ci
108c2ecf20Sopenharmony_ci#include <linux/cpu.h>
118c2ecf20Sopenharmony_ci#include <linux/errno.h>
128c2ecf20Sopenharmony_ci#include <linux/sched.h>
138c2ecf20Sopenharmony_ci#include <linux/kernel.h>
148c2ecf20Sopenharmony_ci#include <linux/tty.h>
158c2ecf20Sopenharmony_ci#include <linux/reboot.h>
168c2ecf20Sopenharmony_ci#include <linux/init.h>
178c2ecf20Sopenharmony_ci#include <linux/console.h>
188c2ecf20Sopenharmony_ci#include <linux/delay.h>
198c2ecf20Sopenharmony_ci#include <linux/irq.h>
208c2ecf20Sopenharmony_ci#include <linux/seq_file.h>
218c2ecf20Sopenharmony_ci#include <linux/of.h>
228c2ecf20Sopenharmony_ci#include <linux/of_fdt.h>
238c2ecf20Sopenharmony_ci#include <linux/interrupt.h>
248c2ecf20Sopenharmony_ci#include <linux/bug.h>
258c2ecf20Sopenharmony_ci#include <linux/pci.h>
268c2ecf20Sopenharmony_ci#include <linux/cpufreq.h>
278c2ecf20Sopenharmony_ci#include <linux/memblock.h>
288c2ecf20Sopenharmony_ci
298c2ecf20Sopenharmony_ci#include <asm/machdep.h>
308c2ecf20Sopenharmony_ci#include <asm/firmware.h>
318c2ecf20Sopenharmony_ci#include <asm/xics.h>
328c2ecf20Sopenharmony_ci#include <asm/xive.h>
338c2ecf20Sopenharmony_ci#include <asm/opal.h>
348c2ecf20Sopenharmony_ci#include <asm/kexec.h>
358c2ecf20Sopenharmony_ci#include <asm/smp.h>
368c2ecf20Sopenharmony_ci#include <asm/tm.h>
378c2ecf20Sopenharmony_ci#include <asm/setup.h>
388c2ecf20Sopenharmony_ci#include <asm/security_features.h>
398c2ecf20Sopenharmony_ci
408c2ecf20Sopenharmony_ci#include "powernv.h"
418c2ecf20Sopenharmony_ci
428c2ecf20Sopenharmony_ci
/*
 * Report whether the child node called @name under @fw_features carries
 * the boolean property @state.
 *
 * Returns false when @fw_features has no child with that name.
 */
static bool fw_feature_is(const char *state, const char *name,
			  struct device_node *fw_features)
{
	struct device_node *child;
	bool present;

	child = of_get_child_by_name(fw_features, name);
	if (!child)
		return false;

	present = of_property_read_bool(child, state);
	/* Drop the reference taken by the child lookup. */
	of_node_put(child);

	return present;
}
578c2ecf20Sopenharmony_ci
588c2ecf20Sopenharmony_cistatic void init_fw_feat_flags(struct device_node *np)
598c2ecf20Sopenharmony_ci{
608c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "inst-spec-barrier-ori31,31,0", np))
618c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_SPEC_BAR_ORI31);
628c2ecf20Sopenharmony_ci
638c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "fw-bcctrl-serialized", np))
648c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_BCCTRL_SERIALISED);
658c2ecf20Sopenharmony_ci
668c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "inst-l1d-flush-ori30,30,0", np))
678c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_L1D_FLUSH_ORI30);
688c2ecf20Sopenharmony_ci
698c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "inst-l1d-flush-trig2", np))
708c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_L1D_FLUSH_TRIG2);
718c2ecf20Sopenharmony_ci
728c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "fw-l1d-thread-split", np))
738c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_L1D_THREAD_PRIV);
748c2ecf20Sopenharmony_ci
758c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "fw-count-cache-disabled", np))
768c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_COUNT_CACHE_DISABLED);
778c2ecf20Sopenharmony_ci
788c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "fw-count-cache-flush-bcctr2,0,0", np))
798c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_BCCTR_FLUSH_ASSIST);
808c2ecf20Sopenharmony_ci
818c2ecf20Sopenharmony_ci	if (fw_feature_is("enabled", "needs-count-cache-flush-on-context-switch", np))
828c2ecf20Sopenharmony_ci		security_ftr_set(SEC_FTR_FLUSH_COUNT_CACHE);
838c2ecf20Sopenharmony_ci
848c2ecf20Sopenharmony_ci	/*
858c2ecf20Sopenharmony_ci	 * The features below are enabled by default, so we instead look to see
868c2ecf20Sopenharmony_ci	 * if firmware has *disabled* them, and clear them if so.
878c2ecf20Sopenharmony_ci	 */
888c2ecf20Sopenharmony_ci	if (fw_feature_is("disabled", "speculation-policy-favor-security", np))
898c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_FAVOUR_SECURITY);
908c2ecf20Sopenharmony_ci
918c2ecf20Sopenharmony_ci	if (fw_feature_is("disabled", "needs-l1d-flush-msr-pr-0-to-1", np))
928c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_L1D_FLUSH_PR);
938c2ecf20Sopenharmony_ci
948c2ecf20Sopenharmony_ci	if (fw_feature_is("disabled", "needs-l1d-flush-msr-hv-1-to-0", np))
958c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_L1D_FLUSH_HV);
968c2ecf20Sopenharmony_ci
978c2ecf20Sopenharmony_ci	if (fw_feature_is("disabled", "needs-spec-barrier-for-bound-checks", np))
988c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_BNDS_CHK_SPEC_BAR);
998c2ecf20Sopenharmony_ci}
1008c2ecf20Sopenharmony_ci
1018c2ecf20Sopenharmony_cistatic void pnv_setup_security_mitigations(void)
1028c2ecf20Sopenharmony_ci{
1038c2ecf20Sopenharmony_ci	struct device_node *np, *fw_features;
1048c2ecf20Sopenharmony_ci	enum l1d_flush_type type;
1058c2ecf20Sopenharmony_ci	bool enable;
1068c2ecf20Sopenharmony_ci
1078c2ecf20Sopenharmony_ci	/* Default to fallback in case fw-features are not available */
1088c2ecf20Sopenharmony_ci	type = L1D_FLUSH_FALLBACK;
1098c2ecf20Sopenharmony_ci
1108c2ecf20Sopenharmony_ci	np = of_find_node_by_name(NULL, "ibm,opal");
1118c2ecf20Sopenharmony_ci	fw_features = of_get_child_by_name(np, "fw-features");
1128c2ecf20Sopenharmony_ci	of_node_put(np);
1138c2ecf20Sopenharmony_ci
1148c2ecf20Sopenharmony_ci	if (fw_features) {
1158c2ecf20Sopenharmony_ci		init_fw_feat_flags(fw_features);
1168c2ecf20Sopenharmony_ci		of_node_put(fw_features);
1178c2ecf20Sopenharmony_ci
1188c2ecf20Sopenharmony_ci		if (security_ftr_enabled(SEC_FTR_L1D_FLUSH_TRIG2))
1198c2ecf20Sopenharmony_ci			type = L1D_FLUSH_MTTRIG;
1208c2ecf20Sopenharmony_ci
1218c2ecf20Sopenharmony_ci		if (security_ftr_enabled(SEC_FTR_L1D_FLUSH_ORI30))
1228c2ecf20Sopenharmony_ci			type = L1D_FLUSH_ORI;
1238c2ecf20Sopenharmony_ci	}
1248c2ecf20Sopenharmony_ci
1258c2ecf20Sopenharmony_ci	/*
1268c2ecf20Sopenharmony_ci	 * If we are non-Power9 bare metal, we don't need to flush on kernel
1278c2ecf20Sopenharmony_ci	 * entry or after user access: they fix a P9 specific vulnerability.
1288c2ecf20Sopenharmony_ci	 */
1298c2ecf20Sopenharmony_ci	if (!pvr_version_is(PVR_POWER9)) {
1308c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_L1D_FLUSH_ENTRY);
1318c2ecf20Sopenharmony_ci		security_ftr_clear(SEC_FTR_L1D_FLUSH_UACCESS);
1328c2ecf20Sopenharmony_ci	}
1338c2ecf20Sopenharmony_ci
1348c2ecf20Sopenharmony_ci	enable = security_ftr_enabled(SEC_FTR_FAVOUR_SECURITY) && \
1358c2ecf20Sopenharmony_ci		 (security_ftr_enabled(SEC_FTR_L1D_FLUSH_PR)   || \
1368c2ecf20Sopenharmony_ci		  security_ftr_enabled(SEC_FTR_L1D_FLUSH_HV));
1378c2ecf20Sopenharmony_ci
1388c2ecf20Sopenharmony_ci	setup_rfi_flush(type, enable);
1398c2ecf20Sopenharmony_ci	setup_count_cache_flush();
1408c2ecf20Sopenharmony_ci
1418c2ecf20Sopenharmony_ci	enable = security_ftr_enabled(SEC_FTR_FAVOUR_SECURITY) &&
1428c2ecf20Sopenharmony_ci		 security_ftr_enabled(SEC_FTR_L1D_FLUSH_ENTRY);
1438c2ecf20Sopenharmony_ci	setup_entry_flush(enable);
1448c2ecf20Sopenharmony_ci
1458c2ecf20Sopenharmony_ci	enable = security_ftr_enabled(SEC_FTR_FAVOUR_SECURITY) &&
1468c2ecf20Sopenharmony_ci		 security_ftr_enabled(SEC_FTR_L1D_FLUSH_UACCESS);
1478c2ecf20Sopenharmony_ci	setup_uaccess_flush(enable);
1488c2ecf20Sopenharmony_ci
1498c2ecf20Sopenharmony_ci	setup_stf_barrier();
1508c2ecf20Sopenharmony_ci}
1518c2ecf20Sopenharmony_ci
1528c2ecf20Sopenharmony_cistatic void __init pnv_check_guarded_cores(void)
1538c2ecf20Sopenharmony_ci{
1548c2ecf20Sopenharmony_ci	struct device_node *dn;
1558c2ecf20Sopenharmony_ci	int bad_count = 0;
1568c2ecf20Sopenharmony_ci
1578c2ecf20Sopenharmony_ci	for_each_node_by_type(dn, "cpu") {
1588c2ecf20Sopenharmony_ci		if (of_property_match_string(dn, "status", "bad") >= 0)
1598c2ecf20Sopenharmony_ci			bad_count++;
1608c2ecf20Sopenharmony_ci	};
1618c2ecf20Sopenharmony_ci
1628c2ecf20Sopenharmony_ci	if (bad_count) {
1638c2ecf20Sopenharmony_ci		printk("  _     _______________\n");
1648c2ecf20Sopenharmony_ci		pr_cont(" | |   /               \\\n");
1658c2ecf20Sopenharmony_ci		pr_cont(" | |   |    WARNING!   |\n");
1668c2ecf20Sopenharmony_ci		pr_cont(" | |   |               |\n");
1678c2ecf20Sopenharmony_ci		pr_cont(" | |   | It looks like |\n");
1688c2ecf20Sopenharmony_ci		pr_cont(" |_|   |  you have %*d |\n", 3, bad_count);
1698c2ecf20Sopenharmony_ci		pr_cont("  _    | guarded cores |\n");
1708c2ecf20Sopenharmony_ci		pr_cont(" (_)   \\_______________/\n");
1718c2ecf20Sopenharmony_ci	}
1728c2ecf20Sopenharmony_ci}
1738c2ecf20Sopenharmony_ci
1748c2ecf20Sopenharmony_cistatic void __init pnv_setup_arch(void)
1758c2ecf20Sopenharmony_ci{
1768c2ecf20Sopenharmony_ci	set_arch_panic_timeout(10, ARCH_PANIC_TIMEOUT);
1778c2ecf20Sopenharmony_ci
1788c2ecf20Sopenharmony_ci	pnv_setup_security_mitigations();
1798c2ecf20Sopenharmony_ci
1808c2ecf20Sopenharmony_ci	/* Initialize SMP */
1818c2ecf20Sopenharmony_ci	pnv_smp_init();
1828c2ecf20Sopenharmony_ci
1838c2ecf20Sopenharmony_ci	/* Setup PCI */
1848c2ecf20Sopenharmony_ci	pnv_pci_init();
1858c2ecf20Sopenharmony_ci
1868c2ecf20Sopenharmony_ci	/* Setup RTC and NVRAM callbacks */
1878c2ecf20Sopenharmony_ci	if (firmware_has_feature(FW_FEATURE_OPAL))
1888c2ecf20Sopenharmony_ci		opal_nvram_init();
1898c2ecf20Sopenharmony_ci
1908c2ecf20Sopenharmony_ci	/* Enable NAP mode */
1918c2ecf20Sopenharmony_ci	powersave_nap = 1;
1928c2ecf20Sopenharmony_ci
1938c2ecf20Sopenharmony_ci	pnv_check_guarded_cores();
1948c2ecf20Sopenharmony_ci
1958c2ecf20Sopenharmony_ci	/* XXX PMCS */
1968c2ecf20Sopenharmony_ci
1978c2ecf20Sopenharmony_ci	pnv_rng_init();
1988c2ecf20Sopenharmony_ci}
1998c2ecf20Sopenharmony_ci
2008c2ecf20Sopenharmony_cistatic void __init pnv_init(void)
2018c2ecf20Sopenharmony_ci{
2028c2ecf20Sopenharmony_ci	/*
2038c2ecf20Sopenharmony_ci	 * Initialize the LPC bus now so that legacy serial
2048c2ecf20Sopenharmony_ci	 * ports can be found on it
2058c2ecf20Sopenharmony_ci	 */
2068c2ecf20Sopenharmony_ci	opal_lpc_init();
2078c2ecf20Sopenharmony_ci
2088c2ecf20Sopenharmony_ci#ifdef CONFIG_HVC_OPAL
2098c2ecf20Sopenharmony_ci	if (firmware_has_feature(FW_FEATURE_OPAL))
2108c2ecf20Sopenharmony_ci		hvc_opal_init_early();
2118c2ecf20Sopenharmony_ci	else
2128c2ecf20Sopenharmony_ci#endif
2138c2ecf20Sopenharmony_ci		add_preferred_console("hvc", 0, NULL);
2148c2ecf20Sopenharmony_ci
2158c2ecf20Sopenharmony_ci	if (!radix_enabled()) {
2168c2ecf20Sopenharmony_ci		size_t size = sizeof(struct slb_entry) * mmu_slb_size;
2178c2ecf20Sopenharmony_ci		int i;
2188c2ecf20Sopenharmony_ci
2198c2ecf20Sopenharmony_ci		/* Allocate per cpu area to save old slb contents during MCE */
2208c2ecf20Sopenharmony_ci		for_each_possible_cpu(i) {
2218c2ecf20Sopenharmony_ci			paca_ptrs[i]->mce_faulty_slbs =
2228c2ecf20Sopenharmony_ci					memblock_alloc_node(size,
2238c2ecf20Sopenharmony_ci						__alignof__(struct slb_entry),
2248c2ecf20Sopenharmony_ci						cpu_to_node(i));
2258c2ecf20Sopenharmony_ci		}
2268c2ecf20Sopenharmony_ci	}
2278c2ecf20Sopenharmony_ci}
2288c2ecf20Sopenharmony_ci
2298c2ecf20Sopenharmony_cistatic void __init pnv_init_IRQ(void)
2308c2ecf20Sopenharmony_ci{
2318c2ecf20Sopenharmony_ci	/* Try using a XIVE if available, otherwise use a XICS */
2328c2ecf20Sopenharmony_ci	if (!xive_native_init())
2338c2ecf20Sopenharmony_ci		xics_init();
2348c2ecf20Sopenharmony_ci
2358c2ecf20Sopenharmony_ci	WARN_ON(!ppc_md.get_irq);
2368c2ecf20Sopenharmony_ci}
2378c2ecf20Sopenharmony_ci
2388c2ecf20Sopenharmony_cistatic void pnv_show_cpuinfo(struct seq_file *m)
2398c2ecf20Sopenharmony_ci{
2408c2ecf20Sopenharmony_ci	struct device_node *root;
2418c2ecf20Sopenharmony_ci	const char *model = "";
2428c2ecf20Sopenharmony_ci
2438c2ecf20Sopenharmony_ci	root = of_find_node_by_path("/");
2448c2ecf20Sopenharmony_ci	if (root)
2458c2ecf20Sopenharmony_ci		model = of_get_property(root, "model", NULL);
2468c2ecf20Sopenharmony_ci	seq_printf(m, "machine\t\t: PowerNV %s\n", model);
2478c2ecf20Sopenharmony_ci	if (firmware_has_feature(FW_FEATURE_OPAL))
2488c2ecf20Sopenharmony_ci		seq_printf(m, "firmware\t: OPAL\n");
2498c2ecf20Sopenharmony_ci	else
2508c2ecf20Sopenharmony_ci		seq_printf(m, "firmware\t: BML\n");
2518c2ecf20Sopenharmony_ci	of_node_put(root);
2528c2ecf20Sopenharmony_ci	if (radix_enabled())
2538c2ecf20Sopenharmony_ci		seq_printf(m, "MMU\t\t: Radix\n");
2548c2ecf20Sopenharmony_ci	else
2558c2ecf20Sopenharmony_ci		seq_printf(m, "MMU\t\t: Hash\n");
2568c2ecf20Sopenharmony_ci}
2578c2ecf20Sopenharmony_ci
/*
 * Common preparation shared by the restart and power-off paths.
 */
static void pnv_prepare_going_down(void)
{
	/*
	 * Interrupts can no longer be serviced from here on, so turn off
	 * every notifier coming from OPAL.
	 */
	opal_event_shutdown();

	/* If a flash update is scheduled, print the message about it. */
	opal_flash_update_print_message();

	smp_send_stop();

	hard_irq_disable();
}
2738c2ecf20Sopenharmony_ci
2748c2ecf20Sopenharmony_cistatic void  __noreturn pnv_restart(char *cmd)
2758c2ecf20Sopenharmony_ci{
2768c2ecf20Sopenharmony_ci	long rc;
2778c2ecf20Sopenharmony_ci
2788c2ecf20Sopenharmony_ci	pnv_prepare_going_down();
2798c2ecf20Sopenharmony_ci
2808c2ecf20Sopenharmony_ci	do {
2818c2ecf20Sopenharmony_ci		if (!cmd || !strlen(cmd))
2828c2ecf20Sopenharmony_ci			rc = opal_cec_reboot();
2838c2ecf20Sopenharmony_ci		else if (strcmp(cmd, "full") == 0)
2848c2ecf20Sopenharmony_ci			rc = opal_cec_reboot2(OPAL_REBOOT_FULL_IPL, NULL);
2858c2ecf20Sopenharmony_ci		else if (strcmp(cmd, "mpipl") == 0)
2868c2ecf20Sopenharmony_ci			rc = opal_cec_reboot2(OPAL_REBOOT_MPIPL, NULL);
2878c2ecf20Sopenharmony_ci		else if (strcmp(cmd, "error") == 0)
2888c2ecf20Sopenharmony_ci			rc = opal_cec_reboot2(OPAL_REBOOT_PLATFORM_ERROR, NULL);
2898c2ecf20Sopenharmony_ci		else if (strcmp(cmd, "fast") == 0)
2908c2ecf20Sopenharmony_ci			rc = opal_cec_reboot2(OPAL_REBOOT_FAST, NULL);
2918c2ecf20Sopenharmony_ci		else
2928c2ecf20Sopenharmony_ci			rc = OPAL_UNSUPPORTED;
2938c2ecf20Sopenharmony_ci
2948c2ecf20Sopenharmony_ci		if (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
2958c2ecf20Sopenharmony_ci			/* Opal is busy wait for some time and retry */
2968c2ecf20Sopenharmony_ci			opal_poll_events(NULL);
2978c2ecf20Sopenharmony_ci			mdelay(10);
2988c2ecf20Sopenharmony_ci
2998c2ecf20Sopenharmony_ci		} else	if (cmd && rc) {
3008c2ecf20Sopenharmony_ci			/* Unknown error while issuing reboot */
3018c2ecf20Sopenharmony_ci			if (rc == OPAL_UNSUPPORTED)
3028c2ecf20Sopenharmony_ci				pr_err("Unsupported '%s' reboot.\n", cmd);
3038c2ecf20Sopenharmony_ci			else
3048c2ecf20Sopenharmony_ci				pr_err("Unable to issue '%s' reboot. Err=%ld\n",
3058c2ecf20Sopenharmony_ci				       cmd, rc);
3068c2ecf20Sopenharmony_ci			pr_info("Forcing a cec-reboot\n");
3078c2ecf20Sopenharmony_ci			cmd = NULL;
3088c2ecf20Sopenharmony_ci			rc = OPAL_BUSY;
3098c2ecf20Sopenharmony_ci
3108c2ecf20Sopenharmony_ci		} else if (rc != OPAL_SUCCESS) {
3118c2ecf20Sopenharmony_ci			/* Unknown error while issuing cec-reboot */
3128c2ecf20Sopenharmony_ci			pr_err("Unable to reboot. Err=%ld\n", rc);
3138c2ecf20Sopenharmony_ci		}
3148c2ecf20Sopenharmony_ci
3158c2ecf20Sopenharmony_ci	} while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT);
3168c2ecf20Sopenharmony_ci
3178c2ecf20Sopenharmony_ci	for (;;)
3188c2ecf20Sopenharmony_ci		opal_poll_events(NULL);
3198c2ecf20Sopenharmony_ci}
3208c2ecf20Sopenharmony_ci
3218c2ecf20Sopenharmony_cistatic void __noreturn pnv_power_off(void)
3228c2ecf20Sopenharmony_ci{
3238c2ecf20Sopenharmony_ci	long rc = OPAL_BUSY;
3248c2ecf20Sopenharmony_ci
3258c2ecf20Sopenharmony_ci	pnv_prepare_going_down();
3268c2ecf20Sopenharmony_ci
3278c2ecf20Sopenharmony_ci	while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
3288c2ecf20Sopenharmony_ci		rc = opal_cec_power_down(0);
3298c2ecf20Sopenharmony_ci		if (rc == OPAL_BUSY_EVENT)
3308c2ecf20Sopenharmony_ci			opal_poll_events(NULL);
3318c2ecf20Sopenharmony_ci		else
3328c2ecf20Sopenharmony_ci			mdelay(10);
3338c2ecf20Sopenharmony_ci	}
3348c2ecf20Sopenharmony_ci	for (;;)
3358c2ecf20Sopenharmony_ci		opal_poll_events(NULL);
3368c2ecf20Sopenharmony_ci}
3378c2ecf20Sopenharmony_ci
3388c2ecf20Sopenharmony_cistatic void __noreturn pnv_halt(void)
3398c2ecf20Sopenharmony_ci{
3408c2ecf20Sopenharmony_ci	pnv_power_off();
3418c2ecf20Sopenharmony_ci}
3428c2ecf20Sopenharmony_ci
/* Progress hook: deliberately does nothing with @s or @hex. */
static void pnv_progress(char *s, unsigned short hex)
{
	/* Intentionally empty. */
}
3468c2ecf20Sopenharmony_ci
/*
 * Machine shutdown hook: quiesce PCI first, then OPAL.
 */
static void pnv_shutdown(void)
{
	/* Give the PCI code the chance to clear up its IODA tables. */
	pnv_pci_shutdown();

	/*
	 * Quiesce OPAL: all OPAL interrupts are unregistered so that none
	 * fires during kexec, and any operation that may still be doing
	 * DMA (dump retrieval, for instance) is allowed to complete.
	 */
	opal_shutdown();
}
3598c2ecf20Sopenharmony_ci
3608c2ecf20Sopenharmony_ci#ifdef CONFIG_KEXEC_CORE
3618c2ecf20Sopenharmony_cistatic void pnv_kexec_wait_secondaries_down(void)
3628c2ecf20Sopenharmony_ci{
3638c2ecf20Sopenharmony_ci	int my_cpu, i, notified = -1;
3648c2ecf20Sopenharmony_ci
3658c2ecf20Sopenharmony_ci	my_cpu = get_cpu();
3668c2ecf20Sopenharmony_ci
3678c2ecf20Sopenharmony_ci	for_each_online_cpu(i) {
3688c2ecf20Sopenharmony_ci		uint8_t status;
3698c2ecf20Sopenharmony_ci		int64_t rc, timeout = 1000;
3708c2ecf20Sopenharmony_ci
3718c2ecf20Sopenharmony_ci		if (i == my_cpu)
3728c2ecf20Sopenharmony_ci			continue;
3738c2ecf20Sopenharmony_ci
3748c2ecf20Sopenharmony_ci		for (;;) {
3758c2ecf20Sopenharmony_ci			rc = opal_query_cpu_status(get_hard_smp_processor_id(i),
3768c2ecf20Sopenharmony_ci						   &status);
3778c2ecf20Sopenharmony_ci			if (rc != OPAL_SUCCESS || status != OPAL_THREAD_STARTED)
3788c2ecf20Sopenharmony_ci				break;
3798c2ecf20Sopenharmony_ci			barrier();
3808c2ecf20Sopenharmony_ci			if (i != notified) {
3818c2ecf20Sopenharmony_ci				printk(KERN_INFO "kexec: waiting for cpu %d "
3828c2ecf20Sopenharmony_ci				       "(physical %d) to enter OPAL\n",
3838c2ecf20Sopenharmony_ci				       i, paca_ptrs[i]->hw_cpu_id);
3848c2ecf20Sopenharmony_ci				notified = i;
3858c2ecf20Sopenharmony_ci			}
3868c2ecf20Sopenharmony_ci
3878c2ecf20Sopenharmony_ci			/*
3888c2ecf20Sopenharmony_ci			 * On crash secondaries might be unreachable or hung,
3898c2ecf20Sopenharmony_ci			 * so timeout if we've waited too long
3908c2ecf20Sopenharmony_ci			 * */
3918c2ecf20Sopenharmony_ci			mdelay(1);
3928c2ecf20Sopenharmony_ci			if (timeout-- == 0) {
3938c2ecf20Sopenharmony_ci				printk(KERN_ERR "kexec: timed out waiting for "
3948c2ecf20Sopenharmony_ci				       "cpu %d (physical %d) to enter OPAL\n",
3958c2ecf20Sopenharmony_ci				       i, paca_ptrs[i]->hw_cpu_id);
3968c2ecf20Sopenharmony_ci				break;
3978c2ecf20Sopenharmony_ci			}
3988c2ecf20Sopenharmony_ci		}
3998c2ecf20Sopenharmony_ci	}
4008c2ecf20Sopenharmony_ci}
4018c2ecf20Sopenharmony_ci
4028c2ecf20Sopenharmony_cistatic void pnv_kexec_cpu_down(int crash_shutdown, int secondary)
4038c2ecf20Sopenharmony_ci{
4048c2ecf20Sopenharmony_ci	u64 reinit_flags;
4058c2ecf20Sopenharmony_ci
4068c2ecf20Sopenharmony_ci	if (xive_enabled())
4078c2ecf20Sopenharmony_ci		xive_teardown_cpu();
4088c2ecf20Sopenharmony_ci	else
4098c2ecf20Sopenharmony_ci		xics_kexec_teardown_cpu(secondary);
4108c2ecf20Sopenharmony_ci
4118c2ecf20Sopenharmony_ci	/* On OPAL, we return all CPUs to firmware */
4128c2ecf20Sopenharmony_ci	if (!firmware_has_feature(FW_FEATURE_OPAL))
4138c2ecf20Sopenharmony_ci		return;
4148c2ecf20Sopenharmony_ci
4158c2ecf20Sopenharmony_ci	if (secondary) {
4168c2ecf20Sopenharmony_ci		/* Return secondary CPUs to firmware on OPAL v3 */
4178c2ecf20Sopenharmony_ci		mb();
4188c2ecf20Sopenharmony_ci		get_paca()->kexec_state = KEXEC_STATE_REAL_MODE;
4198c2ecf20Sopenharmony_ci		mb();
4208c2ecf20Sopenharmony_ci
4218c2ecf20Sopenharmony_ci		/* Return the CPU to OPAL */
4228c2ecf20Sopenharmony_ci		opal_return_cpu();
4238c2ecf20Sopenharmony_ci	} else {
4248c2ecf20Sopenharmony_ci		/* Primary waits for the secondaries to have reached OPAL */
4258c2ecf20Sopenharmony_ci		pnv_kexec_wait_secondaries_down();
4268c2ecf20Sopenharmony_ci
4278c2ecf20Sopenharmony_ci		/* Switch XIVE back to emulation mode */
4288c2ecf20Sopenharmony_ci		if (xive_enabled())
4298c2ecf20Sopenharmony_ci			xive_shutdown();
4308c2ecf20Sopenharmony_ci
4318c2ecf20Sopenharmony_ci		/*
4328c2ecf20Sopenharmony_ci		 * We might be running as little-endian - now that interrupts
4338c2ecf20Sopenharmony_ci		 * are disabled, reset the HILE bit to big-endian so we don't
4348c2ecf20Sopenharmony_ci		 * take interrupts in the wrong endian later
4358c2ecf20Sopenharmony_ci		 *
4368c2ecf20Sopenharmony_ci		 * We reinit to enable both radix and hash on P9 to ensure
4378c2ecf20Sopenharmony_ci		 * the mode used by the next kernel is always supported.
4388c2ecf20Sopenharmony_ci		 */
4398c2ecf20Sopenharmony_ci		reinit_flags = OPAL_REINIT_CPUS_HILE_BE;
4408c2ecf20Sopenharmony_ci		if (cpu_has_feature(CPU_FTR_ARCH_300))
4418c2ecf20Sopenharmony_ci			reinit_flags |= OPAL_REINIT_CPUS_MMU_RADIX |
4428c2ecf20Sopenharmony_ci				OPAL_REINIT_CPUS_MMU_HASH;
4438c2ecf20Sopenharmony_ci		opal_reinit_cpus(reinit_flags);
4448c2ecf20Sopenharmony_ci	}
4458c2ecf20Sopenharmony_ci}
4468c2ecf20Sopenharmony_ci#endif /* CONFIG_KEXEC_CORE */
4478c2ecf20Sopenharmony_ci
4488c2ecf20Sopenharmony_ci#ifdef CONFIG_MEMORY_HOTPLUG_SPARSE
4498c2ecf20Sopenharmony_cistatic unsigned long pnv_memory_block_size(void)
4508c2ecf20Sopenharmony_ci{
4518c2ecf20Sopenharmony_ci	/*
4528c2ecf20Sopenharmony_ci	 * We map the kernel linear region with 1GB large pages on radix. For
4538c2ecf20Sopenharmony_ci	 * memory hot unplug to work our memory block size must be at least
4548c2ecf20Sopenharmony_ci	 * this size.
4558c2ecf20Sopenharmony_ci	 */
4568c2ecf20Sopenharmony_ci	if (radix_enabled())
4578c2ecf20Sopenharmony_ci		return radix_mem_block_size;
4588c2ecf20Sopenharmony_ci	else
4598c2ecf20Sopenharmony_ci		return 256UL * 1024 * 1024;
4608c2ecf20Sopenharmony_ci}
4618c2ecf20Sopenharmony_ci#endif
4628c2ecf20Sopenharmony_ci
4638c2ecf20Sopenharmony_cistatic void __init pnv_setup_machdep_opal(void)
4648c2ecf20Sopenharmony_ci{
4658c2ecf20Sopenharmony_ci	ppc_md.get_boot_time = opal_get_boot_time;
4668c2ecf20Sopenharmony_ci	ppc_md.restart = pnv_restart;
4678c2ecf20Sopenharmony_ci	pm_power_off = pnv_power_off;
4688c2ecf20Sopenharmony_ci	ppc_md.halt = pnv_halt;
4698c2ecf20Sopenharmony_ci	/* ppc_md.system_reset_exception gets filled in by pnv_smp_init() */
4708c2ecf20Sopenharmony_ci	ppc_md.machine_check_exception = opal_machine_check;
4718c2ecf20Sopenharmony_ci	ppc_md.mce_check_early_recovery = opal_mce_check_early_recovery;
4728c2ecf20Sopenharmony_ci	if (opal_check_token(OPAL_HANDLE_HMI2))
4738c2ecf20Sopenharmony_ci		ppc_md.hmi_exception_early = opal_hmi_exception_early2;
4748c2ecf20Sopenharmony_ci	else
4758c2ecf20Sopenharmony_ci		ppc_md.hmi_exception_early = opal_hmi_exception_early;
4768c2ecf20Sopenharmony_ci	ppc_md.handle_hmi_exception = opal_handle_hmi_exception;
4778c2ecf20Sopenharmony_ci}
4788c2ecf20Sopenharmony_ci
4798c2ecf20Sopenharmony_cistatic int __init pnv_probe(void)
4808c2ecf20Sopenharmony_ci{
4818c2ecf20Sopenharmony_ci	if (!of_machine_is_compatible("ibm,powernv"))
4828c2ecf20Sopenharmony_ci		return 0;
4838c2ecf20Sopenharmony_ci
4848c2ecf20Sopenharmony_ci	if (firmware_has_feature(FW_FEATURE_OPAL))
4858c2ecf20Sopenharmony_ci		pnv_setup_machdep_opal();
4868c2ecf20Sopenharmony_ci
4878c2ecf20Sopenharmony_ci	pr_debug("PowerNV detected !\n");
4888c2ecf20Sopenharmony_ci
4898c2ecf20Sopenharmony_ci	pnv_init();
4908c2ecf20Sopenharmony_ci
4918c2ecf20Sopenharmony_ci	return 1;
4928c2ecf20Sopenharmony_ci}
4938c2ecf20Sopenharmony_ci
4948c2ecf20Sopenharmony_ci#ifdef CONFIG_PPC_TRANSACTIONAL_MEM
4958c2ecf20Sopenharmony_civoid __init pnv_tm_init(void)
4968c2ecf20Sopenharmony_ci{
4978c2ecf20Sopenharmony_ci	if (!firmware_has_feature(FW_FEATURE_OPAL) ||
4988c2ecf20Sopenharmony_ci	    !pvr_version_is(PVR_POWER9) ||
4998c2ecf20Sopenharmony_ci	    early_cpu_has_feature(CPU_FTR_TM))
5008c2ecf20Sopenharmony_ci		return;
5018c2ecf20Sopenharmony_ci
5028c2ecf20Sopenharmony_ci	if (opal_reinit_cpus(OPAL_REINIT_CPUS_TM_SUSPEND_DISABLED) != OPAL_SUCCESS)
5038c2ecf20Sopenharmony_ci		return;
5048c2ecf20Sopenharmony_ci
5058c2ecf20Sopenharmony_ci	pr_info("Enabling TM (Transactional Memory) with Suspend Disabled\n");
5068c2ecf20Sopenharmony_ci	cur_cpu_spec->cpu_features |= CPU_FTR_TM;
5078c2ecf20Sopenharmony_ci	/* Make sure "normal" HTM is off (it should be) */
5088c2ecf20Sopenharmony_ci	cur_cpu_spec->cpu_user_features2 &= ~PPC_FEATURE2_HTM;
5098c2ecf20Sopenharmony_ci	/* Turn on no suspend mode, and HTM no SC */
5108c2ecf20Sopenharmony_ci	cur_cpu_spec->cpu_user_features2 |= PPC_FEATURE2_HTM_NO_SUSPEND | \
5118c2ecf20Sopenharmony_ci					    PPC_FEATURE2_HTM_NOSC;
5128c2ecf20Sopenharmony_ci	tm_suspend_disabled = true;
5138c2ecf20Sopenharmony_ci}
5148c2ecf20Sopenharmony_ci#endif /* CONFIG_PPC_TRANSACTIONAL_MEM */
5158c2ecf20Sopenharmony_ci
5168c2ecf20Sopenharmony_ci/*
5178c2ecf20Sopenharmony_ci * Returns the cpu frequency for 'cpu' in Hz. This is used by
5188c2ecf20Sopenharmony_ci * /proc/cpuinfo
5198c2ecf20Sopenharmony_ci */
5208c2ecf20Sopenharmony_cistatic unsigned long pnv_get_proc_freq(unsigned int cpu)
5218c2ecf20Sopenharmony_ci{
5228c2ecf20Sopenharmony_ci	unsigned long ret_freq;
5238c2ecf20Sopenharmony_ci
5248c2ecf20Sopenharmony_ci	ret_freq = cpufreq_get(cpu) * 1000ul;
5258c2ecf20Sopenharmony_ci
5268c2ecf20Sopenharmony_ci	/*
5278c2ecf20Sopenharmony_ci	 * If the backend cpufreq driver does not exist,
5288c2ecf20Sopenharmony_ci         * then fallback to old way of reporting the clockrate.
5298c2ecf20Sopenharmony_ci	 */
5308c2ecf20Sopenharmony_ci	if (!ret_freq)
5318c2ecf20Sopenharmony_ci		ret_freq = ppc_proc_freq;
5328c2ecf20Sopenharmony_ci	return ret_freq;
5338c2ecf20Sopenharmony_ci}
5348c2ecf20Sopenharmony_ci
5358c2ecf20Sopenharmony_cistatic long pnv_machine_check_early(struct pt_regs *regs)
5368c2ecf20Sopenharmony_ci{
5378c2ecf20Sopenharmony_ci	long handled = 0;
5388c2ecf20Sopenharmony_ci
5398c2ecf20Sopenharmony_ci	if (cur_cpu_spec && cur_cpu_spec->machine_check_early)
5408c2ecf20Sopenharmony_ci		handled = cur_cpu_spec->machine_check_early(regs);
5418c2ecf20Sopenharmony_ci
5428c2ecf20Sopenharmony_ci	return handled;
5438c2ecf20Sopenharmony_ci}
5448c2ecf20Sopenharmony_ci
5458c2ecf20Sopenharmony_cidefine_machine(powernv) {
5468c2ecf20Sopenharmony_ci	.name			= "PowerNV",
5478c2ecf20Sopenharmony_ci	.probe			= pnv_probe,
5488c2ecf20Sopenharmony_ci	.setup_arch		= pnv_setup_arch,
5498c2ecf20Sopenharmony_ci	.init_IRQ		= pnv_init_IRQ,
5508c2ecf20Sopenharmony_ci	.show_cpuinfo		= pnv_show_cpuinfo,
5518c2ecf20Sopenharmony_ci	.get_proc_freq          = pnv_get_proc_freq,
5528c2ecf20Sopenharmony_ci	.progress		= pnv_progress,
5538c2ecf20Sopenharmony_ci	.machine_shutdown	= pnv_shutdown,
5548c2ecf20Sopenharmony_ci	.power_save             = NULL,
5558c2ecf20Sopenharmony_ci	.calibrate_decr		= generic_calibrate_decr,
5568c2ecf20Sopenharmony_ci	.machine_check_early	= pnv_machine_check_early,
5578c2ecf20Sopenharmony_ci#ifdef CONFIG_KEXEC_CORE
5588c2ecf20Sopenharmony_ci	.kexec_cpu_down		= pnv_kexec_cpu_down,
5598c2ecf20Sopenharmony_ci#endif
5608c2ecf20Sopenharmony_ci#ifdef CONFIG_MEMORY_HOTPLUG_SPARSE
5618c2ecf20Sopenharmony_ci	.memory_block_size	= pnv_memory_block_size,
5628c2ecf20Sopenharmony_ci#endif
5638c2ecf20Sopenharmony_ci};
564