162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * POWERNV cpufreq driver for the IBM POWER processors
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * (C) Copyright IBM 2014
662306a36Sopenharmony_ci *
762306a36Sopenharmony_ci * Author: Vaidyanathan Srinivasan <svaidy at linux.vnet.ibm.com>
862306a36Sopenharmony_ci */
962306a36Sopenharmony_ci
1062306a36Sopenharmony_ci#define pr_fmt(fmt)	"powernv-cpufreq: " fmt
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_ci#include <linux/kernel.h>
1362306a36Sopenharmony_ci#include <linux/sysfs.h>
1462306a36Sopenharmony_ci#include <linux/cpumask.h>
1562306a36Sopenharmony_ci#include <linux/module.h>
1662306a36Sopenharmony_ci#include <linux/cpufreq.h>
1762306a36Sopenharmony_ci#include <linux/smp.h>
1862306a36Sopenharmony_ci#include <linux/of.h>
1962306a36Sopenharmony_ci#include <linux/reboot.h>
2062306a36Sopenharmony_ci#include <linux/slab.h>
2162306a36Sopenharmony_ci#include <linux/cpu.h>
2262306a36Sopenharmony_ci#include <linux/hashtable.h>
2362306a36Sopenharmony_ci#include <trace/events/power.h>
2462306a36Sopenharmony_ci
2562306a36Sopenharmony_ci#include <asm/cputhreads.h>
2662306a36Sopenharmony_ci#include <asm/firmware.h>
2762306a36Sopenharmony_ci#include <asm/reg.h>
2862306a36Sopenharmony_ci#include <asm/smp.h> /* Required for cpu_sibling_mask() in UP configs */
2962306a36Sopenharmony_ci#include <asm/opal.h>
3062306a36Sopenharmony_ci#include <linux/timer.h>
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_ci#define POWERNV_MAX_PSTATES_ORDER  8
3362306a36Sopenharmony_ci#define POWERNV_MAX_PSTATES	(1UL << (POWERNV_MAX_PSTATES_ORDER))
3462306a36Sopenharmony_ci#define PMSR_PSAFE_ENABLE	(1UL << 30)
3562306a36Sopenharmony_ci#define PMSR_SPR_EM_DISABLE	(1UL << 31)
3662306a36Sopenharmony_ci#define MAX_PSTATE_SHIFT	32
3762306a36Sopenharmony_ci#define LPSTATE_SHIFT		48
3862306a36Sopenharmony_ci#define GPSTATE_SHIFT		56
3962306a36Sopenharmony_ci#define MAX_NR_CHIPS		32
4062306a36Sopenharmony_ci
4162306a36Sopenharmony_ci#define MAX_RAMP_DOWN_TIME				5120
4262306a36Sopenharmony_ci/*
4362306a36Sopenharmony_ci * On an idle system we want the global pstate to ramp-down from max value to
4462306a36Sopenharmony_ci * min over a span of ~5 secs. Also we want it to initially ramp-down slowly and
4562306a36Sopenharmony_ci * then ramp-down rapidly later on.
4662306a36Sopenharmony_ci *
4762306a36Sopenharmony_ci * This gives a percentage rampdown for time elapsed in milliseconds.
4862306a36Sopenharmony_ci * ramp_down_percentage = ((ms * ms) >> 18)
4962306a36Sopenharmony_ci *			~= 3.8 * (sec * sec)
5062306a36Sopenharmony_ci *
5162306a36Sopenharmony_ci * At 0 ms	ramp_down_percent = 0
5262306a36Sopenharmony_ci * At 5120 ms	ramp_down_percent = 100
5362306a36Sopenharmony_ci */
5462306a36Sopenharmony_ci#define ramp_down_percent(time)		((time * time) >> 18)
5562306a36Sopenharmony_ci
5662306a36Sopenharmony_ci/* Interval after which the timer is queued to bring down global pstate */
5762306a36Sopenharmony_ci#define GPSTATE_TIMER_INTERVAL				2000
5862306a36Sopenharmony_ci
5962306a36Sopenharmony_ci/**
6062306a36Sopenharmony_ci * struct global_pstate_info -	Per policy data structure to maintain history of
6162306a36Sopenharmony_ci *				global pstates
6262306a36Sopenharmony_ci * @highest_lpstate_idx:	The local pstate index from which we are
6362306a36Sopenharmony_ci *				ramping down
6462306a36Sopenharmony_ci * @elapsed_time:		Time in ms spent in ramping down from
6562306a36Sopenharmony_ci *				highest_lpstate_idx
6662306a36Sopenharmony_ci * @last_sampled_time:		Time from boot in ms when global pstates were
6762306a36Sopenharmony_ci *				last set
6862306a36Sopenharmony_ci * @last_lpstate_idx:		Last set value of local pstate and global
6962306a36Sopenharmony_ci * @last_gpstate_idx:		pstate in terms of cpufreq table index
7062306a36Sopenharmony_ci * @timer:			Is used for ramping down if cpu goes idle for
7162306a36Sopenharmony_ci *				a long time with global pstate held high
7262306a36Sopenharmony_ci * @gpstate_lock:		A spinlock to maintain synchronization between
7362306a36Sopenharmony_ci *				routines called by the timer handler and
7462306a36Sopenharmony_ci *				governer's target_index calls
7562306a36Sopenharmony_ci * @policy:			Associated CPUFreq policy
7662306a36Sopenharmony_ci */
7762306a36Sopenharmony_cistruct global_pstate_info {
7862306a36Sopenharmony_ci	int highest_lpstate_idx;
7962306a36Sopenharmony_ci	unsigned int elapsed_time;
8062306a36Sopenharmony_ci	unsigned int last_sampled_time;
8162306a36Sopenharmony_ci	int last_lpstate_idx;
8262306a36Sopenharmony_ci	int last_gpstate_idx;
8362306a36Sopenharmony_ci	spinlock_t gpstate_lock;
8462306a36Sopenharmony_ci	struct timer_list timer;
8562306a36Sopenharmony_ci	struct cpufreq_policy *policy;
8662306a36Sopenharmony_ci};
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_cistatic struct cpufreq_frequency_table powernv_freqs[POWERNV_MAX_PSTATES+1];
8962306a36Sopenharmony_ci
9062306a36Sopenharmony_cistatic DEFINE_HASHTABLE(pstate_revmap, POWERNV_MAX_PSTATES_ORDER);
9162306a36Sopenharmony_ci/**
9262306a36Sopenharmony_ci * struct pstate_idx_revmap_data: Entry in the hashmap pstate_revmap
9362306a36Sopenharmony_ci *				  indexed by a function of pstate id.
9462306a36Sopenharmony_ci *
9562306a36Sopenharmony_ci * @pstate_id: pstate id for this entry.
9662306a36Sopenharmony_ci *
9762306a36Sopenharmony_ci * @cpufreq_table_idx: Index into the powernv_freqs
9862306a36Sopenharmony_ci *		       cpufreq_frequency_table for frequency
9962306a36Sopenharmony_ci *		       corresponding to pstate_id.
10062306a36Sopenharmony_ci *
10162306a36Sopenharmony_ci * @hentry: hlist_node that hooks this entry into the pstate_revmap
10262306a36Sopenharmony_ci *	    hashtable
10362306a36Sopenharmony_ci */
10462306a36Sopenharmony_cistruct pstate_idx_revmap_data {
10562306a36Sopenharmony_ci	u8 pstate_id;
10662306a36Sopenharmony_ci	unsigned int cpufreq_table_idx;
10762306a36Sopenharmony_ci	struct hlist_node hentry;
10862306a36Sopenharmony_ci};
10962306a36Sopenharmony_ci
11062306a36Sopenharmony_cistatic bool rebooting, throttled, occ_reset;
11162306a36Sopenharmony_ci
11262306a36Sopenharmony_cistatic const char * const throttle_reason[] = {
11362306a36Sopenharmony_ci	"No throttling",
11462306a36Sopenharmony_ci	"Power Cap",
11562306a36Sopenharmony_ci	"Processor Over Temperature",
11662306a36Sopenharmony_ci	"Power Supply Failure",
11762306a36Sopenharmony_ci	"Over Current",
11862306a36Sopenharmony_ci	"OCC Reset"
11962306a36Sopenharmony_ci};
12062306a36Sopenharmony_ci
12162306a36Sopenharmony_cienum throttle_reason_type {
12262306a36Sopenharmony_ci	NO_THROTTLE = 0,
12362306a36Sopenharmony_ci	POWERCAP,
12462306a36Sopenharmony_ci	CPU_OVERTEMP,
12562306a36Sopenharmony_ci	POWER_SUPPLY_FAILURE,
12662306a36Sopenharmony_ci	OVERCURRENT,
12762306a36Sopenharmony_ci	OCC_RESET_THROTTLE,
12862306a36Sopenharmony_ci	OCC_MAX_REASON
12962306a36Sopenharmony_ci};
13062306a36Sopenharmony_ci
13162306a36Sopenharmony_cistatic struct chip {
13262306a36Sopenharmony_ci	unsigned int id;
13362306a36Sopenharmony_ci	bool throttled;
13462306a36Sopenharmony_ci	bool restore;
13562306a36Sopenharmony_ci	u8 throttle_reason;
13662306a36Sopenharmony_ci	cpumask_t mask;
13762306a36Sopenharmony_ci	struct work_struct throttle;
13862306a36Sopenharmony_ci	int throttle_turbo;
13962306a36Sopenharmony_ci	int throttle_sub_turbo;
14062306a36Sopenharmony_ci	int reason[OCC_MAX_REASON];
14162306a36Sopenharmony_ci} *chips;
14262306a36Sopenharmony_ci
14362306a36Sopenharmony_cistatic int nr_chips;
14462306a36Sopenharmony_cistatic DEFINE_PER_CPU(struct chip *, chip_info);
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci/*
14762306a36Sopenharmony_ci * Note:
14862306a36Sopenharmony_ci * The set of pstates consists of contiguous integers.
14962306a36Sopenharmony_ci * powernv_pstate_info stores the index of the frequency table for
15062306a36Sopenharmony_ci * max, min and nominal frequencies. It also stores number of
15162306a36Sopenharmony_ci * available frequencies.
15262306a36Sopenharmony_ci *
15362306a36Sopenharmony_ci * powernv_pstate_info.nominal indicates the index to the highest
15462306a36Sopenharmony_ci * non-turbo frequency.
15562306a36Sopenharmony_ci */
15662306a36Sopenharmony_cistatic struct powernv_pstate_info {
15762306a36Sopenharmony_ci	unsigned int min;
15862306a36Sopenharmony_ci	unsigned int max;
15962306a36Sopenharmony_ci	unsigned int nominal;
16062306a36Sopenharmony_ci	unsigned int nr_pstates;
16162306a36Sopenharmony_ci	bool wof_enabled;
16262306a36Sopenharmony_ci} powernv_pstate_info;
16362306a36Sopenharmony_ci
16462306a36Sopenharmony_cistatic inline u8 extract_pstate(u64 pmsr_val, unsigned int shift)
16562306a36Sopenharmony_ci{
16662306a36Sopenharmony_ci	return ((pmsr_val >> shift) & 0xFF);
16762306a36Sopenharmony_ci}
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_ci#define extract_local_pstate(x) extract_pstate(x, LPSTATE_SHIFT)
17062306a36Sopenharmony_ci#define extract_global_pstate(x) extract_pstate(x, GPSTATE_SHIFT)
17162306a36Sopenharmony_ci#define extract_max_pstate(x)  extract_pstate(x, MAX_PSTATE_SHIFT)
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_ci/* Use following functions for conversions between pstate_id and index */
17462306a36Sopenharmony_ci
17562306a36Sopenharmony_ci/*
17662306a36Sopenharmony_ci * idx_to_pstate : Returns the pstate id corresponding to the
17762306a36Sopenharmony_ci *		   frequency in the cpufreq frequency table
17862306a36Sopenharmony_ci *		   powernv_freqs indexed by @i.
17962306a36Sopenharmony_ci *
18062306a36Sopenharmony_ci *		   If @i is out of bound, this will return the pstate
18162306a36Sopenharmony_ci *		   corresponding to the nominal frequency.
18262306a36Sopenharmony_ci */
18362306a36Sopenharmony_cistatic inline u8 idx_to_pstate(unsigned int i)
18462306a36Sopenharmony_ci{
18562306a36Sopenharmony_ci	if (unlikely(i >= powernv_pstate_info.nr_pstates)) {
18662306a36Sopenharmony_ci		pr_warn_once("idx_to_pstate: index %u is out of bound\n", i);
18762306a36Sopenharmony_ci		return powernv_freqs[powernv_pstate_info.nominal].driver_data;
18862306a36Sopenharmony_ci	}
18962306a36Sopenharmony_ci
19062306a36Sopenharmony_ci	return powernv_freqs[i].driver_data;
19162306a36Sopenharmony_ci}
19262306a36Sopenharmony_ci
19362306a36Sopenharmony_ci/*
19462306a36Sopenharmony_ci * pstate_to_idx : Returns the index in the cpufreq frequencytable
19562306a36Sopenharmony_ci *		   powernv_freqs for the frequency whose corresponding
19662306a36Sopenharmony_ci *		   pstate id is @pstate.
19762306a36Sopenharmony_ci *
19862306a36Sopenharmony_ci *		   If no frequency corresponding to @pstate is found,
19962306a36Sopenharmony_ci *		   this will return the index of the nominal
20062306a36Sopenharmony_ci *		   frequency.
20162306a36Sopenharmony_ci */
20262306a36Sopenharmony_cistatic unsigned int pstate_to_idx(u8 pstate)
20362306a36Sopenharmony_ci{
20462306a36Sopenharmony_ci	unsigned int key = pstate % POWERNV_MAX_PSTATES;
20562306a36Sopenharmony_ci	struct pstate_idx_revmap_data *revmap_data;
20662306a36Sopenharmony_ci
20762306a36Sopenharmony_ci	hash_for_each_possible(pstate_revmap, revmap_data, hentry, key) {
20862306a36Sopenharmony_ci		if (revmap_data->pstate_id == pstate)
20962306a36Sopenharmony_ci			return revmap_data->cpufreq_table_idx;
21062306a36Sopenharmony_ci	}
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_ci	pr_warn_once("pstate_to_idx: pstate 0x%x not found\n", pstate);
21362306a36Sopenharmony_ci	return powernv_pstate_info.nominal;
21462306a36Sopenharmony_ci}
21562306a36Sopenharmony_ci
21662306a36Sopenharmony_cistatic inline void reset_gpstates(struct cpufreq_policy *policy)
21762306a36Sopenharmony_ci{
21862306a36Sopenharmony_ci	struct global_pstate_info *gpstates = policy->driver_data;
21962306a36Sopenharmony_ci
22062306a36Sopenharmony_ci	gpstates->highest_lpstate_idx = 0;
22162306a36Sopenharmony_ci	gpstates->elapsed_time = 0;
22262306a36Sopenharmony_ci	gpstates->last_sampled_time = 0;
22362306a36Sopenharmony_ci	gpstates->last_lpstate_idx = 0;
22462306a36Sopenharmony_ci	gpstates->last_gpstate_idx = 0;
22562306a36Sopenharmony_ci}
22662306a36Sopenharmony_ci
22762306a36Sopenharmony_ci/*
22862306a36Sopenharmony_ci * Initialize the freq table based on data obtained
22962306a36Sopenharmony_ci * from the firmware passed via device-tree
23062306a36Sopenharmony_ci */
23162306a36Sopenharmony_cistatic int init_powernv_pstates(void)
23262306a36Sopenharmony_ci{
23362306a36Sopenharmony_ci	struct device_node *power_mgt;
23462306a36Sopenharmony_ci	int i, nr_pstates = 0;
23562306a36Sopenharmony_ci	const __be32 *pstate_ids, *pstate_freqs;
23662306a36Sopenharmony_ci	u32 len_ids, len_freqs;
23762306a36Sopenharmony_ci	u32 pstate_min, pstate_max, pstate_nominal;
23862306a36Sopenharmony_ci	u32 pstate_turbo, pstate_ultra_turbo;
23962306a36Sopenharmony_ci	int rc = -ENODEV;
24062306a36Sopenharmony_ci
24162306a36Sopenharmony_ci	power_mgt = of_find_node_by_path("/ibm,opal/power-mgt");
24262306a36Sopenharmony_ci	if (!power_mgt) {
24362306a36Sopenharmony_ci		pr_warn("power-mgt node not found\n");
24462306a36Sopenharmony_ci		return -ENODEV;
24562306a36Sopenharmony_ci	}
24662306a36Sopenharmony_ci
24762306a36Sopenharmony_ci	if (of_property_read_u32(power_mgt, "ibm,pstate-min", &pstate_min)) {
24862306a36Sopenharmony_ci		pr_warn("ibm,pstate-min node not found\n");
24962306a36Sopenharmony_ci		goto out;
25062306a36Sopenharmony_ci	}
25162306a36Sopenharmony_ci
25262306a36Sopenharmony_ci	if (of_property_read_u32(power_mgt, "ibm,pstate-max", &pstate_max)) {
25362306a36Sopenharmony_ci		pr_warn("ibm,pstate-max node not found\n");
25462306a36Sopenharmony_ci		goto out;
25562306a36Sopenharmony_ci	}
25662306a36Sopenharmony_ci
25762306a36Sopenharmony_ci	if (of_property_read_u32(power_mgt, "ibm,pstate-nominal",
25862306a36Sopenharmony_ci				 &pstate_nominal)) {
25962306a36Sopenharmony_ci		pr_warn("ibm,pstate-nominal not found\n");
26062306a36Sopenharmony_ci		goto out;
26162306a36Sopenharmony_ci	}
26262306a36Sopenharmony_ci
26362306a36Sopenharmony_ci	if (of_property_read_u32(power_mgt, "ibm,pstate-ultra-turbo",
26462306a36Sopenharmony_ci				 &pstate_ultra_turbo)) {
26562306a36Sopenharmony_ci		powernv_pstate_info.wof_enabled = false;
26662306a36Sopenharmony_ci		goto next;
26762306a36Sopenharmony_ci	}
26862306a36Sopenharmony_ci
26962306a36Sopenharmony_ci	if (of_property_read_u32(power_mgt, "ibm,pstate-turbo",
27062306a36Sopenharmony_ci				 &pstate_turbo)) {
27162306a36Sopenharmony_ci		powernv_pstate_info.wof_enabled = false;
27262306a36Sopenharmony_ci		goto next;
27362306a36Sopenharmony_ci	}
27462306a36Sopenharmony_ci
27562306a36Sopenharmony_ci	if (pstate_turbo == pstate_ultra_turbo)
27662306a36Sopenharmony_ci		powernv_pstate_info.wof_enabled = false;
27762306a36Sopenharmony_ci	else
27862306a36Sopenharmony_ci		powernv_pstate_info.wof_enabled = true;
27962306a36Sopenharmony_ci
28062306a36Sopenharmony_cinext:
28162306a36Sopenharmony_ci	pr_info("cpufreq pstate min 0x%x nominal 0x%x max 0x%x\n", pstate_min,
28262306a36Sopenharmony_ci		pstate_nominal, pstate_max);
28362306a36Sopenharmony_ci	pr_info("Workload Optimized Frequency is %s in the platform\n",
28462306a36Sopenharmony_ci		(powernv_pstate_info.wof_enabled) ? "enabled" : "disabled");
28562306a36Sopenharmony_ci
28662306a36Sopenharmony_ci	pstate_ids = of_get_property(power_mgt, "ibm,pstate-ids", &len_ids);
28762306a36Sopenharmony_ci	if (!pstate_ids) {
28862306a36Sopenharmony_ci		pr_warn("ibm,pstate-ids not found\n");
28962306a36Sopenharmony_ci		goto out;
29062306a36Sopenharmony_ci	}
29162306a36Sopenharmony_ci
29262306a36Sopenharmony_ci	pstate_freqs = of_get_property(power_mgt, "ibm,pstate-frequencies-mhz",
29362306a36Sopenharmony_ci				      &len_freqs);
29462306a36Sopenharmony_ci	if (!pstate_freqs) {
29562306a36Sopenharmony_ci		pr_warn("ibm,pstate-frequencies-mhz not found\n");
29662306a36Sopenharmony_ci		goto out;
29762306a36Sopenharmony_ci	}
29862306a36Sopenharmony_ci
29962306a36Sopenharmony_ci	if (len_ids != len_freqs) {
30062306a36Sopenharmony_ci		pr_warn("Entries in ibm,pstate-ids and "
30162306a36Sopenharmony_ci			"ibm,pstate-frequencies-mhz does not match\n");
30262306a36Sopenharmony_ci	}
30362306a36Sopenharmony_ci
30462306a36Sopenharmony_ci	nr_pstates = min(len_ids, len_freqs) / sizeof(u32);
30562306a36Sopenharmony_ci	if (!nr_pstates) {
30662306a36Sopenharmony_ci		pr_warn("No PStates found\n");
30762306a36Sopenharmony_ci		goto out;
30862306a36Sopenharmony_ci	}
30962306a36Sopenharmony_ci
31062306a36Sopenharmony_ci	powernv_pstate_info.nr_pstates = nr_pstates;
31162306a36Sopenharmony_ci	pr_debug("NR PStates %d\n", nr_pstates);
31262306a36Sopenharmony_ci
31362306a36Sopenharmony_ci	for (i = 0; i < nr_pstates; i++) {
31462306a36Sopenharmony_ci		u32 id = be32_to_cpu(pstate_ids[i]);
31562306a36Sopenharmony_ci		u32 freq = be32_to_cpu(pstate_freqs[i]);
31662306a36Sopenharmony_ci		struct pstate_idx_revmap_data *revmap_data;
31762306a36Sopenharmony_ci		unsigned int key;
31862306a36Sopenharmony_ci
31962306a36Sopenharmony_ci		pr_debug("PState id %d freq %d MHz\n", id, freq);
32062306a36Sopenharmony_ci		powernv_freqs[i].frequency = freq * 1000; /* kHz */
32162306a36Sopenharmony_ci		powernv_freqs[i].driver_data = id & 0xFF;
32262306a36Sopenharmony_ci
32362306a36Sopenharmony_ci		revmap_data = kmalloc(sizeof(*revmap_data), GFP_KERNEL);
32462306a36Sopenharmony_ci		if (!revmap_data) {
32562306a36Sopenharmony_ci			rc = -ENOMEM;
32662306a36Sopenharmony_ci			goto out;
32762306a36Sopenharmony_ci		}
32862306a36Sopenharmony_ci
32962306a36Sopenharmony_ci		revmap_data->pstate_id = id & 0xFF;
33062306a36Sopenharmony_ci		revmap_data->cpufreq_table_idx = i;
33162306a36Sopenharmony_ci		key = (revmap_data->pstate_id) % POWERNV_MAX_PSTATES;
33262306a36Sopenharmony_ci		hash_add(pstate_revmap, &revmap_data->hentry, key);
33362306a36Sopenharmony_ci
33462306a36Sopenharmony_ci		if (id == pstate_max)
33562306a36Sopenharmony_ci			powernv_pstate_info.max = i;
33662306a36Sopenharmony_ci		if (id == pstate_nominal)
33762306a36Sopenharmony_ci			powernv_pstate_info.nominal = i;
33862306a36Sopenharmony_ci		if (id == pstate_min)
33962306a36Sopenharmony_ci			powernv_pstate_info.min = i;
34062306a36Sopenharmony_ci
34162306a36Sopenharmony_ci		if (powernv_pstate_info.wof_enabled && id == pstate_turbo) {
34262306a36Sopenharmony_ci			int j;
34362306a36Sopenharmony_ci
34462306a36Sopenharmony_ci			for (j = i - 1; j >= (int)powernv_pstate_info.max; j--)
34562306a36Sopenharmony_ci				powernv_freqs[j].flags = CPUFREQ_BOOST_FREQ;
34662306a36Sopenharmony_ci		}
34762306a36Sopenharmony_ci	}
34862306a36Sopenharmony_ci
34962306a36Sopenharmony_ci	/* End of list marker entry */
35062306a36Sopenharmony_ci	powernv_freqs[i].frequency = CPUFREQ_TABLE_END;
35162306a36Sopenharmony_ci
35262306a36Sopenharmony_ci	of_node_put(power_mgt);
35362306a36Sopenharmony_ci	return 0;
35462306a36Sopenharmony_ciout:
35562306a36Sopenharmony_ci	of_node_put(power_mgt);
35662306a36Sopenharmony_ci	return rc;
35762306a36Sopenharmony_ci}
35862306a36Sopenharmony_ci
35962306a36Sopenharmony_ci/* Returns the CPU frequency corresponding to the pstate_id. */
36062306a36Sopenharmony_cistatic unsigned int pstate_id_to_freq(u8 pstate_id)
36162306a36Sopenharmony_ci{
36262306a36Sopenharmony_ci	int i;
36362306a36Sopenharmony_ci
36462306a36Sopenharmony_ci	i = pstate_to_idx(pstate_id);
36562306a36Sopenharmony_ci	if (i >= powernv_pstate_info.nr_pstates || i < 0) {
36662306a36Sopenharmony_ci		pr_warn("PState id 0x%x outside of PState table, reporting nominal id 0x%x instead\n",
36762306a36Sopenharmony_ci			pstate_id, idx_to_pstate(powernv_pstate_info.nominal));
36862306a36Sopenharmony_ci		i = powernv_pstate_info.nominal;
36962306a36Sopenharmony_ci	}
37062306a36Sopenharmony_ci
37162306a36Sopenharmony_ci	return powernv_freqs[i].frequency;
37262306a36Sopenharmony_ci}
37362306a36Sopenharmony_ci
37462306a36Sopenharmony_ci/*
37562306a36Sopenharmony_ci * cpuinfo_nominal_freq_show - Show the nominal CPU frequency as indicated by
37662306a36Sopenharmony_ci * the firmware
37762306a36Sopenharmony_ci */
37862306a36Sopenharmony_cistatic ssize_t cpuinfo_nominal_freq_show(struct cpufreq_policy *policy,
37962306a36Sopenharmony_ci					char *buf)
38062306a36Sopenharmony_ci{
38162306a36Sopenharmony_ci	return sprintf(buf, "%u\n",
38262306a36Sopenharmony_ci		powernv_freqs[powernv_pstate_info.nominal].frequency);
38362306a36Sopenharmony_ci}
38462306a36Sopenharmony_ci
38562306a36Sopenharmony_cistatic struct freq_attr cpufreq_freq_attr_cpuinfo_nominal_freq =
38662306a36Sopenharmony_ci	__ATTR_RO(cpuinfo_nominal_freq);
38762306a36Sopenharmony_ci
38862306a36Sopenharmony_ci#define SCALING_BOOST_FREQS_ATTR_INDEX		2
38962306a36Sopenharmony_ci
39062306a36Sopenharmony_cistatic struct freq_attr *powernv_cpu_freq_attr[] = {
39162306a36Sopenharmony_ci	&cpufreq_freq_attr_scaling_available_freqs,
39262306a36Sopenharmony_ci	&cpufreq_freq_attr_cpuinfo_nominal_freq,
39362306a36Sopenharmony_ci	&cpufreq_freq_attr_scaling_boost_freqs,
39462306a36Sopenharmony_ci	NULL,
39562306a36Sopenharmony_ci};
39662306a36Sopenharmony_ci
39762306a36Sopenharmony_ci#define throttle_attr(name, member)					\
39862306a36Sopenharmony_cistatic ssize_t name##_show(struct cpufreq_policy *policy, char *buf)	\
39962306a36Sopenharmony_ci{									\
40062306a36Sopenharmony_ci	struct chip *chip = per_cpu(chip_info, policy->cpu);		\
40162306a36Sopenharmony_ci									\
40262306a36Sopenharmony_ci	return sprintf(buf, "%u\n", chip->member);			\
40362306a36Sopenharmony_ci}									\
40462306a36Sopenharmony_ci									\
40562306a36Sopenharmony_cistatic struct freq_attr throttle_attr_##name = __ATTR_RO(name)		\
40662306a36Sopenharmony_ci
40762306a36Sopenharmony_cithrottle_attr(unthrottle, reason[NO_THROTTLE]);
40862306a36Sopenharmony_cithrottle_attr(powercap, reason[POWERCAP]);
40962306a36Sopenharmony_cithrottle_attr(overtemp, reason[CPU_OVERTEMP]);
41062306a36Sopenharmony_cithrottle_attr(supply_fault, reason[POWER_SUPPLY_FAILURE]);
41162306a36Sopenharmony_cithrottle_attr(overcurrent, reason[OVERCURRENT]);
41262306a36Sopenharmony_cithrottle_attr(occ_reset, reason[OCC_RESET_THROTTLE]);
41362306a36Sopenharmony_cithrottle_attr(turbo_stat, throttle_turbo);
41462306a36Sopenharmony_cithrottle_attr(sub_turbo_stat, throttle_sub_turbo);
41562306a36Sopenharmony_ci
41662306a36Sopenharmony_cistatic struct attribute *throttle_attrs[] = {
41762306a36Sopenharmony_ci	&throttle_attr_unthrottle.attr,
41862306a36Sopenharmony_ci	&throttle_attr_powercap.attr,
41962306a36Sopenharmony_ci	&throttle_attr_overtemp.attr,
42062306a36Sopenharmony_ci	&throttle_attr_supply_fault.attr,
42162306a36Sopenharmony_ci	&throttle_attr_overcurrent.attr,
42262306a36Sopenharmony_ci	&throttle_attr_occ_reset.attr,
42362306a36Sopenharmony_ci	&throttle_attr_turbo_stat.attr,
42462306a36Sopenharmony_ci	&throttle_attr_sub_turbo_stat.attr,
42562306a36Sopenharmony_ci	NULL,
42662306a36Sopenharmony_ci};
42762306a36Sopenharmony_ci
42862306a36Sopenharmony_cistatic const struct attribute_group throttle_attr_grp = {
42962306a36Sopenharmony_ci	.name	= "throttle_stats",
43062306a36Sopenharmony_ci	.attrs	= throttle_attrs,
43162306a36Sopenharmony_ci};
43262306a36Sopenharmony_ci
43362306a36Sopenharmony_ci/* Helper routines */
43462306a36Sopenharmony_ci
43562306a36Sopenharmony_ci/* Access helpers to power mgt SPR */
43662306a36Sopenharmony_ci
43762306a36Sopenharmony_cistatic inline unsigned long get_pmspr(unsigned long sprn)
43862306a36Sopenharmony_ci{
43962306a36Sopenharmony_ci	switch (sprn) {
44062306a36Sopenharmony_ci	case SPRN_PMCR:
44162306a36Sopenharmony_ci		return mfspr(SPRN_PMCR);
44262306a36Sopenharmony_ci
44362306a36Sopenharmony_ci	case SPRN_PMICR:
44462306a36Sopenharmony_ci		return mfspr(SPRN_PMICR);
44562306a36Sopenharmony_ci
44662306a36Sopenharmony_ci	case SPRN_PMSR:
44762306a36Sopenharmony_ci		return mfspr(SPRN_PMSR);
44862306a36Sopenharmony_ci	}
44962306a36Sopenharmony_ci	BUG();
45062306a36Sopenharmony_ci}
45162306a36Sopenharmony_ci
45262306a36Sopenharmony_cistatic inline void set_pmspr(unsigned long sprn, unsigned long val)
45362306a36Sopenharmony_ci{
45462306a36Sopenharmony_ci	switch (sprn) {
45562306a36Sopenharmony_ci	case SPRN_PMCR:
45662306a36Sopenharmony_ci		mtspr(SPRN_PMCR, val);
45762306a36Sopenharmony_ci		return;
45862306a36Sopenharmony_ci
45962306a36Sopenharmony_ci	case SPRN_PMICR:
46062306a36Sopenharmony_ci		mtspr(SPRN_PMICR, val);
46162306a36Sopenharmony_ci		return;
46262306a36Sopenharmony_ci	}
46362306a36Sopenharmony_ci	BUG();
46462306a36Sopenharmony_ci}
46562306a36Sopenharmony_ci
46662306a36Sopenharmony_ci/*
46762306a36Sopenharmony_ci * Use objects of this type to query/update
46862306a36Sopenharmony_ci * pstates on a remote CPU via smp_call_function.
46962306a36Sopenharmony_ci */
47062306a36Sopenharmony_cistruct powernv_smp_call_data {
47162306a36Sopenharmony_ci	unsigned int freq;
47262306a36Sopenharmony_ci	u8 pstate_id;
47362306a36Sopenharmony_ci	u8 gpstate_id;
47462306a36Sopenharmony_ci};
47562306a36Sopenharmony_ci
47662306a36Sopenharmony_ci/*
47762306a36Sopenharmony_ci * powernv_read_cpu_freq: Reads the current frequency on this CPU.
47862306a36Sopenharmony_ci *
47962306a36Sopenharmony_ci * Called via smp_call_function.
48062306a36Sopenharmony_ci *
48162306a36Sopenharmony_ci * Note: The caller of the smp_call_function should pass an argument of
48262306a36Sopenharmony_ci * the type 'struct powernv_smp_call_data *' along with this function.
48362306a36Sopenharmony_ci *
48462306a36Sopenharmony_ci * The current frequency on this CPU will be returned via
48562306a36Sopenharmony_ci * ((struct powernv_smp_call_data *)arg)->freq;
48662306a36Sopenharmony_ci */
48762306a36Sopenharmony_cistatic void powernv_read_cpu_freq(void *arg)
48862306a36Sopenharmony_ci{
48962306a36Sopenharmony_ci	unsigned long pmspr_val;
49062306a36Sopenharmony_ci	struct powernv_smp_call_data *freq_data = arg;
49162306a36Sopenharmony_ci
49262306a36Sopenharmony_ci	pmspr_val = get_pmspr(SPRN_PMSR);
49362306a36Sopenharmony_ci	freq_data->pstate_id = extract_local_pstate(pmspr_val);
49462306a36Sopenharmony_ci	freq_data->freq = pstate_id_to_freq(freq_data->pstate_id);
49562306a36Sopenharmony_ci
49662306a36Sopenharmony_ci	pr_debug("cpu %d pmsr %016lX pstate_id 0x%x frequency %d kHz\n",
49762306a36Sopenharmony_ci		 raw_smp_processor_id(), pmspr_val, freq_data->pstate_id,
49862306a36Sopenharmony_ci		 freq_data->freq);
49962306a36Sopenharmony_ci}
50062306a36Sopenharmony_ci
50162306a36Sopenharmony_ci/*
50262306a36Sopenharmony_ci * powernv_cpufreq_get: Returns the CPU frequency as reported by the
50362306a36Sopenharmony_ci * firmware for CPU 'cpu'. This value is reported through the sysfs
50462306a36Sopenharmony_ci * file cpuinfo_cur_freq.
50562306a36Sopenharmony_ci */
50662306a36Sopenharmony_cistatic unsigned int powernv_cpufreq_get(unsigned int cpu)
50762306a36Sopenharmony_ci{
50862306a36Sopenharmony_ci	struct powernv_smp_call_data freq_data;
50962306a36Sopenharmony_ci
51062306a36Sopenharmony_ci	smp_call_function_any(cpu_sibling_mask(cpu), powernv_read_cpu_freq,
51162306a36Sopenharmony_ci			&freq_data, 1);
51262306a36Sopenharmony_ci
51362306a36Sopenharmony_ci	return freq_data.freq;
51462306a36Sopenharmony_ci}
51562306a36Sopenharmony_ci
51662306a36Sopenharmony_ci/*
51762306a36Sopenharmony_ci * set_pstate: Sets the pstate on this CPU.
51862306a36Sopenharmony_ci *
51962306a36Sopenharmony_ci * This is called via an smp_call_function.
52062306a36Sopenharmony_ci *
52162306a36Sopenharmony_ci * The caller must ensure that freq_data is of the type
52262306a36Sopenharmony_ci * (struct powernv_smp_call_data *) and the pstate_id which needs to be set
52362306a36Sopenharmony_ci * on this CPU should be present in freq_data->pstate_id.
52462306a36Sopenharmony_ci */
52562306a36Sopenharmony_cistatic void set_pstate(void *data)
52662306a36Sopenharmony_ci{
52762306a36Sopenharmony_ci	unsigned long val;
52862306a36Sopenharmony_ci	struct powernv_smp_call_data *freq_data = data;
52962306a36Sopenharmony_ci	unsigned long pstate_ul = freq_data->pstate_id;
53062306a36Sopenharmony_ci	unsigned long gpstate_ul = freq_data->gpstate_id;
53162306a36Sopenharmony_ci
53262306a36Sopenharmony_ci	val = get_pmspr(SPRN_PMCR);
53362306a36Sopenharmony_ci	val = val & 0x0000FFFFFFFFFFFFULL;
53462306a36Sopenharmony_ci
53562306a36Sopenharmony_ci	pstate_ul = pstate_ul & 0xFF;
53662306a36Sopenharmony_ci	gpstate_ul = gpstate_ul & 0xFF;
53762306a36Sopenharmony_ci
53862306a36Sopenharmony_ci	/* Set both global(bits 56..63) and local(bits 48..55) PStates */
53962306a36Sopenharmony_ci	val = val | (gpstate_ul << 56) | (pstate_ul << 48);
54062306a36Sopenharmony_ci
54162306a36Sopenharmony_ci	pr_debug("Setting cpu %d pmcr to %016lX\n",
54262306a36Sopenharmony_ci			raw_smp_processor_id(), val);
54362306a36Sopenharmony_ci	set_pmspr(SPRN_PMCR, val);
54462306a36Sopenharmony_ci}
54562306a36Sopenharmony_ci
54662306a36Sopenharmony_ci/*
54762306a36Sopenharmony_ci * get_nominal_index: Returns the index corresponding to the nominal
54862306a36Sopenharmony_ci * pstate in the cpufreq table
54962306a36Sopenharmony_ci */
55062306a36Sopenharmony_cistatic inline unsigned int get_nominal_index(void)
55162306a36Sopenharmony_ci{
55262306a36Sopenharmony_ci	return powernv_pstate_info.nominal;
55362306a36Sopenharmony_ci}
55462306a36Sopenharmony_ci
55562306a36Sopenharmony_cistatic void powernv_cpufreq_throttle_check(void *data)
55662306a36Sopenharmony_ci{
55762306a36Sopenharmony_ci	struct chip *chip;
55862306a36Sopenharmony_ci	unsigned int cpu = smp_processor_id();
55962306a36Sopenharmony_ci	unsigned long pmsr;
56062306a36Sopenharmony_ci	u8 pmsr_pmax;
56162306a36Sopenharmony_ci	unsigned int pmsr_pmax_idx;
56262306a36Sopenharmony_ci
56362306a36Sopenharmony_ci	pmsr = get_pmspr(SPRN_PMSR);
56462306a36Sopenharmony_ci	chip = this_cpu_read(chip_info);
56562306a36Sopenharmony_ci
56662306a36Sopenharmony_ci	/* Check for Pmax Capping */
56762306a36Sopenharmony_ci	pmsr_pmax = extract_max_pstate(pmsr);
56862306a36Sopenharmony_ci	pmsr_pmax_idx = pstate_to_idx(pmsr_pmax);
56962306a36Sopenharmony_ci	if (pmsr_pmax_idx != powernv_pstate_info.max) {
57062306a36Sopenharmony_ci		if (chip->throttled)
57162306a36Sopenharmony_ci			goto next;
57262306a36Sopenharmony_ci		chip->throttled = true;
57362306a36Sopenharmony_ci		if (pmsr_pmax_idx > powernv_pstate_info.nominal) {
57462306a36Sopenharmony_ci			pr_warn_once("CPU %d on Chip %u has Pmax(0x%x) reduced below that of nominal frequency(0x%x)\n",
57562306a36Sopenharmony_ci				     cpu, chip->id, pmsr_pmax,
57662306a36Sopenharmony_ci				     idx_to_pstate(powernv_pstate_info.nominal));
57762306a36Sopenharmony_ci			chip->throttle_sub_turbo++;
57862306a36Sopenharmony_ci		} else {
57962306a36Sopenharmony_ci			chip->throttle_turbo++;
58062306a36Sopenharmony_ci		}
58162306a36Sopenharmony_ci		trace_powernv_throttle(chip->id,
58262306a36Sopenharmony_ci				      throttle_reason[chip->throttle_reason],
58362306a36Sopenharmony_ci				      pmsr_pmax);
58462306a36Sopenharmony_ci	} else if (chip->throttled) {
58562306a36Sopenharmony_ci		chip->throttled = false;
58662306a36Sopenharmony_ci		trace_powernv_throttle(chip->id,
58762306a36Sopenharmony_ci				      throttle_reason[chip->throttle_reason],
58862306a36Sopenharmony_ci				      pmsr_pmax);
58962306a36Sopenharmony_ci	}
59062306a36Sopenharmony_ci
59162306a36Sopenharmony_ci	/* Check if Psafe_mode_active is set in PMSR. */
59262306a36Sopenharmony_cinext:
59362306a36Sopenharmony_ci	if (pmsr & PMSR_PSAFE_ENABLE) {
59462306a36Sopenharmony_ci		throttled = true;
59562306a36Sopenharmony_ci		pr_info("Pstate set to safe frequency\n");
59662306a36Sopenharmony_ci	}
59762306a36Sopenharmony_ci
59862306a36Sopenharmony_ci	/* Check if SPR_EM_DISABLE is set in PMSR */
59962306a36Sopenharmony_ci	if (pmsr & PMSR_SPR_EM_DISABLE) {
60062306a36Sopenharmony_ci		throttled = true;
60162306a36Sopenharmony_ci		pr_info("Frequency Control disabled from OS\n");
60262306a36Sopenharmony_ci	}
60362306a36Sopenharmony_ci
60462306a36Sopenharmony_ci	if (throttled) {
60562306a36Sopenharmony_ci		pr_info("PMSR = %16lx\n", pmsr);
60662306a36Sopenharmony_ci		pr_warn("CPU Frequency could be throttled\n");
60762306a36Sopenharmony_ci	}
60862306a36Sopenharmony_ci}
60962306a36Sopenharmony_ci
61062306a36Sopenharmony_ci/**
61162306a36Sopenharmony_ci * calc_global_pstate - Calculate global pstate
61262306a36Sopenharmony_ci * @elapsed_time:		Elapsed time in milliseconds
61362306a36Sopenharmony_ci * @local_pstate_idx:		New local pstate
61462306a36Sopenharmony_ci * @highest_lpstate_idx:	pstate from which its ramping down
61562306a36Sopenharmony_ci *
61662306a36Sopenharmony_ci * Finds the appropriate global pstate based on the pstate from which its
61762306a36Sopenharmony_ci * ramping down and the time elapsed in ramping down. It follows a quadratic
61862306a36Sopenharmony_ci * equation which ensures that it reaches ramping down to pmin in 5sec.
61962306a36Sopenharmony_ci */
62062306a36Sopenharmony_cistatic inline int calc_global_pstate(unsigned int elapsed_time,
62162306a36Sopenharmony_ci				     int highest_lpstate_idx,
62262306a36Sopenharmony_ci				     int local_pstate_idx)
62362306a36Sopenharmony_ci{
62462306a36Sopenharmony_ci	int index_diff;
62562306a36Sopenharmony_ci
62662306a36Sopenharmony_ci	/*
62762306a36Sopenharmony_ci	 * Using ramp_down_percent we get the percentage of rampdown
62862306a36Sopenharmony_ci	 * that we are expecting to be dropping. Difference between
62962306a36Sopenharmony_ci	 * highest_lpstate_idx and powernv_pstate_info.min will give a absolute
63062306a36Sopenharmony_ci	 * number of how many pstates we will drop eventually by the end of
63162306a36Sopenharmony_ci	 * 5 seconds, then just scale it get the number pstates to be dropped.
63262306a36Sopenharmony_ci	 */
63362306a36Sopenharmony_ci	index_diff =  ((int)ramp_down_percent(elapsed_time) *
63462306a36Sopenharmony_ci			(powernv_pstate_info.min - highest_lpstate_idx)) / 100;
63562306a36Sopenharmony_ci
63662306a36Sopenharmony_ci	/* Ensure that global pstate is >= to local pstate */
63762306a36Sopenharmony_ci	if (highest_lpstate_idx + index_diff >= local_pstate_idx)
63862306a36Sopenharmony_ci		return local_pstate_idx;
63962306a36Sopenharmony_ci	else
64062306a36Sopenharmony_ci		return highest_lpstate_idx + index_diff;
64162306a36Sopenharmony_ci}
64262306a36Sopenharmony_ci
64362306a36Sopenharmony_cistatic inline void  queue_gpstate_timer(struct global_pstate_info *gpstates)
64462306a36Sopenharmony_ci{
64562306a36Sopenharmony_ci	unsigned int timer_interval;
64662306a36Sopenharmony_ci
64762306a36Sopenharmony_ci	/*
64862306a36Sopenharmony_ci	 * Setting up timer to fire after GPSTATE_TIMER_INTERVAL ms, But
64962306a36Sopenharmony_ci	 * if it exceeds MAX_RAMP_DOWN_TIME ms for ramp down time.
65062306a36Sopenharmony_ci	 * Set timer such that it fires exactly at MAX_RAMP_DOWN_TIME
65162306a36Sopenharmony_ci	 * seconds of ramp down time.
65262306a36Sopenharmony_ci	 */
65362306a36Sopenharmony_ci	if ((gpstates->elapsed_time + GPSTATE_TIMER_INTERVAL)
65462306a36Sopenharmony_ci	     > MAX_RAMP_DOWN_TIME)
65562306a36Sopenharmony_ci		timer_interval = MAX_RAMP_DOWN_TIME - gpstates->elapsed_time;
65662306a36Sopenharmony_ci	else
65762306a36Sopenharmony_ci		timer_interval = GPSTATE_TIMER_INTERVAL;
65862306a36Sopenharmony_ci
65962306a36Sopenharmony_ci	mod_timer(&gpstates->timer, jiffies + msecs_to_jiffies(timer_interval));
66062306a36Sopenharmony_ci}
66162306a36Sopenharmony_ci
66262306a36Sopenharmony_ci/**
66362306a36Sopenharmony_ci * gpstate_timer_handler
66462306a36Sopenharmony_ci *
66562306a36Sopenharmony_ci * @t: Timer context used to fetch global pstate info struct
66662306a36Sopenharmony_ci *
66762306a36Sopenharmony_ci * This handler brings down the global pstate closer to the local pstate
66862306a36Sopenharmony_ci * according quadratic equation. Queues a new timer if it is still not equal
66962306a36Sopenharmony_ci * to local pstate
67062306a36Sopenharmony_ci */
67162306a36Sopenharmony_cistatic void gpstate_timer_handler(struct timer_list *t)
67262306a36Sopenharmony_ci{
67362306a36Sopenharmony_ci	struct global_pstate_info *gpstates = from_timer(gpstates, t, timer);
67462306a36Sopenharmony_ci	struct cpufreq_policy *policy = gpstates->policy;
67562306a36Sopenharmony_ci	int gpstate_idx, lpstate_idx;
67662306a36Sopenharmony_ci	unsigned long val;
67762306a36Sopenharmony_ci	unsigned int time_diff = jiffies_to_msecs(jiffies)
67862306a36Sopenharmony_ci					- gpstates->last_sampled_time;
67962306a36Sopenharmony_ci	struct powernv_smp_call_data freq_data;
68062306a36Sopenharmony_ci
68162306a36Sopenharmony_ci	if (!spin_trylock(&gpstates->gpstate_lock))
68262306a36Sopenharmony_ci		return;
68362306a36Sopenharmony_ci	/*
68462306a36Sopenharmony_ci	 * If the timer has migrated to the different cpu then bring
68562306a36Sopenharmony_ci	 * it back to one of the policy->cpus
68662306a36Sopenharmony_ci	 */
68762306a36Sopenharmony_ci	if (!cpumask_test_cpu(raw_smp_processor_id(), policy->cpus)) {
68862306a36Sopenharmony_ci		gpstates->timer.expires = jiffies + msecs_to_jiffies(1);
68962306a36Sopenharmony_ci		add_timer_on(&gpstates->timer, cpumask_first(policy->cpus));
69062306a36Sopenharmony_ci		spin_unlock(&gpstates->gpstate_lock);
69162306a36Sopenharmony_ci		return;
69262306a36Sopenharmony_ci	}
69362306a36Sopenharmony_ci
69462306a36Sopenharmony_ci	/*
69562306a36Sopenharmony_ci	 * If PMCR was last updated was using fast_swtich then
69662306a36Sopenharmony_ci	 * We may have wrong in gpstate->last_lpstate_idx
69762306a36Sopenharmony_ci	 * value. Hence, read from PMCR to get correct data.
69862306a36Sopenharmony_ci	 */
69962306a36Sopenharmony_ci	val = get_pmspr(SPRN_PMCR);
70062306a36Sopenharmony_ci	freq_data.gpstate_id = extract_global_pstate(val);
70162306a36Sopenharmony_ci	freq_data.pstate_id = extract_local_pstate(val);
70262306a36Sopenharmony_ci	if (freq_data.gpstate_id  == freq_data.pstate_id) {
70362306a36Sopenharmony_ci		reset_gpstates(policy);
70462306a36Sopenharmony_ci		spin_unlock(&gpstates->gpstate_lock);
70562306a36Sopenharmony_ci		return;
70662306a36Sopenharmony_ci	}
70762306a36Sopenharmony_ci
70862306a36Sopenharmony_ci	gpstates->last_sampled_time += time_diff;
70962306a36Sopenharmony_ci	gpstates->elapsed_time += time_diff;
71062306a36Sopenharmony_ci
71162306a36Sopenharmony_ci	if (gpstates->elapsed_time > MAX_RAMP_DOWN_TIME) {
71262306a36Sopenharmony_ci		gpstate_idx = pstate_to_idx(freq_data.pstate_id);
71362306a36Sopenharmony_ci		lpstate_idx = gpstate_idx;
71462306a36Sopenharmony_ci		reset_gpstates(policy);
71562306a36Sopenharmony_ci		gpstates->highest_lpstate_idx = gpstate_idx;
71662306a36Sopenharmony_ci	} else {
71762306a36Sopenharmony_ci		lpstate_idx = pstate_to_idx(freq_data.pstate_id);
71862306a36Sopenharmony_ci		gpstate_idx = calc_global_pstate(gpstates->elapsed_time,
71962306a36Sopenharmony_ci						 gpstates->highest_lpstate_idx,
72062306a36Sopenharmony_ci						 lpstate_idx);
72162306a36Sopenharmony_ci	}
72262306a36Sopenharmony_ci	freq_data.gpstate_id = idx_to_pstate(gpstate_idx);
72362306a36Sopenharmony_ci	gpstates->last_gpstate_idx = gpstate_idx;
72462306a36Sopenharmony_ci	gpstates->last_lpstate_idx = lpstate_idx;
72562306a36Sopenharmony_ci	/*
72662306a36Sopenharmony_ci	 * If local pstate is equal to global pstate, rampdown is over
72762306a36Sopenharmony_ci	 * So timer is not required to be queued.
72862306a36Sopenharmony_ci	 */
72962306a36Sopenharmony_ci	if (gpstate_idx != gpstates->last_lpstate_idx)
73062306a36Sopenharmony_ci		queue_gpstate_timer(gpstates);
73162306a36Sopenharmony_ci
73262306a36Sopenharmony_ci	set_pstate(&freq_data);
73362306a36Sopenharmony_ci	spin_unlock(&gpstates->gpstate_lock);
73462306a36Sopenharmony_ci}
73562306a36Sopenharmony_ci
73662306a36Sopenharmony_ci/*
73762306a36Sopenharmony_ci * powernv_cpufreq_target_index: Sets the frequency corresponding to
73862306a36Sopenharmony_ci * the cpufreq table entry indexed by new_index on the cpus in the
73962306a36Sopenharmony_ci * mask policy->cpus
74062306a36Sopenharmony_ci */
74162306a36Sopenharmony_cistatic int powernv_cpufreq_target_index(struct cpufreq_policy *policy,
74262306a36Sopenharmony_ci					unsigned int new_index)
74362306a36Sopenharmony_ci{
74462306a36Sopenharmony_ci	struct powernv_smp_call_data freq_data;
74562306a36Sopenharmony_ci	unsigned int cur_msec, gpstate_idx;
74662306a36Sopenharmony_ci	struct global_pstate_info *gpstates = policy->driver_data;
74762306a36Sopenharmony_ci
74862306a36Sopenharmony_ci	if (unlikely(rebooting) && new_index != get_nominal_index())
74962306a36Sopenharmony_ci		return 0;
75062306a36Sopenharmony_ci
75162306a36Sopenharmony_ci	if (!throttled) {
75262306a36Sopenharmony_ci		/* we don't want to be preempted while
75362306a36Sopenharmony_ci		 * checking if the CPU frequency has been throttled
75462306a36Sopenharmony_ci		 */
75562306a36Sopenharmony_ci		preempt_disable();
75662306a36Sopenharmony_ci		powernv_cpufreq_throttle_check(NULL);
75762306a36Sopenharmony_ci		preempt_enable();
75862306a36Sopenharmony_ci	}
75962306a36Sopenharmony_ci
76062306a36Sopenharmony_ci	cur_msec = jiffies_to_msecs(get_jiffies_64());
76162306a36Sopenharmony_ci
76262306a36Sopenharmony_ci	freq_data.pstate_id = idx_to_pstate(new_index);
76362306a36Sopenharmony_ci	if (!gpstates) {
76462306a36Sopenharmony_ci		freq_data.gpstate_id = freq_data.pstate_id;
76562306a36Sopenharmony_ci		goto no_gpstate;
76662306a36Sopenharmony_ci	}
76762306a36Sopenharmony_ci
76862306a36Sopenharmony_ci	spin_lock(&gpstates->gpstate_lock);
76962306a36Sopenharmony_ci
77062306a36Sopenharmony_ci	if (!gpstates->last_sampled_time) {
77162306a36Sopenharmony_ci		gpstate_idx = new_index;
77262306a36Sopenharmony_ci		gpstates->highest_lpstate_idx = new_index;
77362306a36Sopenharmony_ci		goto gpstates_done;
77462306a36Sopenharmony_ci	}
77562306a36Sopenharmony_ci
77662306a36Sopenharmony_ci	if (gpstates->last_gpstate_idx < new_index) {
77762306a36Sopenharmony_ci		gpstates->elapsed_time += cur_msec -
77862306a36Sopenharmony_ci						 gpstates->last_sampled_time;
77962306a36Sopenharmony_ci
78062306a36Sopenharmony_ci		/*
78162306a36Sopenharmony_ci		 * If its has been ramping down for more than MAX_RAMP_DOWN_TIME
78262306a36Sopenharmony_ci		 * we should be resetting all global pstate related data. Set it
78362306a36Sopenharmony_ci		 * equal to local pstate to start fresh.
78462306a36Sopenharmony_ci		 */
78562306a36Sopenharmony_ci		if (gpstates->elapsed_time > MAX_RAMP_DOWN_TIME) {
78662306a36Sopenharmony_ci			reset_gpstates(policy);
78762306a36Sopenharmony_ci			gpstates->highest_lpstate_idx = new_index;
78862306a36Sopenharmony_ci			gpstate_idx = new_index;
78962306a36Sopenharmony_ci		} else {
79062306a36Sopenharmony_ci		/* Elaspsed_time is less than 5 seconds, continue to rampdown */
79162306a36Sopenharmony_ci			gpstate_idx = calc_global_pstate(gpstates->elapsed_time,
79262306a36Sopenharmony_ci							 gpstates->highest_lpstate_idx,
79362306a36Sopenharmony_ci							 new_index);
79462306a36Sopenharmony_ci		}
79562306a36Sopenharmony_ci	} else {
79662306a36Sopenharmony_ci		reset_gpstates(policy);
79762306a36Sopenharmony_ci		gpstates->highest_lpstate_idx = new_index;
79862306a36Sopenharmony_ci		gpstate_idx = new_index;
79962306a36Sopenharmony_ci	}
80062306a36Sopenharmony_ci
80162306a36Sopenharmony_ci	/*
80262306a36Sopenharmony_ci	 * If local pstate is equal to global pstate, rampdown is over
80362306a36Sopenharmony_ci	 * So timer is not required to be queued.
80462306a36Sopenharmony_ci	 */
80562306a36Sopenharmony_ci	if (gpstate_idx != new_index)
80662306a36Sopenharmony_ci		queue_gpstate_timer(gpstates);
80762306a36Sopenharmony_ci	else
80862306a36Sopenharmony_ci		del_timer_sync(&gpstates->timer);
80962306a36Sopenharmony_ci
81062306a36Sopenharmony_cigpstates_done:
81162306a36Sopenharmony_ci	freq_data.gpstate_id = idx_to_pstate(gpstate_idx);
81262306a36Sopenharmony_ci	gpstates->last_sampled_time = cur_msec;
81362306a36Sopenharmony_ci	gpstates->last_gpstate_idx = gpstate_idx;
81462306a36Sopenharmony_ci	gpstates->last_lpstate_idx = new_index;
81562306a36Sopenharmony_ci
81662306a36Sopenharmony_ci	spin_unlock(&gpstates->gpstate_lock);
81762306a36Sopenharmony_ci
81862306a36Sopenharmony_cino_gpstate:
81962306a36Sopenharmony_ci	/*
82062306a36Sopenharmony_ci	 * Use smp_call_function to send IPI and execute the
82162306a36Sopenharmony_ci	 * mtspr on target CPU.  We could do that without IPI
82262306a36Sopenharmony_ci	 * if current CPU is within policy->cpus (core)
82362306a36Sopenharmony_ci	 */
82462306a36Sopenharmony_ci	smp_call_function_any(policy->cpus, set_pstate, &freq_data, 1);
82562306a36Sopenharmony_ci	return 0;
82662306a36Sopenharmony_ci}
82762306a36Sopenharmony_ci
82862306a36Sopenharmony_cistatic int powernv_cpufreq_cpu_init(struct cpufreq_policy *policy)
82962306a36Sopenharmony_ci{
83062306a36Sopenharmony_ci	int base, i;
83162306a36Sopenharmony_ci	struct kernfs_node *kn;
83262306a36Sopenharmony_ci	struct global_pstate_info *gpstates;
83362306a36Sopenharmony_ci
83462306a36Sopenharmony_ci	base = cpu_first_thread_sibling(policy->cpu);
83562306a36Sopenharmony_ci
83662306a36Sopenharmony_ci	for (i = 0; i < threads_per_core; i++)
83762306a36Sopenharmony_ci		cpumask_set_cpu(base + i, policy->cpus);
83862306a36Sopenharmony_ci
83962306a36Sopenharmony_ci	kn = kernfs_find_and_get(policy->kobj.sd, throttle_attr_grp.name);
84062306a36Sopenharmony_ci	if (!kn) {
84162306a36Sopenharmony_ci		int ret;
84262306a36Sopenharmony_ci
84362306a36Sopenharmony_ci		ret = sysfs_create_group(&policy->kobj, &throttle_attr_grp);
84462306a36Sopenharmony_ci		if (ret) {
84562306a36Sopenharmony_ci			pr_info("Failed to create throttle stats directory for cpu %d\n",
84662306a36Sopenharmony_ci				policy->cpu);
84762306a36Sopenharmony_ci			return ret;
84862306a36Sopenharmony_ci		}
84962306a36Sopenharmony_ci	} else {
85062306a36Sopenharmony_ci		kernfs_put(kn);
85162306a36Sopenharmony_ci	}
85262306a36Sopenharmony_ci
85362306a36Sopenharmony_ci	policy->freq_table = powernv_freqs;
85462306a36Sopenharmony_ci	policy->fast_switch_possible = true;
85562306a36Sopenharmony_ci
85662306a36Sopenharmony_ci	if (pvr_version_is(PVR_POWER9))
85762306a36Sopenharmony_ci		return 0;
85862306a36Sopenharmony_ci
85962306a36Sopenharmony_ci	/* Initialise Gpstate ramp-down timer only on POWER8 */
86062306a36Sopenharmony_ci	gpstates =  kzalloc(sizeof(*gpstates), GFP_KERNEL);
86162306a36Sopenharmony_ci	if (!gpstates)
86262306a36Sopenharmony_ci		return -ENOMEM;
86362306a36Sopenharmony_ci
86462306a36Sopenharmony_ci	policy->driver_data = gpstates;
86562306a36Sopenharmony_ci
86662306a36Sopenharmony_ci	/* initialize timer */
86762306a36Sopenharmony_ci	gpstates->policy = policy;
86862306a36Sopenharmony_ci	timer_setup(&gpstates->timer, gpstate_timer_handler,
86962306a36Sopenharmony_ci		    TIMER_PINNED | TIMER_DEFERRABLE);
87062306a36Sopenharmony_ci	gpstates->timer.expires = jiffies +
87162306a36Sopenharmony_ci				msecs_to_jiffies(GPSTATE_TIMER_INTERVAL);
87262306a36Sopenharmony_ci	spin_lock_init(&gpstates->gpstate_lock);
87362306a36Sopenharmony_ci
87462306a36Sopenharmony_ci	return 0;
87562306a36Sopenharmony_ci}
87662306a36Sopenharmony_ci
87762306a36Sopenharmony_cistatic int powernv_cpufreq_cpu_exit(struct cpufreq_policy *policy)
87862306a36Sopenharmony_ci{
87962306a36Sopenharmony_ci	struct powernv_smp_call_data freq_data;
88062306a36Sopenharmony_ci	struct global_pstate_info *gpstates = policy->driver_data;
88162306a36Sopenharmony_ci
88262306a36Sopenharmony_ci	freq_data.pstate_id = idx_to_pstate(powernv_pstate_info.min);
88362306a36Sopenharmony_ci	freq_data.gpstate_id = idx_to_pstate(powernv_pstate_info.min);
88462306a36Sopenharmony_ci	smp_call_function_single(policy->cpu, set_pstate, &freq_data, 1);
88562306a36Sopenharmony_ci	if (gpstates)
88662306a36Sopenharmony_ci		del_timer_sync(&gpstates->timer);
88762306a36Sopenharmony_ci
88862306a36Sopenharmony_ci	kfree(policy->driver_data);
88962306a36Sopenharmony_ci
89062306a36Sopenharmony_ci	return 0;
89162306a36Sopenharmony_ci}
89262306a36Sopenharmony_ci
89362306a36Sopenharmony_cistatic int powernv_cpufreq_reboot_notifier(struct notifier_block *nb,
89462306a36Sopenharmony_ci				unsigned long action, void *unused)
89562306a36Sopenharmony_ci{
89662306a36Sopenharmony_ci	int cpu;
89762306a36Sopenharmony_ci	struct cpufreq_policy *cpu_policy;
89862306a36Sopenharmony_ci
89962306a36Sopenharmony_ci	rebooting = true;
90062306a36Sopenharmony_ci	for_each_online_cpu(cpu) {
90162306a36Sopenharmony_ci		cpu_policy = cpufreq_cpu_get(cpu);
90262306a36Sopenharmony_ci		if (!cpu_policy)
90362306a36Sopenharmony_ci			continue;
90462306a36Sopenharmony_ci		powernv_cpufreq_target_index(cpu_policy, get_nominal_index());
90562306a36Sopenharmony_ci		cpufreq_cpu_put(cpu_policy);
90662306a36Sopenharmony_ci	}
90762306a36Sopenharmony_ci
90862306a36Sopenharmony_ci	return NOTIFY_DONE;
90962306a36Sopenharmony_ci}
91062306a36Sopenharmony_ci
91162306a36Sopenharmony_cistatic struct notifier_block powernv_cpufreq_reboot_nb = {
91262306a36Sopenharmony_ci	.notifier_call = powernv_cpufreq_reboot_notifier,
91362306a36Sopenharmony_ci};
91462306a36Sopenharmony_ci
91562306a36Sopenharmony_cistatic void powernv_cpufreq_work_fn(struct work_struct *work)
91662306a36Sopenharmony_ci{
91762306a36Sopenharmony_ci	struct chip *chip = container_of(work, struct chip, throttle);
91862306a36Sopenharmony_ci	struct cpufreq_policy *policy;
91962306a36Sopenharmony_ci	unsigned int cpu;
92062306a36Sopenharmony_ci	cpumask_t mask;
92162306a36Sopenharmony_ci
92262306a36Sopenharmony_ci	cpus_read_lock();
92362306a36Sopenharmony_ci	cpumask_and(&mask, &chip->mask, cpu_online_mask);
92462306a36Sopenharmony_ci	smp_call_function_any(&mask,
92562306a36Sopenharmony_ci			      powernv_cpufreq_throttle_check, NULL, 0);
92662306a36Sopenharmony_ci
92762306a36Sopenharmony_ci	if (!chip->restore)
92862306a36Sopenharmony_ci		goto out;
92962306a36Sopenharmony_ci
93062306a36Sopenharmony_ci	chip->restore = false;
93162306a36Sopenharmony_ci	for_each_cpu(cpu, &mask) {
93262306a36Sopenharmony_ci		int index;
93362306a36Sopenharmony_ci
93462306a36Sopenharmony_ci		policy = cpufreq_cpu_get(cpu);
93562306a36Sopenharmony_ci		if (!policy)
93662306a36Sopenharmony_ci			continue;
93762306a36Sopenharmony_ci		index = cpufreq_table_find_index_c(policy, policy->cur, false);
93862306a36Sopenharmony_ci		powernv_cpufreq_target_index(policy, index);
93962306a36Sopenharmony_ci		cpumask_andnot(&mask, &mask, policy->cpus);
94062306a36Sopenharmony_ci		cpufreq_cpu_put(policy);
94162306a36Sopenharmony_ci	}
94262306a36Sopenharmony_ciout:
94362306a36Sopenharmony_ci	cpus_read_unlock();
94462306a36Sopenharmony_ci}
94562306a36Sopenharmony_ci
94662306a36Sopenharmony_cistatic int powernv_cpufreq_occ_msg(struct notifier_block *nb,
94762306a36Sopenharmony_ci				   unsigned long msg_type, void *_msg)
94862306a36Sopenharmony_ci{
94962306a36Sopenharmony_ci	struct opal_msg *msg = _msg;
95062306a36Sopenharmony_ci	struct opal_occ_msg omsg;
95162306a36Sopenharmony_ci	int i;
95262306a36Sopenharmony_ci
95362306a36Sopenharmony_ci	if (msg_type != OPAL_MSG_OCC)
95462306a36Sopenharmony_ci		return 0;
95562306a36Sopenharmony_ci
95662306a36Sopenharmony_ci	omsg.type = be64_to_cpu(msg->params[0]);
95762306a36Sopenharmony_ci
95862306a36Sopenharmony_ci	switch (omsg.type) {
95962306a36Sopenharmony_ci	case OCC_RESET:
96062306a36Sopenharmony_ci		occ_reset = true;
96162306a36Sopenharmony_ci		pr_info("OCC (On Chip Controller - enforces hard thermal/power limits) Resetting\n");
96262306a36Sopenharmony_ci		/*
96362306a36Sopenharmony_ci		 * powernv_cpufreq_throttle_check() is called in
96462306a36Sopenharmony_ci		 * target() callback which can detect the throttle state
96562306a36Sopenharmony_ci		 * for governors like ondemand.
96662306a36Sopenharmony_ci		 * But static governors will not call target() often thus
96762306a36Sopenharmony_ci		 * report throttling here.
96862306a36Sopenharmony_ci		 */
96962306a36Sopenharmony_ci		if (!throttled) {
97062306a36Sopenharmony_ci			throttled = true;
97162306a36Sopenharmony_ci			pr_warn("CPU frequency is throttled for duration\n");
97262306a36Sopenharmony_ci		}
97362306a36Sopenharmony_ci
97462306a36Sopenharmony_ci		break;
97562306a36Sopenharmony_ci	case OCC_LOAD:
97662306a36Sopenharmony_ci		pr_info("OCC Loading, CPU frequency is throttled until OCC is started\n");
97762306a36Sopenharmony_ci		break;
97862306a36Sopenharmony_ci	case OCC_THROTTLE:
97962306a36Sopenharmony_ci		omsg.chip = be64_to_cpu(msg->params[1]);
98062306a36Sopenharmony_ci		omsg.throttle_status = be64_to_cpu(msg->params[2]);
98162306a36Sopenharmony_ci
98262306a36Sopenharmony_ci		if (occ_reset) {
98362306a36Sopenharmony_ci			occ_reset = false;
98462306a36Sopenharmony_ci			throttled = false;
98562306a36Sopenharmony_ci			pr_info("OCC Active, CPU frequency is no longer throttled\n");
98662306a36Sopenharmony_ci
98762306a36Sopenharmony_ci			for (i = 0; i < nr_chips; i++) {
98862306a36Sopenharmony_ci				chips[i].restore = true;
98962306a36Sopenharmony_ci				schedule_work(&chips[i].throttle);
99062306a36Sopenharmony_ci			}
99162306a36Sopenharmony_ci
99262306a36Sopenharmony_ci			return 0;
99362306a36Sopenharmony_ci		}
99462306a36Sopenharmony_ci
99562306a36Sopenharmony_ci		for (i = 0; i < nr_chips; i++)
99662306a36Sopenharmony_ci			if (chips[i].id == omsg.chip)
99762306a36Sopenharmony_ci				break;
99862306a36Sopenharmony_ci
99962306a36Sopenharmony_ci		if (omsg.throttle_status >= 0 &&
100062306a36Sopenharmony_ci		    omsg.throttle_status <= OCC_MAX_THROTTLE_STATUS) {
100162306a36Sopenharmony_ci			chips[i].throttle_reason = omsg.throttle_status;
100262306a36Sopenharmony_ci			chips[i].reason[omsg.throttle_status]++;
100362306a36Sopenharmony_ci		}
100462306a36Sopenharmony_ci
100562306a36Sopenharmony_ci		if (!omsg.throttle_status)
100662306a36Sopenharmony_ci			chips[i].restore = true;
100762306a36Sopenharmony_ci
100862306a36Sopenharmony_ci		schedule_work(&chips[i].throttle);
100962306a36Sopenharmony_ci	}
101062306a36Sopenharmony_ci	return 0;
101162306a36Sopenharmony_ci}
101262306a36Sopenharmony_ci
101362306a36Sopenharmony_cistatic struct notifier_block powernv_cpufreq_opal_nb = {
101462306a36Sopenharmony_ci	.notifier_call	= powernv_cpufreq_occ_msg,
101562306a36Sopenharmony_ci	.next		= NULL,
101662306a36Sopenharmony_ci	.priority	= 0,
101762306a36Sopenharmony_ci};
101862306a36Sopenharmony_ci
101962306a36Sopenharmony_cistatic unsigned int powernv_fast_switch(struct cpufreq_policy *policy,
102062306a36Sopenharmony_ci					unsigned int target_freq)
102162306a36Sopenharmony_ci{
102262306a36Sopenharmony_ci	int index;
102362306a36Sopenharmony_ci	struct powernv_smp_call_data freq_data;
102462306a36Sopenharmony_ci
102562306a36Sopenharmony_ci	index = cpufreq_table_find_index_dl(policy, target_freq, false);
102662306a36Sopenharmony_ci	freq_data.pstate_id = powernv_freqs[index].driver_data;
102762306a36Sopenharmony_ci	freq_data.gpstate_id = powernv_freqs[index].driver_data;
102862306a36Sopenharmony_ci	set_pstate(&freq_data);
102962306a36Sopenharmony_ci
103062306a36Sopenharmony_ci	return powernv_freqs[index].frequency;
103162306a36Sopenharmony_ci}
103262306a36Sopenharmony_ci
103362306a36Sopenharmony_cistatic struct cpufreq_driver powernv_cpufreq_driver = {
103462306a36Sopenharmony_ci	.name		= "powernv-cpufreq",
103562306a36Sopenharmony_ci	.flags		= CPUFREQ_CONST_LOOPS,
103662306a36Sopenharmony_ci	.init		= powernv_cpufreq_cpu_init,
103762306a36Sopenharmony_ci	.exit		= powernv_cpufreq_cpu_exit,
103862306a36Sopenharmony_ci	.verify		= cpufreq_generic_frequency_table_verify,
103962306a36Sopenharmony_ci	.target_index	= powernv_cpufreq_target_index,
104062306a36Sopenharmony_ci	.fast_switch	= powernv_fast_switch,
104162306a36Sopenharmony_ci	.get		= powernv_cpufreq_get,
104262306a36Sopenharmony_ci	.attr		= powernv_cpu_freq_attr,
104362306a36Sopenharmony_ci};
104462306a36Sopenharmony_ci
104562306a36Sopenharmony_cistatic int init_chip_info(void)
104662306a36Sopenharmony_ci{
104762306a36Sopenharmony_ci	unsigned int *chip;
104862306a36Sopenharmony_ci	unsigned int cpu, i;
104962306a36Sopenharmony_ci	unsigned int prev_chip_id = UINT_MAX;
105062306a36Sopenharmony_ci	cpumask_t *chip_cpu_mask;
105162306a36Sopenharmony_ci	int ret = 0;
105262306a36Sopenharmony_ci
105362306a36Sopenharmony_ci	chip = kcalloc(num_possible_cpus(), sizeof(*chip), GFP_KERNEL);
105462306a36Sopenharmony_ci	if (!chip)
105562306a36Sopenharmony_ci		return -ENOMEM;
105662306a36Sopenharmony_ci
105762306a36Sopenharmony_ci	/* Allocate a chip cpu mask large enough to fit mask for all chips */
105862306a36Sopenharmony_ci	chip_cpu_mask = kcalloc(MAX_NR_CHIPS, sizeof(cpumask_t), GFP_KERNEL);
105962306a36Sopenharmony_ci	if (!chip_cpu_mask) {
106062306a36Sopenharmony_ci		ret = -ENOMEM;
106162306a36Sopenharmony_ci		goto free_and_return;
106262306a36Sopenharmony_ci	}
106362306a36Sopenharmony_ci
106462306a36Sopenharmony_ci	for_each_possible_cpu(cpu) {
106562306a36Sopenharmony_ci		unsigned int id = cpu_to_chip_id(cpu);
106662306a36Sopenharmony_ci
106762306a36Sopenharmony_ci		if (prev_chip_id != id) {
106862306a36Sopenharmony_ci			prev_chip_id = id;
106962306a36Sopenharmony_ci			chip[nr_chips++] = id;
107062306a36Sopenharmony_ci		}
107162306a36Sopenharmony_ci		cpumask_set_cpu(cpu, &chip_cpu_mask[nr_chips-1]);
107262306a36Sopenharmony_ci	}
107362306a36Sopenharmony_ci
107462306a36Sopenharmony_ci	chips = kcalloc(nr_chips, sizeof(struct chip), GFP_KERNEL);
107562306a36Sopenharmony_ci	if (!chips) {
107662306a36Sopenharmony_ci		ret = -ENOMEM;
107762306a36Sopenharmony_ci		goto out_free_chip_cpu_mask;
107862306a36Sopenharmony_ci	}
107962306a36Sopenharmony_ci
108062306a36Sopenharmony_ci	for (i = 0; i < nr_chips; i++) {
108162306a36Sopenharmony_ci		chips[i].id = chip[i];
108262306a36Sopenharmony_ci		cpumask_copy(&chips[i].mask, &chip_cpu_mask[i]);
108362306a36Sopenharmony_ci		INIT_WORK(&chips[i].throttle, powernv_cpufreq_work_fn);
108462306a36Sopenharmony_ci		for_each_cpu(cpu, &chips[i].mask)
108562306a36Sopenharmony_ci			per_cpu(chip_info, cpu) =  &chips[i];
108662306a36Sopenharmony_ci	}
108762306a36Sopenharmony_ci
108862306a36Sopenharmony_ciout_free_chip_cpu_mask:
108962306a36Sopenharmony_ci	kfree(chip_cpu_mask);
109062306a36Sopenharmony_cifree_and_return:
109162306a36Sopenharmony_ci	kfree(chip);
109262306a36Sopenharmony_ci	return ret;
109362306a36Sopenharmony_ci}
109462306a36Sopenharmony_ci
109562306a36Sopenharmony_cistatic inline void clean_chip_info(void)
109662306a36Sopenharmony_ci{
109762306a36Sopenharmony_ci	int i;
109862306a36Sopenharmony_ci
109962306a36Sopenharmony_ci	/* flush any pending work items */
110062306a36Sopenharmony_ci	if (chips)
110162306a36Sopenharmony_ci		for (i = 0; i < nr_chips; i++)
110262306a36Sopenharmony_ci			cancel_work_sync(&chips[i].throttle);
110362306a36Sopenharmony_ci	kfree(chips);
110462306a36Sopenharmony_ci}
110562306a36Sopenharmony_ci
110662306a36Sopenharmony_cistatic inline void unregister_all_notifiers(void)
110762306a36Sopenharmony_ci{
110862306a36Sopenharmony_ci	opal_message_notifier_unregister(OPAL_MSG_OCC,
110962306a36Sopenharmony_ci					 &powernv_cpufreq_opal_nb);
111062306a36Sopenharmony_ci	unregister_reboot_notifier(&powernv_cpufreq_reboot_nb);
111162306a36Sopenharmony_ci}
111262306a36Sopenharmony_ci
111362306a36Sopenharmony_cistatic int __init powernv_cpufreq_init(void)
111462306a36Sopenharmony_ci{
111562306a36Sopenharmony_ci	int rc = 0;
111662306a36Sopenharmony_ci
111762306a36Sopenharmony_ci	/* Don't probe on pseries (guest) platforms */
111862306a36Sopenharmony_ci	if (!firmware_has_feature(FW_FEATURE_OPAL))
111962306a36Sopenharmony_ci		return -ENODEV;
112062306a36Sopenharmony_ci
112162306a36Sopenharmony_ci	/* Discover pstates from device tree and init */
112262306a36Sopenharmony_ci	rc = init_powernv_pstates();
112362306a36Sopenharmony_ci	if (rc)
112462306a36Sopenharmony_ci		goto out;
112562306a36Sopenharmony_ci
112662306a36Sopenharmony_ci	/* Populate chip info */
112762306a36Sopenharmony_ci	rc = init_chip_info();
112862306a36Sopenharmony_ci	if (rc)
112962306a36Sopenharmony_ci		goto out;
113062306a36Sopenharmony_ci
113162306a36Sopenharmony_ci	if (powernv_pstate_info.wof_enabled)
113262306a36Sopenharmony_ci		powernv_cpufreq_driver.boost_enabled = true;
113362306a36Sopenharmony_ci	else
113462306a36Sopenharmony_ci		powernv_cpu_freq_attr[SCALING_BOOST_FREQS_ATTR_INDEX] = NULL;
113562306a36Sopenharmony_ci
113662306a36Sopenharmony_ci	rc = cpufreq_register_driver(&powernv_cpufreq_driver);
113762306a36Sopenharmony_ci	if (rc) {
113862306a36Sopenharmony_ci		pr_info("Failed to register the cpufreq driver (%d)\n", rc);
113962306a36Sopenharmony_ci		goto cleanup;
114062306a36Sopenharmony_ci	}
114162306a36Sopenharmony_ci
114262306a36Sopenharmony_ci	if (powernv_pstate_info.wof_enabled)
114362306a36Sopenharmony_ci		cpufreq_enable_boost_support();
114462306a36Sopenharmony_ci
114562306a36Sopenharmony_ci	register_reboot_notifier(&powernv_cpufreq_reboot_nb);
114662306a36Sopenharmony_ci	opal_message_notifier_register(OPAL_MSG_OCC, &powernv_cpufreq_opal_nb);
114762306a36Sopenharmony_ci
114862306a36Sopenharmony_ci	return 0;
114962306a36Sopenharmony_cicleanup:
115062306a36Sopenharmony_ci	clean_chip_info();
115162306a36Sopenharmony_ciout:
115262306a36Sopenharmony_ci	pr_info("Platform driver disabled. System does not support PState control\n");
115362306a36Sopenharmony_ci	return rc;
115462306a36Sopenharmony_ci}
115562306a36Sopenharmony_cimodule_init(powernv_cpufreq_init);
115662306a36Sopenharmony_ci
115762306a36Sopenharmony_cistatic void __exit powernv_cpufreq_exit(void)
115862306a36Sopenharmony_ci{
115962306a36Sopenharmony_ci	cpufreq_unregister_driver(&powernv_cpufreq_driver);
116062306a36Sopenharmony_ci	unregister_all_notifiers();
116162306a36Sopenharmony_ci	clean_chip_info();
116262306a36Sopenharmony_ci}
116362306a36Sopenharmony_cimodule_exit(powernv_cpufreq_exit);
116462306a36Sopenharmony_ci
116562306a36Sopenharmony_ciMODULE_LICENSE("GPL");
116662306a36Sopenharmony_ciMODULE_AUTHOR("Vaidyanathan Srinivasan <svaidy at linux.vnet.ibm.com>");
1167