162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Copyright (C) 2013 Red Hat 462306a36Sopenharmony_ci * Author: Rob Clark <robdclark@gmail.com> 562306a36Sopenharmony_ci */ 662306a36Sopenharmony_ci 762306a36Sopenharmony_ci#include "msm_gpu.h" 862306a36Sopenharmony_ci#include "msm_gpu_trace.h" 962306a36Sopenharmony_ci 1062306a36Sopenharmony_ci#include <linux/devfreq.h> 1162306a36Sopenharmony_ci#include <linux/devfreq_cooling.h> 1262306a36Sopenharmony_ci#include <linux/math64.h> 1362306a36Sopenharmony_ci#include <linux/units.h> 1462306a36Sopenharmony_ci 1562306a36Sopenharmony_ci/* 1662306a36Sopenharmony_ci * Power Management: 1762306a36Sopenharmony_ci */ 1862306a36Sopenharmony_ci 1962306a36Sopenharmony_cistatic int msm_devfreq_target(struct device *dev, unsigned long *freq, 2062306a36Sopenharmony_ci u32 flags) 2162306a36Sopenharmony_ci{ 2262306a36Sopenharmony_ci struct msm_gpu *gpu = dev_to_gpu(dev); 2362306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 2462306a36Sopenharmony_ci struct dev_pm_opp *opp; 2562306a36Sopenharmony_ci 2662306a36Sopenharmony_ci /* 2762306a36Sopenharmony_ci * Note that devfreq_recommended_opp() can modify the freq 2862306a36Sopenharmony_ci * to something that actually is in the opp table: 2962306a36Sopenharmony_ci */ 3062306a36Sopenharmony_ci opp = devfreq_recommended_opp(dev, freq, flags); 3162306a36Sopenharmony_ci if (IS_ERR(opp)) 3262306a36Sopenharmony_ci return PTR_ERR(opp); 3362306a36Sopenharmony_ci 3462306a36Sopenharmony_ci trace_msm_gpu_freq_change(dev_pm_opp_get_freq(opp)); 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ci /* 3762306a36Sopenharmony_ci * If the GPU is idle, devfreq is not aware, so just stash 3862306a36Sopenharmony_ci * the new target freq (to use when we return to active) 3962306a36Sopenharmony_ci */ 4062306a36Sopenharmony_ci if (df->idle_freq) { 4162306a36Sopenharmony_ci df->idle_freq = *freq; 4262306a36Sopenharmony_ci dev_pm_opp_put(opp); 4362306a36Sopenharmony_ci return 0; 4462306a36Sopenharmony_ci } 4562306a36Sopenharmony_ci 4662306a36Sopenharmony_ci if (gpu->funcs->gpu_set_freq) { 4762306a36Sopenharmony_ci mutex_lock(&df->lock); 4862306a36Sopenharmony_ci gpu->funcs->gpu_set_freq(gpu, opp, df->suspended); 4962306a36Sopenharmony_ci mutex_unlock(&df->lock); 5062306a36Sopenharmony_ci } else { 5162306a36Sopenharmony_ci dev_pm_opp_set_rate(dev, *freq); 5262306a36Sopenharmony_ci } 5362306a36Sopenharmony_ci 5462306a36Sopenharmony_ci dev_pm_opp_put(opp); 5562306a36Sopenharmony_ci 5662306a36Sopenharmony_ci return 0; 5762306a36Sopenharmony_ci} 5862306a36Sopenharmony_ci 5962306a36Sopenharmony_cistatic unsigned long get_freq(struct msm_gpu *gpu) 6062306a36Sopenharmony_ci{ 6162306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 6262306a36Sopenharmony_ci 6362306a36Sopenharmony_ci /* 6462306a36Sopenharmony_ci * If the GPU is idle, use the shadow/saved freq to avoid 6562306a36Sopenharmony_ci * confusing devfreq (which is unaware that we are switching 6662306a36Sopenharmony_ci * to lowest freq until the device is active again) 6762306a36Sopenharmony_ci */ 6862306a36Sopenharmony_ci if (df->idle_freq) 6962306a36Sopenharmony_ci return df->idle_freq; 7062306a36Sopenharmony_ci 7162306a36Sopenharmony_ci if (gpu->funcs->gpu_get_freq) 7262306a36Sopenharmony_ci return gpu->funcs->gpu_get_freq(gpu); 7362306a36Sopenharmony_ci 7462306a36Sopenharmony_ci return clk_get_rate(gpu->core_clk); 7562306a36Sopenharmony_ci} 7662306a36Sopenharmony_ci 7762306a36Sopenharmony_cistatic int msm_devfreq_get_dev_status(struct device *dev, 7862306a36Sopenharmony_ci struct devfreq_dev_status *status) 7962306a36Sopenharmony_ci{ 8062306a36Sopenharmony_ci struct msm_gpu *gpu = dev_to_gpu(dev); 8162306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 8262306a36Sopenharmony_ci u64 busy_cycles, busy_time; 8362306a36Sopenharmony_ci unsigned long sample_rate; 8462306a36Sopenharmony_ci ktime_t time; 8562306a36Sopenharmony_ci 8662306a36Sopenharmony_ci mutex_lock(&df->lock); 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci status->current_frequency = get_freq(gpu); 8962306a36Sopenharmony_ci time = ktime_get(); 9062306a36Sopenharmony_ci status->total_time = ktime_us_delta(time, df->time); 9162306a36Sopenharmony_ci df->time = time; 9262306a36Sopenharmony_ci 9362306a36Sopenharmony_ci if (df->suspended) { 9462306a36Sopenharmony_ci mutex_unlock(&df->lock); 9562306a36Sopenharmony_ci status->busy_time = 0; 9662306a36Sopenharmony_ci return 0; 9762306a36Sopenharmony_ci } 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci busy_cycles = gpu->funcs->gpu_busy(gpu, &sample_rate); 10062306a36Sopenharmony_ci busy_time = busy_cycles - df->busy_cycles; 10162306a36Sopenharmony_ci df->busy_cycles = busy_cycles; 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_ci mutex_unlock(&df->lock); 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_ci busy_time *= USEC_PER_SEC; 10662306a36Sopenharmony_ci busy_time = div64_ul(busy_time, sample_rate); 10762306a36Sopenharmony_ci if (WARN_ON(busy_time > ~0LU)) 10862306a36Sopenharmony_ci busy_time = ~0LU; 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci status->busy_time = busy_time; 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_ci return 0; 11362306a36Sopenharmony_ci} 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_cistatic int msm_devfreq_get_cur_freq(struct device *dev, unsigned long *freq) 11662306a36Sopenharmony_ci{ 11762306a36Sopenharmony_ci *freq = get_freq(dev_to_gpu(dev)); 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci return 0; 12062306a36Sopenharmony_ci} 12162306a36Sopenharmony_ci 12262306a36Sopenharmony_cistatic struct devfreq_dev_profile msm_devfreq_profile = { 12362306a36Sopenharmony_ci .timer = DEVFREQ_TIMER_DELAYED, 12462306a36Sopenharmony_ci .polling_ms = 50, 12562306a36Sopenharmony_ci .target = msm_devfreq_target, 12662306a36Sopenharmony_ci .get_dev_status = msm_devfreq_get_dev_status, 12762306a36Sopenharmony_ci .get_cur_freq = msm_devfreq_get_cur_freq, 12862306a36Sopenharmony_ci}; 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_cistatic void msm_devfreq_boost_work(struct kthread_work *work); 13162306a36Sopenharmony_cistatic void msm_devfreq_idle_work(struct kthread_work *work); 13262306a36Sopenharmony_ci 13362306a36Sopenharmony_cistatic bool has_devfreq(struct msm_gpu *gpu) 13462306a36Sopenharmony_ci{ 13562306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 13662306a36Sopenharmony_ci return !!df->devfreq; 13762306a36Sopenharmony_ci} 13862306a36Sopenharmony_ci 13962306a36Sopenharmony_civoid msm_devfreq_init(struct msm_gpu *gpu) 14062306a36Sopenharmony_ci{ 14162306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 14262306a36Sopenharmony_ci struct msm_drm_private *priv = gpu->dev->dev_private; 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_ci /* We need target support to do devfreq */ 14562306a36Sopenharmony_ci if (!gpu->funcs->gpu_busy) 14662306a36Sopenharmony_ci return; 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_ci /* 14962306a36Sopenharmony_ci * Setup default values for simple_ondemand governor tuning. We 15062306a36Sopenharmony_ci * want to throttle up at 50% load for the double-buffer case, 15162306a36Sopenharmony_ci * where due to stalling waiting for vblank we could get stuck 15262306a36Sopenharmony_ci * at (for ex) 30fps at 50% utilization. 15362306a36Sopenharmony_ci */ 15462306a36Sopenharmony_ci priv->gpu_devfreq_config.upthreshold = 50; 15562306a36Sopenharmony_ci priv->gpu_devfreq_config.downdifferential = 10; 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci mutex_init(&df->lock); 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_ci dev_pm_qos_add_request(&gpu->pdev->dev, &df->boost_freq, 16062306a36Sopenharmony_ci DEV_PM_QOS_MIN_FREQUENCY, 0); 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci msm_devfreq_profile.initial_freq = gpu->fast_rate; 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_ci /* 16562306a36Sopenharmony_ci * Don't set the freq_table or max_state and let devfreq build the table 16662306a36Sopenharmony_ci * from OPP 16762306a36Sopenharmony_ci * After a deferred probe, these may have be left to non-zero values, 16862306a36Sopenharmony_ci * so set them back to zero before creating the devfreq device 16962306a36Sopenharmony_ci */ 17062306a36Sopenharmony_ci msm_devfreq_profile.freq_table = NULL; 17162306a36Sopenharmony_ci msm_devfreq_profile.max_state = 0; 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_ci df->devfreq = devm_devfreq_add_device(&gpu->pdev->dev, 17462306a36Sopenharmony_ci &msm_devfreq_profile, DEVFREQ_GOV_SIMPLE_ONDEMAND, 17562306a36Sopenharmony_ci &priv->gpu_devfreq_config); 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci if (IS_ERR(df->devfreq)) { 17862306a36Sopenharmony_ci DRM_DEV_ERROR(&gpu->pdev->dev, "Couldn't initialize GPU devfreq\n"); 17962306a36Sopenharmony_ci dev_pm_qos_remove_request(&df->boost_freq); 18062306a36Sopenharmony_ci df->devfreq = NULL; 18162306a36Sopenharmony_ci return; 18262306a36Sopenharmony_ci } 18362306a36Sopenharmony_ci 18462306a36Sopenharmony_ci devfreq_suspend_device(df->devfreq); 18562306a36Sopenharmony_ci 18662306a36Sopenharmony_ci gpu->cooling = of_devfreq_cooling_register(gpu->pdev->dev.of_node, df->devfreq); 18762306a36Sopenharmony_ci if (IS_ERR(gpu->cooling)) { 18862306a36Sopenharmony_ci DRM_DEV_ERROR(&gpu->pdev->dev, 18962306a36Sopenharmony_ci "Couldn't register GPU cooling device\n"); 19062306a36Sopenharmony_ci gpu->cooling = NULL; 19162306a36Sopenharmony_ci } 19262306a36Sopenharmony_ci 19362306a36Sopenharmony_ci msm_hrtimer_work_init(&df->boost_work, gpu->worker, msm_devfreq_boost_work, 19462306a36Sopenharmony_ci CLOCK_MONOTONIC, HRTIMER_MODE_REL); 19562306a36Sopenharmony_ci msm_hrtimer_work_init(&df->idle_work, gpu->worker, msm_devfreq_idle_work, 19662306a36Sopenharmony_ci CLOCK_MONOTONIC, HRTIMER_MODE_REL); 19762306a36Sopenharmony_ci} 19862306a36Sopenharmony_ci 19962306a36Sopenharmony_cistatic void cancel_idle_work(struct msm_gpu_devfreq *df) 20062306a36Sopenharmony_ci{ 20162306a36Sopenharmony_ci hrtimer_cancel(&df->idle_work.timer); 20262306a36Sopenharmony_ci kthread_cancel_work_sync(&df->idle_work.work); 20362306a36Sopenharmony_ci} 20462306a36Sopenharmony_ci 20562306a36Sopenharmony_cistatic void cancel_boost_work(struct msm_gpu_devfreq *df) 20662306a36Sopenharmony_ci{ 20762306a36Sopenharmony_ci hrtimer_cancel(&df->boost_work.timer); 20862306a36Sopenharmony_ci kthread_cancel_work_sync(&df->boost_work.work); 20962306a36Sopenharmony_ci} 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_civoid msm_devfreq_cleanup(struct msm_gpu *gpu) 21262306a36Sopenharmony_ci{ 21362306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ci if (!has_devfreq(gpu)) 21662306a36Sopenharmony_ci return; 21762306a36Sopenharmony_ci 21862306a36Sopenharmony_ci devfreq_cooling_unregister(gpu->cooling); 21962306a36Sopenharmony_ci dev_pm_qos_remove_request(&df->boost_freq); 22062306a36Sopenharmony_ci} 22162306a36Sopenharmony_ci 22262306a36Sopenharmony_civoid msm_devfreq_resume(struct msm_gpu *gpu) 22362306a36Sopenharmony_ci{ 22462306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 22562306a36Sopenharmony_ci unsigned long sample_rate; 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_ci if (!has_devfreq(gpu)) 22862306a36Sopenharmony_ci return; 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci mutex_lock(&df->lock); 23162306a36Sopenharmony_ci df->busy_cycles = gpu->funcs->gpu_busy(gpu, &sample_rate); 23262306a36Sopenharmony_ci df->time = ktime_get(); 23362306a36Sopenharmony_ci df->suspended = false; 23462306a36Sopenharmony_ci mutex_unlock(&df->lock); 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci devfreq_resume_device(df->devfreq); 23762306a36Sopenharmony_ci} 23862306a36Sopenharmony_ci 23962306a36Sopenharmony_civoid msm_devfreq_suspend(struct msm_gpu *gpu) 24062306a36Sopenharmony_ci{ 24162306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci if (!has_devfreq(gpu)) 24462306a36Sopenharmony_ci return; 24562306a36Sopenharmony_ci 24662306a36Sopenharmony_ci mutex_lock(&df->lock); 24762306a36Sopenharmony_ci df->suspended = true; 24862306a36Sopenharmony_ci mutex_unlock(&df->lock); 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_ci devfreq_suspend_device(df->devfreq); 25162306a36Sopenharmony_ci 25262306a36Sopenharmony_ci cancel_idle_work(df); 25362306a36Sopenharmony_ci cancel_boost_work(df); 25462306a36Sopenharmony_ci} 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_cistatic void msm_devfreq_boost_work(struct kthread_work *work) 25762306a36Sopenharmony_ci{ 25862306a36Sopenharmony_ci struct msm_gpu_devfreq *df = container_of(work, 25962306a36Sopenharmony_ci struct msm_gpu_devfreq, boost_work.work); 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci dev_pm_qos_update_request(&df->boost_freq, 0); 26262306a36Sopenharmony_ci} 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_civoid msm_devfreq_boost(struct msm_gpu *gpu, unsigned factor) 26562306a36Sopenharmony_ci{ 26662306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 26762306a36Sopenharmony_ci uint64_t freq; 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci if (!has_devfreq(gpu)) 27062306a36Sopenharmony_ci return; 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_ci freq = get_freq(gpu); 27362306a36Sopenharmony_ci freq *= factor; 27462306a36Sopenharmony_ci 27562306a36Sopenharmony_ci /* 27662306a36Sopenharmony_ci * A nice little trap is that PM QoS operates in terms of KHz, 27762306a36Sopenharmony_ci * while devfreq operates in terms of Hz: 27862306a36Sopenharmony_ci */ 27962306a36Sopenharmony_ci do_div(freq, HZ_PER_KHZ); 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_ci dev_pm_qos_update_request(&df->boost_freq, freq); 28262306a36Sopenharmony_ci 28362306a36Sopenharmony_ci msm_hrtimer_queue_work(&df->boost_work, 28462306a36Sopenharmony_ci ms_to_ktime(msm_devfreq_profile.polling_ms), 28562306a36Sopenharmony_ci HRTIMER_MODE_REL); 28662306a36Sopenharmony_ci} 28762306a36Sopenharmony_ci 28862306a36Sopenharmony_civoid msm_devfreq_active(struct msm_gpu *gpu) 28962306a36Sopenharmony_ci{ 29062306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 29162306a36Sopenharmony_ci unsigned int idle_time; 29262306a36Sopenharmony_ci unsigned long target_freq; 29362306a36Sopenharmony_ci 29462306a36Sopenharmony_ci if (!has_devfreq(gpu)) 29562306a36Sopenharmony_ci return; 29662306a36Sopenharmony_ci 29762306a36Sopenharmony_ci /* 29862306a36Sopenharmony_ci * Cancel any pending transition to idle frequency: 29962306a36Sopenharmony_ci */ 30062306a36Sopenharmony_ci cancel_idle_work(df); 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_ci /* 30362306a36Sopenharmony_ci * Hold devfreq lock to synchronize with get_dev_status()/ 30462306a36Sopenharmony_ci * target() callbacks 30562306a36Sopenharmony_ci */ 30662306a36Sopenharmony_ci mutex_lock(&df->devfreq->lock); 30762306a36Sopenharmony_ci 30862306a36Sopenharmony_ci target_freq = df->idle_freq; 30962306a36Sopenharmony_ci 31062306a36Sopenharmony_ci idle_time = ktime_to_ms(ktime_sub(ktime_get(), df->idle_time)); 31162306a36Sopenharmony_ci 31262306a36Sopenharmony_ci df->idle_freq = 0; 31362306a36Sopenharmony_ci 31462306a36Sopenharmony_ci /* 31562306a36Sopenharmony_ci * We could have become active again before the idle work had a 31662306a36Sopenharmony_ci * chance to run, in which case the df->idle_freq would have 31762306a36Sopenharmony_ci * still been zero. In this case, no need to change freq. 31862306a36Sopenharmony_ci */ 31962306a36Sopenharmony_ci if (target_freq) 32062306a36Sopenharmony_ci msm_devfreq_target(&gpu->pdev->dev, &target_freq, 0); 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci mutex_unlock(&df->devfreq->lock); 32362306a36Sopenharmony_ci 32462306a36Sopenharmony_ci /* 32562306a36Sopenharmony_ci * If we've been idle for a significant fraction of a polling 32662306a36Sopenharmony_ci * interval, then we won't meet the threshold of busyness for 32762306a36Sopenharmony_ci * the governor to ramp up the freq.. so give some boost 32862306a36Sopenharmony_ci */ 32962306a36Sopenharmony_ci if (idle_time > msm_devfreq_profile.polling_ms) { 33062306a36Sopenharmony_ci msm_devfreq_boost(gpu, 2); 33162306a36Sopenharmony_ci } 33262306a36Sopenharmony_ci} 33362306a36Sopenharmony_ci 33462306a36Sopenharmony_ci 33562306a36Sopenharmony_cistatic void msm_devfreq_idle_work(struct kthread_work *work) 33662306a36Sopenharmony_ci{ 33762306a36Sopenharmony_ci struct msm_gpu_devfreq *df = container_of(work, 33862306a36Sopenharmony_ci struct msm_gpu_devfreq, idle_work.work); 33962306a36Sopenharmony_ci struct msm_gpu *gpu = container_of(df, struct msm_gpu, devfreq); 34062306a36Sopenharmony_ci struct msm_drm_private *priv = gpu->dev->dev_private; 34162306a36Sopenharmony_ci unsigned long idle_freq, target_freq = 0; 34262306a36Sopenharmony_ci 34362306a36Sopenharmony_ci /* 34462306a36Sopenharmony_ci * Hold devfreq lock to synchronize with get_dev_status()/ 34562306a36Sopenharmony_ci * target() callbacks 34662306a36Sopenharmony_ci */ 34762306a36Sopenharmony_ci mutex_lock(&df->devfreq->lock); 34862306a36Sopenharmony_ci 34962306a36Sopenharmony_ci idle_freq = get_freq(gpu); 35062306a36Sopenharmony_ci 35162306a36Sopenharmony_ci if (priv->gpu_clamp_to_idle) 35262306a36Sopenharmony_ci msm_devfreq_target(&gpu->pdev->dev, &target_freq, 0); 35362306a36Sopenharmony_ci 35462306a36Sopenharmony_ci df->idle_time = ktime_get(); 35562306a36Sopenharmony_ci df->idle_freq = idle_freq; 35662306a36Sopenharmony_ci 35762306a36Sopenharmony_ci mutex_unlock(&df->devfreq->lock); 35862306a36Sopenharmony_ci} 35962306a36Sopenharmony_ci 36062306a36Sopenharmony_civoid msm_devfreq_idle(struct msm_gpu *gpu) 36162306a36Sopenharmony_ci{ 36262306a36Sopenharmony_ci struct msm_gpu_devfreq *df = &gpu->devfreq; 36362306a36Sopenharmony_ci 36462306a36Sopenharmony_ci if (!has_devfreq(gpu)) 36562306a36Sopenharmony_ci return; 36662306a36Sopenharmony_ci 36762306a36Sopenharmony_ci msm_hrtimer_queue_work(&df->idle_work, ms_to_ktime(1), 36862306a36Sopenharmony_ci HRTIMER_MODE_REL); 36962306a36Sopenharmony_ci} 370