intel_gt_pm.c (9799B)
1// SPDX-License-Identifier: MIT 2/* 3 * Copyright © 2019 Intel Corporation 4 */ 5 6#include <linux/string_helpers.h> 7#include <linux/suspend.h> 8 9#include "i915_drv.h" 10#include "i915_params.h" 11#include "intel_context.h" 12#include "intel_engine_pm.h" 13#include "intel_gt.h" 14#include "intel_gt_clock_utils.h" 15#include "intel_gt_pm.h" 16#include "intel_gt_requests.h" 17#include "intel_llc.h" 18#include "intel_pm.h" 19#include "intel_rc6.h" 20#include "intel_rps.h" 21#include "intel_wakeref.h" 22#include "pxp/intel_pxp_pm.h" 23 24#define I915_GT_SUSPEND_IDLE_TIMEOUT (HZ / 2) 25 26static void user_forcewake(struct intel_gt *gt, bool suspend) 27{ 28 int count = atomic_read(>->user_wakeref); 29 30 /* Inside suspend/resume so single threaded, no races to worry about. */ 31 if (likely(!count)) 32 return; 33 34 intel_gt_pm_get(gt); 35 if (suspend) { 36 GEM_BUG_ON(count > atomic_read(>->wakeref.count)); 37 atomic_sub(count, >->wakeref.count); 38 } else { 39 atomic_add(count, >->wakeref.count); 40 } 41 intel_gt_pm_put(gt); 42} 43 44static void runtime_begin(struct intel_gt *gt) 45{ 46 local_irq_disable(); 47 write_seqcount_begin(>->stats.lock); 48 gt->stats.start = ktime_get(); 49 gt->stats.active = true; 50 write_seqcount_end(>->stats.lock); 51 local_irq_enable(); 52} 53 54static void runtime_end(struct intel_gt *gt) 55{ 56 local_irq_disable(); 57 write_seqcount_begin(>->stats.lock); 58 gt->stats.active = false; 59 gt->stats.total = 60 ktime_add(gt->stats.total, 61 ktime_sub(ktime_get(), gt->stats.start)); 62 write_seqcount_end(>->stats.lock); 63 local_irq_enable(); 64} 65 66static int __gt_unpark(struct intel_wakeref *wf) 67{ 68 struct intel_gt *gt = container_of(wf, typeof(*gt), wakeref); 69 struct drm_i915_private *i915 = gt->i915; 70 71 GT_TRACE(gt, "\n"); 72 73 /* 74 * It seems that the DMC likes to transition between the DC states a lot 75 * when there are no connected displays (no active power domains) during 76 * command submission. 77 * 78 * This activity has negative impact on the performance of the chip with 79 * huge latencies observed in the interrupt handler and elsewhere. 80 * 81 * Work around it by grabbing a GT IRQ power domain whilst there is any 82 * GT activity, preventing any DC state transitions. 83 */ 84 gt->awake = intel_display_power_get(i915, POWER_DOMAIN_GT_IRQ); 85 GEM_BUG_ON(!gt->awake); 86 87 intel_rc6_unpark(>->rc6); 88 intel_rps_unpark(>->rps); 89 i915_pmu_gt_unparked(i915); 90 intel_guc_busyness_unpark(gt); 91 92 intel_gt_unpark_requests(gt); 93 runtime_begin(gt); 94 95 return 0; 96} 97 98static int __gt_park(struct intel_wakeref *wf) 99{ 100 struct intel_gt *gt = container_of(wf, typeof(*gt), wakeref); 101 intel_wakeref_t wakeref = fetch_and_zero(>->awake); 102 struct drm_i915_private *i915 = gt->i915; 103 104 GT_TRACE(gt, "\n"); 105 106 runtime_end(gt); 107 intel_gt_park_requests(gt); 108 109 intel_guc_busyness_park(gt); 110 i915_vma_parked(gt); 111 i915_pmu_gt_parked(i915); 112 intel_rps_park(>->rps); 113 intel_rc6_park(>->rc6); 114 115 /* Everything switched off, flush any residual interrupt just in case */ 116 intel_synchronize_irq(i915); 117 118 /* Defer dropping the display power well for 100ms, it's slow! */ 119 GEM_BUG_ON(!wakeref); 120 intel_display_power_put_async(i915, POWER_DOMAIN_GT_IRQ, wakeref); 121 122 return 0; 123} 124 125static const struct intel_wakeref_ops wf_ops = { 126 .get = __gt_unpark, 127 .put = __gt_park, 128}; 129 130void intel_gt_pm_init_early(struct intel_gt *gt) 131{ 132 /* 133 * We access the runtime_pm structure via gt->i915 here rather than 134 * gt->uncore as we do elsewhere in the file because gt->uncore is not 135 * yet initialized for all tiles at this point in the driver startup. 136 * runtime_pm is per-device rather than per-tile, so this is still the 137 * correct structure. 138 */ 139 intel_wakeref_init(>->wakeref, >->i915->runtime_pm, &wf_ops); 140 seqcount_mutex_init(>->stats.lock, >->wakeref.mutex); 141} 142 143void intel_gt_pm_init(struct intel_gt *gt) 144{ 145 /* 146 * Enabling power-management should be "self-healing". If we cannot 147 * enable a feature, simply leave it disabled with a notice to the 148 * user. 149 */ 150 intel_rc6_init(>->rc6); 151 intel_rps_init(>->rps); 152} 153 154static bool reset_engines(struct intel_gt *gt) 155{ 156 if (INTEL_INFO(gt->i915)->gpu_reset_clobbers_display) 157 return false; 158 159 return __intel_gt_reset(gt, ALL_ENGINES) == 0; 160} 161 162static void gt_sanitize(struct intel_gt *gt, bool force) 163{ 164 struct intel_engine_cs *engine; 165 enum intel_engine_id id; 166 intel_wakeref_t wakeref; 167 168 GT_TRACE(gt, "force:%s", str_yes_no(force)); 169 170 /* Use a raw wakeref to avoid calling intel_display_power_get early */ 171 wakeref = intel_runtime_pm_get(gt->uncore->rpm); 172 intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL); 173 174 intel_gt_check_clock_frequency(gt); 175 176 /* 177 * As we have just resumed the machine and woken the device up from 178 * deep PCI sleep (presumably D3_cold), assume the HW has been reset 179 * back to defaults, recovering from whatever wedged state we left it 180 * in and so worth trying to use the device once more. 181 */ 182 if (intel_gt_is_wedged(gt)) 183 intel_gt_unset_wedged(gt); 184 185 /* For GuC mode, ensure submission is disabled before stopping ring */ 186 intel_uc_reset_prepare(>->uc); 187 188 for_each_engine(engine, gt, id) { 189 if (engine->reset.prepare) 190 engine->reset.prepare(engine); 191 192 if (engine->sanitize) 193 engine->sanitize(engine); 194 } 195 196 if (reset_engines(gt) || force) { 197 for_each_engine(engine, gt, id) 198 __intel_engine_reset(engine, false); 199 } 200 201 intel_uc_reset(>->uc, false); 202 203 for_each_engine(engine, gt, id) 204 if (engine->reset.finish) 205 engine->reset.finish(engine); 206 207 intel_rps_sanitize(>->rps); 208 209 intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL); 210 intel_runtime_pm_put(gt->uncore->rpm, wakeref); 211} 212 213void intel_gt_pm_fini(struct intel_gt *gt) 214{ 215 intel_rc6_fini(>->rc6); 216} 217 218int intel_gt_resume(struct intel_gt *gt) 219{ 220 struct intel_engine_cs *engine; 221 enum intel_engine_id id; 222 int err; 223 224 err = intel_gt_has_unrecoverable_error(gt); 225 if (err) 226 return err; 227 228 GT_TRACE(gt, "\n"); 229 230 /* 231 * After resume, we may need to poke into the pinned kernel 232 * contexts to paper over any damage caused by the sudden suspend. 233 * Only the kernel contexts should remain pinned over suspend, 234 * allowing us to fixup the user contexts on their first pin. 235 */ 236 gt_sanitize(gt, true); 237 238 intel_gt_pm_get(gt); 239 240 intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL); 241 intel_rc6_sanitize(>->rc6); 242 if (intel_gt_is_wedged(gt)) { 243 err = -EIO; 244 goto out_fw; 245 } 246 247 /* Only when the HW is re-initialised, can we replay the requests */ 248 err = intel_gt_init_hw(gt); 249 if (err) { 250 i915_probe_error(gt->i915, 251 "Failed to initialize GPU, declaring it wedged!\n"); 252 goto err_wedged; 253 } 254 255 intel_uc_reset_finish(>->uc); 256 257 intel_rps_enable(>->rps); 258 intel_llc_enable(>->llc); 259 260 for_each_engine(engine, gt, id) { 261 intel_engine_pm_get(engine); 262 263 engine->serial++; /* kernel context lost */ 264 err = intel_engine_resume(engine); 265 266 intel_engine_pm_put(engine); 267 if (err) { 268 drm_err(>->i915->drm, 269 "Failed to restart %s (%d)\n", 270 engine->name, err); 271 goto err_wedged; 272 } 273 } 274 275 intel_rc6_enable(>->rc6); 276 277 intel_uc_resume(>->uc); 278 279 intel_pxp_resume(>->pxp); 280 281 user_forcewake(gt, false); 282 283out_fw: 284 intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL); 285 intel_gt_pm_put(gt); 286 return err; 287 288err_wedged: 289 intel_gt_set_wedged(gt); 290 goto out_fw; 291} 292 293static void wait_for_suspend(struct intel_gt *gt) 294{ 295 if (!intel_gt_pm_is_awake(gt)) 296 return; 297 298 if (intel_gt_wait_for_idle(gt, I915_GT_SUSPEND_IDLE_TIMEOUT) == -ETIME) { 299 /* 300 * Forcibly cancel outstanding work and leave 301 * the gpu quiet. 302 */ 303 intel_gt_set_wedged(gt); 304 intel_gt_retire_requests(gt); 305 } 306 307 intel_gt_pm_wait_for_idle(gt); 308} 309 310void intel_gt_suspend_prepare(struct intel_gt *gt) 311{ 312 user_forcewake(gt, true); 313 wait_for_suspend(gt); 314 315 intel_pxp_suspend_prepare(>->pxp); 316} 317 318static suspend_state_t pm_suspend_target(void) 319{ 320#if IS_ENABLED(CONFIG_SUSPEND) && IS_ENABLED(CONFIG_PM_SLEEP) 321 return pm_suspend_target_state; 322#else 323 return PM_SUSPEND_TO_IDLE; 324#endif 325} 326 327void intel_gt_suspend_late(struct intel_gt *gt) 328{ 329 intel_wakeref_t wakeref; 330 331 /* We expect to be idle already; but also want to be independent */ 332 wait_for_suspend(gt); 333 334 if (is_mock_gt(gt)) 335 return; 336 337 GEM_BUG_ON(gt->awake); 338 339 intel_uc_suspend(>->uc); 340 intel_pxp_suspend(>->pxp); 341 342 /* 343 * On disabling the device, we want to turn off HW access to memory 344 * that we no longer own. 345 * 346 * However, not all suspend-states disable the device. S0 (s2idle) 347 * is effectively runtime-suspend, the device is left powered on 348 * but needs to be put into a low power state. We need to keep 349 * powermanagement enabled, but we also retain system state and so 350 * it remains safe to keep on using our allocated memory. 351 */ 352 if (pm_suspend_target() == PM_SUSPEND_TO_IDLE) 353 return; 354 355 with_intel_runtime_pm(gt->uncore->rpm, wakeref) { 356 intel_rps_disable(>->rps); 357 intel_rc6_disable(>->rc6); 358 intel_llc_disable(>->llc); 359 } 360 361 gt_sanitize(gt, false); 362 363 GT_TRACE(gt, "\n"); 364} 365 366void intel_gt_runtime_suspend(struct intel_gt *gt) 367{ 368 intel_pxp_runtime_suspend(>->pxp); 369 intel_uc_runtime_suspend(>->uc); 370 371 GT_TRACE(gt, "\n"); 372} 373 374int intel_gt_runtime_resume(struct intel_gt *gt) 375{ 376 int ret; 377 378 GT_TRACE(gt, "\n"); 379 intel_gt_init_swizzling(gt); 380 intel_ggtt_restore_fences(gt->ggtt); 381 382 ret = intel_uc_runtime_resume(>->uc); 383 if (ret) 384 return ret; 385 386 intel_pxp_runtime_resume(>->pxp); 387 388 return 0; 389} 390 391static ktime_t __intel_gt_get_awake_time(const struct intel_gt *gt) 392{ 393 ktime_t total = gt->stats.total; 394 395 if (gt->stats.active) 396 total = ktime_add(total, 397 ktime_sub(ktime_get(), gt->stats.start)); 398 399 return total; 400} 401 402ktime_t intel_gt_get_awake_time(const struct intel_gt *gt) 403{ 404 unsigned int seq; 405 ktime_t total; 406 407 do { 408 seq = read_seqcount_begin(>->stats.lock); 409 total = __intel_gt_get_awake_time(gt); 410 } while (read_seqcount_retry(>->stats.lock, seq)); 411 412 return total; 413} 414 415#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST) 416#include "selftest_gt_pm.c" 417#endif