/* * SPDX-License-Identifier: MIT * * Copyright © 2019 Intel Corporation */ #include "gem/i915_gem_pm.h" #include "gem/i915_gem_ttm_pm.h" #include "gt/intel_gt.h" #include "gt/intel_gt_pm.h" #include "gt/intel_gt_requests.h" #include "i915_driver.h" #include "i915_drv.h" #if IS_ENABLED(CONFIG_X86) #include #else #define wbinvd_on_all_cpus() \ pr_warn(DRIVER_NAME ": Missing cache flush in %s\n", __func__) #endif void i915_gem_suspend(struct drm_i915_private *i915) { struct intel_gt *gt; unsigned int i; GEM_TRACE("%s\n", dev_name(i915->drm.dev)); intel_wakeref_auto(&i915->runtime_pm.userfault_wakeref, 0); /* * On rare occasions, we've observed the fence completion triggers * free_engines asynchronously via rcu_call. Ensure those are done. * This path is only called on suspend, so it's an acceptable cost. */ rcu_barrier(); flush_workqueue(i915->wq); /* * We have to flush all the executing contexts to main memory so * that they can saved in the hibernation image. To ensure the last * context image is coherent, we have to switch away from it. That * leaves the i915->kernel_context still active when * we actually suspend, and its image in memory may not match the GPU * state. Fortunately, the kernel_context is disposable and we do * not rely on its state. */ for_each_gt(gt, i915, i) intel_gt_suspend_prepare(gt); i915_gem_drain_freed_objects(i915); } static int lmem_restore(struct drm_i915_private *i915, u32 flags) { struct intel_memory_region *mr; int ret = 0, id; for_each_memory_region(mr, i915, id) { if (mr->type == INTEL_MEMORY_LOCAL) { ret = i915_ttm_restore_region(mr, flags); if (ret) break; } } return ret; } static int lmem_suspend(struct drm_i915_private *i915, u32 flags) { struct intel_memory_region *mr; int ret = 0, id; for_each_memory_region(mr, i915, id) { if (mr->type == INTEL_MEMORY_LOCAL) { ret = i915_ttm_backup_region(mr, flags); if (ret) break; } } return ret; } static void lmem_recover(struct drm_i915_private *i915) { struct intel_memory_region *mr; int id; for_each_memory_region(mr, i915, id) if (mr->type == INTEL_MEMORY_LOCAL) i915_ttm_recover_region(mr); } int i915_gem_backup_suspend(struct drm_i915_private *i915) { int ret; /* Opportunistically try to evict unpinned objects */ ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU); if (ret) goto out_recover; i915_gem_suspend(i915); /* * More objects may have become unpinned as requests were * retired. Now try to evict again. The gt may be wedged here * in which case we automatically fall back to memcpy. * We allow also backing up pinned objects that have not been * marked for early recover, and that may contain, for example, * page-tables for the migrate context. */ ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU | I915_TTM_BACKUP_PINNED); if (ret) goto out_recover; /* * Remaining objects are backed up using memcpy once we've stopped * using the migrate context. */ ret = lmem_suspend(i915, I915_TTM_BACKUP_PINNED); if (ret) goto out_recover; return 0; out_recover: lmem_recover(i915); return ret; } void i915_gem_suspend_late(struct drm_i915_private *i915) { struct drm_i915_gem_object *obj; struct list_head *phases[] = { &i915->mm.shrink_list, &i915->mm.purge_list, NULL }, **phase; struct intel_gt *gt; unsigned long flags; unsigned int i; bool flush = false; /* * Neither the BIOS, ourselves or any other kernel * expects the system to be in execlists mode on startup, * so we need to reset the GPU back to legacy mode. And the only * known way to disable logical contexts is through a GPU reset. * * So in order to leave the system in a known default configuration, * always reset the GPU upon unload and suspend. Afterwards we then * clean up the GEM state tracking, flushing off the requests and * leaving the system in a known idle state. * * Note that is of the upmost importance that the GPU is idle and * all stray writes are flushed *before* we dismantle the backing * storage for the pinned objects. * * However, since we are uncertain that resetting the GPU on older * machines is a good idea, we don't - just in case it leaves the * machine in an unusable condition. */ /* Like i915_gem_suspend, flush tasks staged from fence triggers */ rcu_barrier(); for_each_gt(gt, i915, i) intel_gt_suspend_late(gt); spin_lock_irqsave(&i915->mm.obj_lock, flags); for (phase = phases; *phase; phase++) { list_for_each_entry(obj, *phase, mm.link) { if (!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ)) flush |= (obj->read_domains & I915_GEM_DOMAIN_CPU) == 0; __start_cpu_write(obj); /* presume auto-hibernate */ } } spin_unlock_irqrestore(&i915->mm.obj_lock, flags); if (flush) wbinvd_on_all_cpus(); } int i915_gem_freeze(struct drm_i915_private *i915) { /* Discard all purgeable objects, let userspace recover those as * required after resuming. */ i915_gem_shrink_all(i915); return 0; } int i915_gem_freeze_late(struct drm_i915_private *i915) { struct drm_i915_gem_object *obj; intel_wakeref_t wakeref; /* * Called just before we write the hibernation image. * * We need to update the domain tracking to reflect that the CPU * will be accessing all the pages to create and restore from the * hibernation, and so upon restoration those pages will be in the * CPU domain. * * To make sure the hibernation image contains the latest state, * we update that state just before writing out the image. * * To try and reduce the hibernation image, we manually shrink * the objects as well, see i915_gem_freeze() */ with_intel_runtime_pm(&i915->runtime_pm, wakeref) i915_gem_shrink(NULL, i915, -1UL, NULL, ~0); i915_gem_drain_freed_objects(i915); wbinvd_on_all_cpus(); list_for_each_entry(obj, &i915->mm.shrink_list, mm.link) __start_cpu_write(obj); return 0; } void i915_gem_resume(struct drm_i915_private *i915) { struct intel_gt *gt; int ret, i, j; GEM_TRACE("%s\n", dev_name(i915->drm.dev)); ret = lmem_restore(i915, 0); GEM_WARN_ON(ret); /* * As we didn't flush the kernel context before suspend, we cannot * guarantee that the context image is complete. So let's just reset * it and start again. */ for_each_gt(gt, i915, i) if (intel_gt_resume(gt)) goto err_wedged; ret = lmem_restore(i915, I915_TTM_BACKUP_ALLOW_GPU); GEM_WARN_ON(ret); return; err_wedged: for_each_gt(gt, i915, j) { if (!intel_gt_is_wedged(gt)) { dev_err(i915->drm.dev, "Failed to re-initialize GPU[%u], declaring it wedged!\n", j); intel_gt_set_wedged(gt); } if (j == i) break; } }