drivers/gpu/drm/i915/gem/i915_gem_pm.c - linux - Git at Google

 /*
  * SPDX-License-Identifier: MIT
  *
  * Copyright © 2019 Intel Corporation
  */

 #include "gem/i915_gem_pm.h"
 #include "gem/i915_gem_ttm_pm.h"
 #include "gt/intel_gt.h"
 #include "gt/intel_gt_pm.h"
 #include "gt/intel_gt_requests.h"

 #include "i915_driver.h"
 #include "i915_drv.h"

 #if defined(CONFIG_X86)
 #include <asm/smp.h>
 #else
 #define wbinvd_on_all_cpus() \
 	pr_warn(DRIVER_NAME ": Missing cache flush in %s\n", __func__)
 #endif

 void i915_gem_suspend(struct drm_i915_private *i915)
 {
 	struct intel_gt *gt;
 	unsigned int i;

 	GEM_TRACE("%s\n", dev_name(i915->drm.dev));

 	intel_wakeref_auto(&i915->runtime_pm.userfault_wakeref, 0);
 	/*
 	 * On rare occasions, we've observed the fence completion triggers
 	 * free_engines asynchronously via rcu_call. Ensure those are done.
 	 * This path is only called on suspend, so it's an acceptable cost.
 	 */
 	rcu_barrier();

 	flush_workqueue(i915->wq);

 	/*
 	 * We have to flush all the executing contexts to main memory so
 	 * that they can saved in the hibernation image. To ensure the last
 	 * context image is coherent, we have to switch away from it. That
 	 * leaves the i915->kernel_context still active when
 	 * we actually suspend, and its image in memory may not match the GPU
 	 * state. Fortunately, the kernel_context is disposable and we do
 	 * not rely on its state.
 	 */
 	for_each_gt(gt, i915, i)
 		intel_gt_suspend_prepare(gt);

 	i915_gem_drain_freed_objects(i915);
 }

 static int lmem_restore(struct drm_i915_private *i915, u32 flags)
 {
 	struct intel_memory_region *mr;
 	int ret = 0, id;

 	for_each_memory_region(mr, i915, id) {
 		if (mr->type == INTEL_MEMORY_LOCAL) {
 			ret = i915_ttm_restore_region(mr, flags);
 			if (ret)
 				break;
 		}
 	}

 	return ret;
 }

 static int lmem_suspend(struct drm_i915_private *i915, u32 flags)
 {
 	struct intel_memory_region *mr;
 	int ret = 0, id;

 	for_each_memory_region(mr, i915, id) {
 		if (mr->type == INTEL_MEMORY_LOCAL) {
 			ret = i915_ttm_backup_region(mr, flags);
 			if (ret)
 				break;
 		}
 	}

 	return ret;
 }

 static void lmem_recover(struct drm_i915_private *i915)
 {
 	struct intel_memory_region *mr;
 	int id;

 	for_each_memory_region(mr, i915, id)
 		if (mr->type == INTEL_MEMORY_LOCAL)
 			i915_ttm_recover_region(mr);
 }

 int i915_gem_backup_suspend(struct drm_i915_private *i915)
 {
 	int ret;

 	/* Opportunistically try to evict unpinned objects */
 	ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU);
 	if (ret)
 		goto out_recover;

 	i915_gem_suspend(i915);

 	/*
 	 * More objects may have become unpinned as requests were
 	 * retired. Now try to evict again. The gt may be wedged here
 	 * in which case we automatically fall back to memcpy.
 	 * We allow also backing up pinned objects that have not been
 	 * marked for early recover, and that may contain, for example,
 	 * page-tables for the migrate context.
 	 */
 	ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU |
 			   I915_TTM_BACKUP_PINNED);
 	if (ret)
 		goto out_recover;

 	/*
 	 * Remaining objects are backed up using memcpy once we've stopped
 	 * using the migrate context.
 	 */
 	ret = lmem_suspend(i915, I915_TTM_BACKUP_PINNED);
 	if (ret)
 		goto out_recover;

 	return 0;

 out_recover:
 	lmem_recover(i915);

 	return ret;
 }

 void i915_gem_suspend_late(struct drm_i915_private *i915)
 {
 	struct drm_i915_gem_object *obj;
 	struct list_head *phases[] = {
 		&i915->mm.shrink_list,
 		&i915->mm.purge_list,
 		NULL
 	}, **phase;
 	struct intel_gt *gt;
 	unsigned long flags;
 	unsigned int i;
 	bool flush = false;

 	/*
 	 * Neither the BIOS, ourselves or any other kernel
 	 * expects the system to be in execlists mode on startup,
 	 * so we need to reset the GPU back to legacy mode. And the only
 	 * known way to disable logical contexts is through a GPU reset.
 	 *
 	 * So in order to leave the system in a known default configuration,
 	 * always reset the GPU upon unload and suspend. Afterwards we then
 	 * clean up the GEM state tracking, flushing off the requests and
 	 * leaving the system in a known idle state.
 	 *
 	 * Note that is of the upmost importance that the GPU is idle and
 	 * all stray writes are flushed *before* we dismantle the backing
 	 * storage for the pinned objects.
 	 *
 	 * However, since we are uncertain that resetting the GPU on older
 	 * machines is a good idea, we don't - just in case it leaves the
 	 * machine in an unusable condition.
 	 */

 	/* Like i915_gem_suspend, flush tasks staged from fence triggers */
 	rcu_barrier();

 	for_each_gt(gt, i915, i)
 		intel_gt_suspend_late(gt);

 	spin_lock_irqsave(&i915->mm.obj_lock, flags);
 	for (phase = phases; *phase; phase++) {
 		list_for_each_entry(obj, *phase, mm.link) {
 			if (!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ))
 				flush |= (obj->read_domains & I915_GEM_DOMAIN_CPU) == 0;
 			__start_cpu_write(obj); /* presume auto-hibernate */
 		}
 	}
 	spin_unlock_irqrestore(&i915->mm.obj_lock, flags);
 	if (flush)
 		wbinvd_on_all_cpus();
 }

 int i915_gem_freeze(struct drm_i915_private *i915)
 {
 	/* Discard all purgeable objects, let userspace recover those as
 	 * required after resuming.
 	 */
 	i915_gem_shrink_all(i915);

 	return 0;
 }

 int i915_gem_freeze_late(struct drm_i915_private *i915)
 {
 	struct drm_i915_gem_object *obj;
 	intel_wakeref_t wakeref;

 	/*
 	 * Called just before we write the hibernation image.
 	 *
 	 * We need to update the domain tracking to reflect that the CPU
 	 * will be accessing all the pages to create and restore from the
 	 * hibernation, and so upon restoration those pages will be in the
 	 * CPU domain.
 	 *
 	 * To make sure the hibernation image contains the latest state,
 	 * we update that state just before writing out the image.
 	 *
 	 * To try and reduce the hibernation image, we manually shrink
 	 * the objects as well, see i915_gem_freeze()
 	 */

 	with_intel_runtime_pm(&i915->runtime_pm, wakeref)
 		i915_gem_shrink(NULL, i915, -1UL, NULL, ~0);
 	i915_gem_drain_freed_objects(i915);

 	wbinvd_on_all_cpus();
 	list_for_each_entry(obj, &i915->mm.shrink_list, mm.link)
 		__start_cpu_write(obj);

 	return 0;
 }

 void i915_gem_resume(struct drm_i915_private *i915)
 {
 	struct intel_gt *gt;
 	int ret, i, j;

 	GEM_TRACE("%s\n", dev_name(i915->drm.dev));

 	ret = lmem_restore(i915, 0);
 	GEM_WARN_ON(ret);

 	/*
 	 * As we didn't flush the kernel context before suspend, we cannot
 	 * guarantee that the context image is complete. So let's just reset
 	 * it and start again.
 	 */
 	for_each_gt(gt, i915, i)
 		if (intel_gt_resume(gt))
 			goto err_wedged;

 	ret = lmem_restore(i915, I915_TTM_BACKUP_ALLOW_GPU);
 	GEM_WARN_ON(ret);

 	return;

 err_wedged:
 	for_each_gt(gt, i915, j) {
 		if (!intel_gt_is_wedged(gt)) {
 			dev_err(i915->drm.dev,
 				"Failed to re-initialize GPU[%u], declaring it wedged!\n",
 				j);
 			intel_gt_set_wedged(gt);
 		}

 		if (j == i)
 			break;
 	}
 }
	/*
	* SPDX-License-Identifier: MIT
	*
	* Copyright © 2019 Intel Corporation
	*/

	#include "gem/i915_gem_pm.h"
	#include "gem/i915_gem_ttm_pm.h"
	#include "gt/intel_gt.h"
	#include "gt/intel_gt_pm.h"
	#include "gt/intel_gt_requests.h"

	#include "i915_driver.h"
	#include "i915_drv.h"

	#if defined(CONFIG_X86)
	#include <asm/smp.h>
	#else
	#define wbinvd_on_all_cpus() \
	pr_warn(DRIVER_NAME ": Missing cache flush in %s\n", __func__)
	#endif

	void i915_gem_suspend(struct drm_i915_private *i915)
	{
	struct intel_gt *gt;
	unsigned int i;

	GEM_TRACE("%s\n", dev_name(i915->drm.dev));

	intel_wakeref_auto(&i915->runtime_pm.userfault_wakeref, 0);
	/*
	* On rare occasions, we've observed the fence completion triggers
	* free_engines asynchronously via rcu_call. Ensure those are done.
	* This path is only called on suspend, so it's an acceptable cost.
	*/
	rcu_barrier();

	flush_workqueue(i915->wq);

	/*
	* We have to flush all the executing contexts to main memory so
	* that they can saved in the hibernation image. To ensure the last
	* context image is coherent, we have to switch away from it. That
	* leaves the i915->kernel_context still active when
	* we actually suspend, and its image in memory may not match the GPU
	* state. Fortunately, the kernel_context is disposable and we do
	* not rely on its state.
	*/
	for_each_gt(gt, i915, i)
	intel_gt_suspend_prepare(gt);

	i915_gem_drain_freed_objects(i915);
	}

	static int lmem_restore(struct drm_i915_private *i915, u32 flags)
	{
	struct intel_memory_region *mr;
	int ret = 0, id;

	for_each_memory_region(mr, i915, id) {
	if (mr->type == INTEL_MEMORY_LOCAL) {
	ret = i915_ttm_restore_region(mr, flags);
	if (ret)
	break;
	}
	}

	return ret;
	}

	static int lmem_suspend(struct drm_i915_private *i915, u32 flags)
	{
	struct intel_memory_region *mr;
	int ret = 0, id;

	for_each_memory_region(mr, i915, id) {
	if (mr->type == INTEL_MEMORY_LOCAL) {
	ret = i915_ttm_backup_region(mr, flags);
	if (ret)
	break;
	}
	}

	return ret;
	}

	static void lmem_recover(struct drm_i915_private *i915)
	{
	struct intel_memory_region *mr;
	int id;

	for_each_memory_region(mr, i915, id)
	if (mr->type == INTEL_MEMORY_LOCAL)
	i915_ttm_recover_region(mr);
	}

	int i915_gem_backup_suspend(struct drm_i915_private *i915)
	{
	int ret;

	/* Opportunistically try to evict unpinned objects */
	ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU);
	if (ret)
	goto out_recover;

	i915_gem_suspend(i915);

	/*
	* More objects may have become unpinned as requests were
	* retired. Now try to evict again. The gt may be wedged here
	* in which case we automatically fall back to memcpy.
	* We allow also backing up pinned objects that have not been
	* marked for early recover, and that may contain, for example,
	* page-tables for the migrate context.
	*/
	ret = lmem_suspend(i915, I915_TTM_BACKUP_ALLOW_GPU \|
	I915_TTM_BACKUP_PINNED);
	if (ret)
	goto out_recover;

	/*
	* Remaining objects are backed up using memcpy once we've stopped
	* using the migrate context.
	*/
	ret = lmem_suspend(i915, I915_TTM_BACKUP_PINNED);
	if (ret)
	goto out_recover;

	return 0;

	out_recover:
	lmem_recover(i915);

	return ret;
	}

	void i915_gem_suspend_late(struct drm_i915_private *i915)
	{
	struct drm_i915_gem_object *obj;
	struct list_head *phases[] = {
	&i915->mm.shrink_list,
	&i915->mm.purge_list,
	NULL
	}, **phase;
	struct intel_gt *gt;
	unsigned long flags;
	unsigned int i;
	bool flush = false;

	/*
	* Neither the BIOS, ourselves or any other kernel
	* expects the system to be in execlists mode on startup,
	* so we need to reset the GPU back to legacy mode. And the only
	* known way to disable logical contexts is through a GPU reset.
	*
	* So in order to leave the system in a known default configuration,
	* always reset the GPU upon unload and suspend. Afterwards we then
	* clean up the GEM state tracking, flushing off the requests and
	* leaving the system in a known idle state.
	*
	* Note that is of the upmost importance that the GPU is idle and
	* all stray writes are flushed before we dismantle the backing
	* storage for the pinned objects.
	*
	* However, since we are uncertain that resetting the GPU on older
	* machines is a good idea, we don't - just in case it leaves the
	* machine in an unusable condition.
	*/

	/* Like i915_gem_suspend, flush tasks staged from fence triggers */
	rcu_barrier();

	for_each_gt(gt, i915, i)
	intel_gt_suspend_late(gt);

	spin_lock_irqsave(&i915->mm.obj_lock, flags);
	for (phase = phases; *phase; phase++) {
	list_for_each_entry(obj, *phase, mm.link) {
	if (!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ))
	flush \|= (obj->read_domains & I915_GEM_DOMAIN_CPU) == 0;
	__start_cpu_write(obj); /* presume auto-hibernate */
	}
	}
	spin_unlock_irqrestore(&i915->mm.obj_lock, flags);
	if (flush)
	wbinvd_on_all_cpus();
	}

	int i915_gem_freeze(struct drm_i915_private *i915)
	{
	/* Discard all purgeable objects, let userspace recover those as
	* required after resuming.
	*/
	i915_gem_shrink_all(i915);

	return 0;
	}

	int i915_gem_freeze_late(struct drm_i915_private *i915)
	{
	struct drm_i915_gem_object *obj;
	intel_wakeref_t wakeref;

	/*
	* Called just before we write the hibernation image.
	*
	* We need to update the domain tracking to reflect that the CPU
	* will be accessing all the pages to create and restore from the
	* hibernation, and so upon restoration those pages will be in the
	* CPU domain.
	*
	* To make sure the hibernation image contains the latest state,
	* we update that state just before writing out the image.
	*
	* To try and reduce the hibernation image, we manually shrink
	* the objects as well, see i915_gem_freeze()
	*/

	with_intel_runtime_pm(&i915->runtime_pm, wakeref)
	i915_gem_shrink(NULL, i915, -1UL, NULL, ~0);
	i915_gem_drain_freed_objects(i915);

	wbinvd_on_all_cpus();
	list_for_each_entry(obj, &i915->mm.shrink_list, mm.link)
	__start_cpu_write(obj);

	return 0;
	}

	void i915_gem_resume(struct drm_i915_private *i915)
	{
	struct intel_gt *gt;
	int ret, i, j;

	GEM_TRACE("%s\n", dev_name(i915->drm.dev));

	ret = lmem_restore(i915, 0);
	GEM_WARN_ON(ret);

	/*
	* As we didn't flush the kernel context before suspend, we cannot
	* guarantee that the context image is complete. So let's just reset
	* it and start again.
	*/
	for_each_gt(gt, i915, i)
	if (intel_gt_resume(gt))
	goto err_wedged;

	ret = lmem_restore(i915, I915_TTM_BACKUP_ALLOW_GPU);
	GEM_WARN_ON(ret);

	return;

	err_wedged:
	for_each_gt(gt, i915, j) {
	if (!intel_gt_is_wedged(gt)) {
	dev_err(i915->drm.dev,
	"Failed to re-initialize GPU[%u], declaring it wedged!\n",
	j);
	intel_gt_set_wedged(gt);
	}

	if (j == i)
	break;
	}
	}