drivers/gpu/drm/msm/adreno/a5xx_gpu.h - linux - Git at Google

 /* SPDX-License-Identifier: GPL-2.0-only */
 /* Copyright (c) 2016-2017 The Linux Foundation. All rights reserved.
  */
 #ifndef __A5XX_GPU_H__
 #define __A5XX_GPU_H__

 #include "adreno_gpu.h"

 /* Bringing over the hack from the previous targets */
 #undef ROP_COPY
 #undef ROP_XOR

 #include "a5xx.xml.h"

 struct a5xx_gpu {
 	struct adreno_gpu base;

 	struct drm_gem_object *pm4_bo;
 	uint64_t pm4_iova;

 	struct drm_gem_object *pfp_bo;
 	uint64_t pfp_iova;

 	struct drm_gem_object *gpmu_bo;
 	uint64_t gpmu_iova;
 	uint32_t gpmu_dwords;

 	uint32_t lm_leakage;

 	struct msm_ringbuffer *cur_ring;
 	struct msm_ringbuffer *next_ring;

 	struct drm_gem_object *preempt_bo[MSM_GPU_MAX_RINGS];
 	struct drm_gem_object *preempt_counters_bo[MSM_GPU_MAX_RINGS];
 	struct a5xx_preempt_record *preempt[MSM_GPU_MAX_RINGS];
 	uint64_t preempt_iova[MSM_GPU_MAX_RINGS];
 	uint32_t last_seqno[MSM_GPU_MAX_RINGS];

 	atomic_t preempt_state;
 	spinlock_t preempt_start_lock;
 	struct timer_list preempt_timer;

 	struct drm_gem_object *shadow_bo;
 	uint64_t shadow_iova;
 	uint32_t *shadow;

 	/* True if the microcode supports the WHERE_AM_I opcode */
 	bool has_whereami;
 };

 #define to_a5xx_gpu(x) container_of(x, struct a5xx_gpu, base)

 #ifdef CONFIG_DEBUG_FS
 void a5xx_debugfs_init(struct msm_gpu *gpu, struct drm_minor *minor);
 #endif

 /*
  * In order to do lockless preemption we use a simple state machine to progress
  * through the process.
  *
  * PREEMPT_NONE - no preemption in progress.  Next state START.
  * PREEMPT_START - The trigger is evaulating if preemption is possible. Next
  * states: TRIGGERED, NONE
  * PREEMPT_ABORT - An intermediate state before moving back to NONE. Next
  * state: NONE.
  * PREEMPT_TRIGGERED: A preemption has been executed on the hardware. Next
  * states: FAULTED, PENDING
  * PREEMPT_FAULTED: A preemption timed out (never completed). This will trigger
  * recovery.  Next state: N/A
  * PREEMPT_PENDING: Preemption complete interrupt fired - the callback is
  * checking the success of the operation. Next state: FAULTED, NONE.
  */

 enum preempt_state {
 	PREEMPT_NONE = 0,
 	PREEMPT_START,
 	PREEMPT_ABORT,
 	PREEMPT_TRIGGERED,
 	PREEMPT_FAULTED,
 	PREEMPT_PENDING,
 };

 /*
  * struct a5xx_preempt_record is a shared buffer between the microcode and the
  * CPU to store the state for preemption. The record itself is much larger
  * (64k) but most of that is used by the CP for storage.
  *
  * There is a preemption record assigned per ringbuffer. When the CPU triggers a
  * preemption, it fills out the record with the useful information (wptr, ring
  * base, etc) and the microcode uses that information to set up the CP following
  * the preemption.  When a ring is switched out, the CP will save the ringbuffer
  * state back to the record. In this way, once the records are properly set up
  * the CPU can quickly switch back and forth between ringbuffers by only
  * updating a few registers (often only the wptr).
  *
  * These are the CPU aware registers in the record:
  * @magic: Must always be 0x27C4BAFC
  * @info: Type of the record - written 0 by the CPU, updated by the CP
  * @data: Data field from SET_RENDER_MODE or a checkpoint. Written and used by
  * the CP
  * @cntl: Value of RB_CNTL written by CPU, save/restored by CP
  * @rptr: Value of RB_RPTR written by CPU, save/restored by CP
  * @wptr: Value of RB_WPTR written by CPU, save/restored by CP
  * @rptr_addr: Value of RB_RPTR_ADDR written by CPU, save/restored by CP
  * @rbase: Value of RB_BASE written by CPU, save/restored by CP
  * @counter: GPU address of the storage area for the performance counters
  */
 struct a5xx_preempt_record {
 	uint32_t magic;
 	uint32_t info;
 	uint32_t data;
 	uint32_t cntl;
 	uint32_t rptr;
 	uint32_t wptr;
 	uint64_t rptr_addr;
 	uint64_t rbase;
 	uint64_t counter;
 };

 /* Magic identifier for the preemption record */
 #define A5XX_PREEMPT_RECORD_MAGIC 0x27C4BAFCUL

 /*
  * Even though the structure above is only a few bytes, we need a full 64k to
  * store the entire preemption record from the CP
  */
 #define A5XX_PREEMPT_RECORD_SIZE (64 * 1024)

 /*
  * The preemption counter block is a storage area for the value of the
  * preemption counters that are saved immediately before context switch. We
  * append it on to the end of the allocation for the preemption record.
  */
 #define A5XX_PREEMPT_COUNTER_SIZE (16 * 4)


 int a5xx_power_init(struct msm_gpu *gpu);
 void a5xx_gpmu_ucode_init(struct msm_gpu *gpu);

 static inline int spin_usecs(struct msm_gpu *gpu, uint32_t usecs,
 		uint32_t reg, uint32_t mask, uint32_t value)
 {
 	while (usecs--) {
 		udelay(1);
 		if ((gpu_read(gpu, reg) & mask) == value)
 			return 0;
 		cpu_relax();
 	}

 	return -ETIMEDOUT;
 }

 #define shadowptr(a5xx_gpu, ring) ((a5xx_gpu)->shadow_iova + \
 		((ring)->id * sizeof(uint32_t)))

 bool a5xx_idle(struct msm_gpu *gpu, struct msm_ringbuffer *ring);
 void a5xx_set_hwcg(struct msm_gpu *gpu, bool state);

 void a5xx_preempt_init(struct msm_gpu *gpu);
 void a5xx_preempt_hw_init(struct msm_gpu *gpu);
 void a5xx_preempt_trigger(struct msm_gpu *gpu);
 void a5xx_preempt_irq(struct msm_gpu *gpu);
 void a5xx_preempt_fini(struct msm_gpu *gpu);

 void a5xx_flush(struct msm_gpu *gpu, struct msm_ringbuffer *ring, bool sync);

 /* Return true if we are in a preempt state */
 static inline bool a5xx_in_preempt(struct a5xx_gpu *a5xx_gpu)
 {
 	int preempt_state = atomic_read(&a5xx_gpu->preempt_state);

 	return !(preempt_state == PREEMPT_NONE ||
 			preempt_state == PREEMPT_ABORT);
 }

 #endif /* __A5XX_GPU_H__ */
	/* SPDX-License-Identifier: GPL-2.0-only */
	/* Copyright (c) 2016-2017 The Linux Foundation. All rights reserved.
	*/
	#ifndef __A5XX_GPU_H__
	#define __A5XX_GPU_H__

	#include "adreno_gpu.h"

	/* Bringing over the hack from the previous targets */
	#undef ROP_COPY
	#undef ROP_XOR

	#include "a5xx.xml.h"

	struct a5xx_gpu {
	struct adreno_gpu base;

	struct drm_gem_object *pm4_bo;
	uint64_t pm4_iova;

	struct drm_gem_object *pfp_bo;
	uint64_t pfp_iova;

	struct drm_gem_object *gpmu_bo;
	uint64_t gpmu_iova;
	uint32_t gpmu_dwords;

	uint32_t lm_leakage;

	struct msm_ringbuffer *cur_ring;
	struct msm_ringbuffer *next_ring;

	struct drm_gem_object *preempt_bo[MSM_GPU_MAX_RINGS];
	struct drm_gem_object *preempt_counters_bo[MSM_GPU_MAX_RINGS];
	struct a5xx_preempt_record *preempt[MSM_GPU_MAX_RINGS];
	uint64_t preempt_iova[MSM_GPU_MAX_RINGS];
	uint32_t last_seqno[MSM_GPU_MAX_RINGS];

	atomic_t preempt_state;
	spinlock_t preempt_start_lock;
	struct timer_list preempt_timer;

	struct drm_gem_object *shadow_bo;
	uint64_t shadow_iova;
	uint32_t *shadow;

	/* True if the microcode supports the WHERE_AM_I opcode */
	bool has_whereami;
	};

	#define to_a5xx_gpu(x) container_of(x, struct a5xx_gpu, base)

	#ifdef CONFIG_DEBUG_FS
	void a5xx_debugfs_init(struct msm_gpu gpu, struct drm_minor minor);
	#endif

	/*
	* In order to do lockless preemption we use a simple state machine to progress
	* through the process.
	*
	* PREEMPT_NONE - no preemption in progress. Next state START.
	* PREEMPT_START - The trigger is evaulating if preemption is possible. Next
	* states: TRIGGERED, NONE
	* PREEMPT_ABORT - An intermediate state before moving back to NONE. Next
	* state: NONE.
	* PREEMPT_TRIGGERED: A preemption has been executed on the hardware. Next
	* states: FAULTED, PENDING
	* PREEMPT_FAULTED: A preemption timed out (never completed). This will trigger
	* recovery. Next state: N/A
	* PREEMPT_PENDING: Preemption complete interrupt fired - the callback is
	* checking the success of the operation. Next state: FAULTED, NONE.
	*/

	enum preempt_state {
	PREEMPT_NONE = 0,
	PREEMPT_START,
	PREEMPT_ABORT,
	PREEMPT_TRIGGERED,
	PREEMPT_FAULTED,
	PREEMPT_PENDING,
	};

	/*
	* struct a5xx_preempt_record is a shared buffer between the microcode and the
	* CPU to store the state for preemption. The record itself is much larger
	* (64k) but most of that is used by the CP for storage.
	*
	* There is a preemption record assigned per ringbuffer. When the CPU triggers a
	* preemption, it fills out the record with the useful information (wptr, ring
	* base, etc) and the microcode uses that information to set up the CP following
	* the preemption. When a ring is switched out, the CP will save the ringbuffer
	* state back to the record. In this way, once the records are properly set up
	* the CPU can quickly switch back and forth between ringbuffers by only
	* updating a few registers (often only the wptr).
	*
	* These are the CPU aware registers in the record:
	* @magic: Must always be 0x27C4BAFC
	* @info: Type of the record - written 0 by the CPU, updated by the CP
	* @data: Data field from SET_RENDER_MODE or a checkpoint. Written and used by
	* the CP
	* @cntl: Value of RB_CNTL written by CPU, save/restored by CP
	* @rptr: Value of RB_RPTR written by CPU, save/restored by CP
	* @wptr: Value of RB_WPTR written by CPU, save/restored by CP
	* @rptr_addr: Value of RB_RPTR_ADDR written by CPU, save/restored by CP
	* @rbase: Value of RB_BASE written by CPU, save/restored by CP
	* @counter: GPU address of the storage area for the performance counters
	*/
	struct a5xx_preempt_record {
	uint32_t magic;
	uint32_t info;
	uint32_t data;
	uint32_t cntl;
	uint32_t rptr;
	uint32_t wptr;
	uint64_t rptr_addr;
	uint64_t rbase;
	uint64_t counter;
	};

	/* Magic identifier for the preemption record */
	#define A5XX_PREEMPT_RECORD_MAGIC 0x27C4BAFCUL

	/*
	* Even though the structure above is only a few bytes, we need a full 64k to
	* store the entire preemption record from the CP
	*/
	#define A5XX_PREEMPT_RECORD_SIZE (64 * 1024)

	/*
	* The preemption counter block is a storage area for the value of the
	* preemption counters that are saved immediately before context switch. We
	* append it on to the end of the allocation for the preemption record.
	*/
	#define A5XX_PREEMPT_COUNTER_SIZE (16 * 4)


	int a5xx_power_init(struct msm_gpu *gpu);
	void a5xx_gpmu_ucode_init(struct msm_gpu *gpu);

	static inline int spin_usecs(struct msm_gpu *gpu, uint32_t usecs,
	uint32_t reg, uint32_t mask, uint32_t value)
	{
	while (usecs--) {
	udelay(1);
	if ((gpu_read(gpu, reg) & mask) == value)
	return 0;
	cpu_relax();
	}

	return -ETIMEDOUT;
	}

	#define shadowptr(a5xx_gpu, ring) ((a5xx_gpu)->shadow_iova + \
	((ring)->id * sizeof(uint32_t)))

	bool a5xx_idle(struct msm_gpu gpu, struct msm_ringbuffer ring);
	void a5xx_set_hwcg(struct msm_gpu *gpu, bool state);

	void a5xx_preempt_init(struct msm_gpu *gpu);
	void a5xx_preempt_hw_init(struct msm_gpu *gpu);
	void a5xx_preempt_trigger(struct msm_gpu *gpu);
	void a5xx_preempt_irq(struct msm_gpu *gpu);
	void a5xx_preempt_fini(struct msm_gpu *gpu);

	void a5xx_flush(struct msm_gpu gpu, struct msm_ringbuffer ring, bool sync);

	/* Return true if we are in a preempt state */
	static inline bool a5xx_in_preempt(struct a5xx_gpu *a5xx_gpu)
	{
	int preempt_state = atomic_read(&a5xx_gpu->preempt_state);

	return !(preempt_state == PREEMPT_NONE \|\|
	preempt_state == PREEMPT_ABORT);
	}

	#endif /* __A5XX_GPU_H__ */