msm/adreno/a5xx_gpu.h

/* SPDX-License-Identifier: GPL-2.0-only */
/* Copyright (c) 2016-2017 The Linux Foundation. All rights reserved.
 */
#ifndef __A5XX_GPU_H__
#define __A5XX_GPU_H__

#include "adreno_gpu.h"

/* Bringing over the hack from the previous targets */
#undef ROP_COPY
#undef ROP_XOR

#include "a5xx.xml.h"

*4882a593Smuzhiyunstruct a5xx_gpu {
*4882a593Smuzhiyun	struct adreno_gpu base;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct drm_gem_object *pm4_bo;
*4882a593Smuzhiyun	uint64_t pm4_iova;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct drm_gem_object *pfp_bo;
*4882a593Smuzhiyun	uint64_t pfp_iova;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct drm_gem_object *gpmu_bo;
*4882a593Smuzhiyun	uint64_t gpmu_iova;
*4882a593Smuzhiyun	uint32_t gpmu_dwords;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	uint32_t lm_leakage;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct msm_ringbuffer *cur_ring;
*4882a593Smuzhiyun	struct msm_ringbuffer *next_ring;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct drm_gem_object *preempt_bo[MSM_GPU_MAX_RINGS];
*4882a593Smuzhiyun	struct drm_gem_object *preempt_counters_bo[MSM_GPU_MAX_RINGS];
*4882a593Smuzhiyun	struct a5xx_preempt_record *preempt[MSM_GPU_MAX_RINGS];
*4882a593Smuzhiyun	uint64_t preempt_iova[MSM_GPU_MAX_RINGS];
*4882a593Smuzhiyun
*4882a593Smuzhiyun	atomic_t preempt_state;
*4882a593Smuzhiyun	struct timer_list preempt_timer;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	struct drm_gem_object *shadow_bo;
*4882a593Smuzhiyun	uint64_t shadow_iova;
*4882a593Smuzhiyun	uint32_t *shadow;
*4882a593Smuzhiyun
*4882a593Smuzhiyun	/* True if the microcode supports the WHERE_AM_I opcode */
*4882a593Smuzhiyun	bool has_whereami;
*4882a593Smuzhiyun};
*4882a593Smuzhiyun
/*
 * Convert a pointer to the embedded adreno_gpu ("base" member) back into a
 * pointer to the struct a5xx_gpu that contains it.
 */
#define to_a5xx_gpu(x) container_of(x, struct a5xx_gpu, base)

/*
 * Only declared when CONFIG_DEBUG_FS is set; no stub is provided here for the
 * disabled case, so references must be guarded the same way.
 */
#ifdef CONFIG_DEBUG_FS
void a5xx_debugfs_init(struct msm_gpu *gpu, struct drm_minor *minor);
#endif

/*
 * In order to do lockless preemption we use a simple state machine to progress
 * through the process.
 *
 * PREEMPT_NONE: No preemption in progress. Next state: START.
 * PREEMPT_START: The trigger is evaluating if preemption is possible. Next
 * states: TRIGGERED, NONE
 * PREEMPT_ABORT: An intermediate state before moving back to NONE. Next
 * state: NONE.
 * PREEMPT_TRIGGERED: A preemption has been executed on the hardware. Next
 * states: FAULTED, PENDING
 * PREEMPT_FAULTED: A preemption timed out (never completed). This will trigger
 * recovery. Next state: N/A
 * PREEMPT_PENDING: Preemption complete interrupt fired - the callback is
 * checking the success of the operation. Next states: FAULTED, NONE.
 */

enum preempt_state {
	PREEMPT_NONE = 0,
	PREEMPT_START,
	PREEMPT_ABORT,
	PREEMPT_TRIGGERED,
	PREEMPT_FAULTED,
	PREEMPT_PENDING,
};

/*
 * struct a5xx_preempt_record is a shared buffer between the microcode and the
 * CPU to store the state for preemption. The record itself is much larger
 * (64k) but most of that is used by the CP for storage.
 *
 * There is a preemption record assigned per ringbuffer. When the CPU triggers a
 * preemption, it fills out the record with the useful information (wptr, ring
 * base, etc) and the microcode uses that information to set up the CP following
 * the preemption.  When a ring is switched out, the CP will save the ringbuffer
 * state back to the record. In this way, once the records are properly set up
 * the CPU can quickly switch back and forth between ringbuffers by only
 * updating a few registers (often only the wptr).
 *
 * These are the CPU-aware fields in the record:
 * @magic: Must always be 0x27C4BAFC (A5XX_PREEMPT_RECORD_MAGIC)
 * @info: Type of the record - written 0 by the CPU, updated by the CP
 * @data: Data field from SET_RENDER_MODE or a checkpoint. Written and used by
 *        the CP
 * @cntl: Value of RB_CNTL written by CPU, save/restored by CP
 * @rptr: Value of RB_RPTR written by CPU, save/restored by CP
 * @wptr: Value of RB_WPTR written by CPU, save/restored by CP
 * @rptr_addr: Value of RB_RPTR_ADDR written by CPU, save/restored by CP
 * @rbase: Value of RB_BASE written by CPU, save/restored by CP
 * @counter: GPU address of the storage area for the performance counters
 *
 * The field order and widths are shared with the microcode; do not reorder.
 */
struct a5xx_preempt_record {
	uint32_t magic;
	uint32_t info;
	uint32_t data;
	uint32_t cntl;
	uint32_t rptr;
	uint32_t wptr;
	uint64_t rptr_addr;
	uint64_t rbase;
	uint64_t counter;
};

/* Magic identifier for the preemption record */
#define A5XX_PREEMPT_RECORD_MAGIC 0x27C4BAFCUL

/*
 * Even though the structure above is only a few bytes, we need a full 64k to
 * store the entire preemption record from the CP
 */
#define A5XX_PREEMPT_RECORD_SIZE (64 * 1024)

/*
 * The preemption counter block is a storage area for the value of the
 * preemption counters that are saved immediately before context switch. We
 * append it on to the end of the allocation for the preemption record.
 *
 * NOTE(review): struct a5xx_gpu carries a separate preempt_counters_bo[]
 * array, so the counters may now live in their own allocation rather than
 * being appended to the record - confirm against the preemption setup code.
 */
#define A5XX_PREEMPT_COUNTER_SIZE (16 * 4)


/*
 * Power/GPMU setup entry points, implemented outside this header.
 * a5xx_power_init() reports a result as an int (presumably 0 or a negative
 * errno - confirm against the implementation); a5xx_gpmu_ucode_init() has no
 * return value.
 */
int a5xx_power_init(struct msm_gpu *gpu);
void a5xx_gpmu_ucode_init(struct msm_gpu *gpu);

/*
 * spin_usecs - busy-wait for a masked register value.
 * @gpu: GPU whose register is read via gpu_read()
 * @usecs: maximum number of polls; each poll is preceded by udelay(1)
 * @reg: register offset passed to gpu_read()
 * @mask: bits of the register value to compare
 * @value: expected value of (register & @mask)
 *
 * Returns 0 as soon as (gpu_read(gpu, reg) & mask) == value, or -ETIMEDOUT
 * once @usecs polls have elapsed without a match. The delay happens before
 * the first read, and with @usecs == 0 the register is never read at all.
 */
static inline int spin_usecs(struct msm_gpu *gpu, uint32_t usecs,
		uint32_t reg, uint32_t mask, uint32_t value)
{
	while (usecs--) {
		udelay(1);
		if ((gpu_read(gpu, reg) & mask) == value)
			return 0;
		cpu_relax();
	}

	return -ETIMEDOUT;
}

/*
 * Address of the shadow slot for @ring: shadow_iova plus one uint32_t-sized
 * slot per ring id.
 */
#define shadowptr(a5xx_gpu, ring) ((a5xx_gpu)->shadow_iova + \
		((ring)->id * sizeof(uint32_t)))

/*
 * Implemented outside this header. NOTE(review): a5xx_idle() presumably
 * reports whether @ring drained, and a5xx_set_hwcg() presumably switches
 * hardware clock gating on or off per @state - confirm against the
 * implementations.
 */
bool a5xx_idle(struct msm_gpu *gpu, struct msm_ringbuffer *ring);
void a5xx_set_hwcg(struct msm_gpu *gpu, bool state);

/*
 * Preemption entry points, implemented outside this header. They drive the
 * enum preempt_state machine described earlier in this file; none of them
 * returns a status.
 */
void a5xx_preempt_init(struct msm_gpu *gpu);
void a5xx_preempt_hw_init(struct msm_gpu *gpu);
void a5xx_preempt_trigger(struct msm_gpu *gpu);
void a5xx_preempt_irq(struct msm_gpu *gpu);
void a5xx_preempt_fini(struct msm_gpu *gpu);

/*
 * Implemented outside this header. NOTE(review): the meaning of @sync is not
 * visible here - confirm against the implementation before relying on it.
 */
void a5xx_flush(struct msm_gpu *gpu, struct msm_ringbuffer *ring, bool sync);

*4882a593Smuzhiyun/* Return true if we are in a preempt state */
*4882a593Smuzhiyunstatic inline bool a5xx_in_preempt(struct a5xx_gpu *a5xx_gpu)
*4882a593Smuzhiyun{
*4882a593Smuzhiyun	int preempt_state = atomic_read(&a5xx_gpu->preempt_state);
*4882a593Smuzhiyun
*4882a593Smuzhiyun	return !(preempt_state == PREEMPT_NONE ||
*4882a593Smuzhiyun			preempt_state == PREEMPT_ABORT);
*4882a593Smuzhiyun}
*4882a593Smuzhiyun
#endif /* __A5XX_GPU_H__ */