Commit dd5a376c authored by Arunpravin Paneer Selvam's avatar Arunpravin Paneer Selvam Committed by Alex Deucher
Browse files

drm/amdgpu: enable userqueue secure sem for GFX 12



- Add a field in struct amdgpu_mqd_prop for userqueue
  secure sem fence address since now we have a generic
  file for mes_userqueue.c
- Add secure sem fence address mqd support to gfx12 into
  their corresponding init functions.
- Enable secure semaphore IRQ handling

V2: Address review comment from Alex:
    Use fence_address instead of fenceaddress (Shashank)

Cc: Alex Deucher <alexander.deucher@amd.com>
Cc: Christian Koenig <christian.koenig@amd.com>
Reviewed-by: default avatarAlex Deucher <alexander.deucher@amd.com>
Signed-off-by: default avatarArunpravin Paneer Selvam <Arunpravin.PaneerSelvam@amd.com>
Signed-off-by: default avatarSomalapuram Amaranath <Amaranath.Somalapuram@amd.com>
Signed-off-by: default avatarShashank Sharma <shashank.sharma@amd.com>
Signed-off-by: default avatarAlex Deucher <alexander.deucher@amd.com>
parent 988c9e70
Loading
Loading
Loading
Loading
+1 −0
Original line number Diff line number Diff line
@@ -833,6 +833,7 @@ struct amdgpu_mqd_prop {
	uint64_t shadow_addr;
	uint64_t gds_bkup_addr;
	uint64_t csa_addr;
	uint64_t fence_address;
};

struct amdgpu_mqd {
+2 −0
Original line number Diff line number Diff line
@@ -4134,6 +4134,8 @@ static int gfx_v11_0_gfx_mqd_init(struct amdgpu_device *adev, void *m,
	mqd->gds_bkup_base_hi = upper_32_bits(prop->gds_bkup_addr);
	mqd->fw_work_area_base_lo = lower_32_bits(prop->csa_addr);
	mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr);
	mqd->fence_address_lo = lower_32_bits(prop->fence_address);
	mqd->fence_address_hi = upper_32_bits(prop->fence_address);

	return 0;
}
+14 −13
Original line number Diff line number Diff line
@@ -45,6 +45,7 @@
#include "nbif_v6_3_1.h"
#include "mes_v12_0.h"
#include "mes_userqueue.h"
#include "amdgpu_userq_fence.h"

#define GFX12_NUM_GFX_RINGS	1
#define GFX12_MEC_HPD_SIZE	2048
@@ -3037,6 +3038,8 @@ static int gfx_v12_0_gfx_mqd_init(struct amdgpu_device *adev, void *m,
	mqd->shadow_base_hi = upper_32_bits(prop->shadow_addr);
	mqd->fw_work_area_base_lo = lower_32_bits(prop->csa_addr);
	mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr);
	mqd->fence_address_lo = lower_32_bits(prop->fence_address);
	mqd->fence_address_hi = upper_32_bits(prop->fence_address);

	return 0;
}
@@ -4819,25 +4822,23 @@ static int gfx_v12_0_eop_irq(struct amdgpu_device *adev,
			     struct amdgpu_irq_src *source,
			     struct amdgpu_iv_entry *entry)
{
	int i;
	u32 doorbell_offset = entry->src_data[0];
	u8 me_id, pipe_id, queue_id;
	struct amdgpu_ring *ring;
	uint32_t mes_queue_id = entry->src_data[0];
	int i;

	DRM_DEBUG("IH: CP EOP\n");

	if (adev->enable_mes && (mes_queue_id & AMDGPU_FENCE_MES_QUEUE_FLAG)) {
		struct amdgpu_mes_queue *queue;

		mes_queue_id &= AMDGPU_FENCE_MES_QUEUE_ID_MASK;
	if (adev->enable_mes && doorbell_offset) {
		struct amdgpu_userq_fence_driver *fence_drv = NULL;
		struct xarray *xa = &adev->userq_xa;
		unsigned long flags;

		spin_lock(&adev->mes.queue_id_lock);
		queue = idr_find(&adev->mes.queue_id_idr, mes_queue_id);
		if (queue) {
			DRM_DEBUG("process mes queue id = %d\n", mes_queue_id);
			amdgpu_fence_process(queue->ring);
		}
		spin_unlock(&adev->mes.queue_id_lock);
		xa_lock_irqsave(xa, flags);
		fence_drv = xa_load(xa, doorbell_offset);
		if (fence_drv)
			amdgpu_userq_fence_driver_process(fence_drv);
		xa_unlock_irqrestore(xa, flags);
	} else {
		me_id = (entry->ring_id & 0x0c) >> 2;
		pipe_id = (entry->ring_id & 0x03) >> 0;
+1 −10
Original line number Diff line number Diff line
@@ -185,14 +185,6 @@ static int mes_userq_create_ctx_space(struct amdgpu_userq_mgr *uq_mgr,
	return 0;
}

static void mes_userq_set_fence_space(struct amdgpu_usermode_queue *queue)
{
	struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr;

	mqd->fenceaddress_lo = lower_32_bits(queue->fence_drv->gpu_addr);
	mqd->fenceaddress_hi = upper_32_bits(queue->fence_drv->gpu_addr);
}

static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
				struct drm_amdgpu_userq_in *args_in,
				struct amdgpu_usermode_queue *queue)
@@ -231,6 +223,7 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
	userq_props->mqd_gpu_addr = queue->mqd.gpu_addr;
	userq_props->use_doorbell = true;
	userq_props->doorbell_index = queue->doorbell_index;
	userq_props->fence_address = queue->fence_drv->gpu_addr;

	if (queue->queue_type == AMDGPU_HW_IP_COMPUTE) {
		struct drm_amdgpu_userq_mqd_compute_gfx11 *compute_mqd;
@@ -307,8 +300,6 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
		goto free_mqd;
	}

	mes_userq_set_fence_space(queue);

	/* FW expects WPTR BOs to be mapped into GART */
	r = mes_userq_create_wptr_mapping(uq_mgr, queue, userq_props->wptr_gpu_addr);
	if (r) {
+2 −2
Original line number Diff line number Diff line
@@ -535,8 +535,8 @@ struct v11_gfx_mqd {
	uint32_t reserved_507; // offset: 507  (0x1FB)
	uint32_t reserved_508; // offset: 508  (0x1FC)
	uint32_t reserved_509; // offset: 509  (0x1FD)
	uint32_t fenceaddress_lo; // offset: 510  (0x1FE)
	uint32_t fenceaddress_hi; // offset: 511  (0x1FF)
	uint32_t fence_address_lo; // offset: 510  (0x1FE)
	uint32_t fence_address_hi; // offset: 511  (0x1FF)
};

struct v11_sdma_mqd {
Loading