mirror of https://gitee.com/openkylin/linux.git
drm/amdgpu: fix and cleanup user fence handling v2
We leaked the BO in the error path; in addition, we only have one user fence for all IBs in a job. v2: remove white space changes. Signed-off-by: Christian König <christian.koenig@amd.com> Reviewed-by: Alex Deucher <alexander.deucher@amd.com> Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
This commit is contained in:
parent
d88bf583bd
commit
758ac17f96
|
@ -368,13 +368,6 @@ struct amdgpu_fence_driver {
|
||||||
#define AMDGPU_FENCE_FLAG_64BIT (1 << 0)
|
#define AMDGPU_FENCE_FLAG_64BIT (1 << 0)
|
||||||
#define AMDGPU_FENCE_FLAG_INT (1 << 1)
|
#define AMDGPU_FENCE_FLAG_INT (1 << 1)
|
||||||
|
|
||||||
struct amdgpu_user_fence {
|
|
||||||
/* write-back bo */
|
|
||||||
struct amdgpu_bo *bo;
|
|
||||||
/* write-back address offset to bo start */
|
|
||||||
uint32_t offset;
|
|
||||||
};
|
|
||||||
|
|
||||||
int amdgpu_fence_driver_init(struct amdgpu_device *adev);
|
int amdgpu_fence_driver_init(struct amdgpu_device *adev);
|
||||||
void amdgpu_fence_driver_fini(struct amdgpu_device *adev);
|
void amdgpu_fence_driver_fini(struct amdgpu_device *adev);
|
||||||
void amdgpu_fence_driver_force_completion(struct amdgpu_device *adev);
|
void amdgpu_fence_driver_force_completion(struct amdgpu_device *adev);
|
||||||
|
@ -741,10 +734,7 @@ struct amdgpu_ib {
|
||||||
uint32_t length_dw;
|
uint32_t length_dw;
|
||||||
uint64_t gpu_addr;
|
uint64_t gpu_addr;
|
||||||
uint32_t *ptr;
|
uint32_t *ptr;
|
||||||
struct amdgpu_user_fence *user;
|
|
||||||
uint32_t flags;
|
uint32_t flags;
|
||||||
/* resulting sequence number */
|
|
||||||
uint64_t sequence;
|
|
||||||
};
|
};
|
||||||
|
|
||||||
enum amdgpu_ring_type {
|
enum amdgpu_ring_type {
|
||||||
|
@ -1219,7 +1209,7 @@ void amdgpu_ring_fini(struct amdgpu_ring *ring);
|
||||||
struct amdgpu_cs_chunk {
|
struct amdgpu_cs_chunk {
|
||||||
uint32_t chunk_id;
|
uint32_t chunk_id;
|
||||||
uint32_t length_dw;
|
uint32_t length_dw;
|
||||||
uint32_t *kdata;
|
void *kdata;
|
||||||
};
|
};
|
||||||
|
|
||||||
struct amdgpu_cs_parser {
|
struct amdgpu_cs_parser {
|
||||||
|
@ -1263,7 +1253,12 @@ struct amdgpu_job {
|
||||||
uint32_t gds_base, gds_size;
|
uint32_t gds_base, gds_size;
|
||||||
uint32_t gws_base, gws_size;
|
uint32_t gws_base, gws_size;
|
||||||
uint32_t oa_base, oa_size;
|
uint32_t oa_base, oa_size;
|
||||||
struct amdgpu_user_fence uf;
|
|
||||||
|
/* user fence handling */
|
||||||
|
struct amdgpu_bo *uf_bo;
|
||||||
|
uint32_t uf_offset;
|
||||||
|
uint64_t uf_sequence;
|
||||||
|
|
||||||
};
|
};
|
||||||
#define to_amdgpu_job(sched_job) \
|
#define to_amdgpu_job(sched_job) \
|
||||||
container_of((sched_job), struct amdgpu_job, base)
|
container_of((sched_job), struct amdgpu_job, base)
|
||||||
|
|
|
@ -87,33 +87,30 @@ int amdgpu_cs_get_ring(struct amdgpu_device *adev, u32 ip_type,
|
||||||
}
|
}
|
||||||
|
|
||||||
static int amdgpu_cs_user_fence_chunk(struct amdgpu_cs_parser *p,
|
static int amdgpu_cs_user_fence_chunk(struct amdgpu_cs_parser *p,
|
||||||
struct amdgpu_user_fence *uf,
|
struct drm_amdgpu_cs_chunk_fence *data,
|
||||||
struct drm_amdgpu_cs_chunk_fence *fence_data)
|
uint32_t *offset)
|
||||||
{
|
{
|
||||||
struct drm_gem_object *gobj;
|
struct drm_gem_object *gobj;
|
||||||
uint32_t handle;
|
|
||||||
|
|
||||||
handle = fence_data->handle;
|
|
||||||
gobj = drm_gem_object_lookup(p->adev->ddev, p->filp,
|
gobj = drm_gem_object_lookup(p->adev->ddev, p->filp,
|
||||||
fence_data->handle);
|
data->handle);
|
||||||
if (gobj == NULL)
|
if (gobj == NULL)
|
||||||
return -EINVAL;
|
return -EINVAL;
|
||||||
|
|
||||||
uf->bo = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj));
|
p->uf_entry.robj = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj));
|
||||||
uf->offset = fence_data->offset;
|
|
||||||
|
|
||||||
if (amdgpu_ttm_tt_get_usermm(uf->bo->tbo.ttm)) {
|
|
||||||
drm_gem_object_unreference_unlocked(gobj);
|
|
||||||
return -EINVAL;
|
|
||||||
}
|
|
||||||
|
|
||||||
p->uf_entry.robj = amdgpu_bo_ref(uf->bo);
|
|
||||||
p->uf_entry.priority = 0;
|
p->uf_entry.priority = 0;
|
||||||
p->uf_entry.tv.bo = &p->uf_entry.robj->tbo;
|
p->uf_entry.tv.bo = &p->uf_entry.robj->tbo;
|
||||||
p->uf_entry.tv.shared = true;
|
p->uf_entry.tv.shared = true;
|
||||||
p->uf_entry.user_pages = NULL;
|
p->uf_entry.user_pages = NULL;
|
||||||
|
*offset = data->offset;
|
||||||
|
|
||||||
drm_gem_object_unreference_unlocked(gobj);
|
drm_gem_object_unreference_unlocked(gobj);
|
||||||
|
|
||||||
|
if (amdgpu_ttm_tt_get_usermm(p->uf_entry.robj->tbo.ttm)) {
|
||||||
|
amdgpu_bo_unref(&p->uf_entry.robj);
|
||||||
|
return -EINVAL;
|
||||||
|
}
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -124,8 +121,8 @@ int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)
|
||||||
union drm_amdgpu_cs *cs = data;
|
union drm_amdgpu_cs *cs = data;
|
||||||
uint64_t *chunk_array_user;
|
uint64_t *chunk_array_user;
|
||||||
uint64_t *chunk_array;
|
uint64_t *chunk_array;
|
||||||
struct amdgpu_user_fence uf = {};
|
|
||||||
unsigned size, num_ibs = 0;
|
unsigned size, num_ibs = 0;
|
||||||
|
uint32_t uf_offset = 0;
|
||||||
int i;
|
int i;
|
||||||
int ret;
|
int ret;
|
||||||
|
|
||||||
|
@ -200,7 +197,8 @@ int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)
|
||||||
goto free_partial_kdata;
|
goto free_partial_kdata;
|
||||||
}
|
}
|
||||||
|
|
||||||
ret = amdgpu_cs_user_fence_chunk(p, &uf, (void *)p->chunks[i].kdata);
|
ret = amdgpu_cs_user_fence_chunk(p, p->chunks[i].kdata,
|
||||||
|
&uf_offset);
|
||||||
if (ret)
|
if (ret)
|
||||||
goto free_partial_kdata;
|
goto free_partial_kdata;
|
||||||
|
|
||||||
|
@ -219,7 +217,10 @@ int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)
|
||||||
if (ret)
|
if (ret)
|
||||||
goto free_all_kdata;
|
goto free_all_kdata;
|
||||||
|
|
||||||
p->job->uf = uf;
|
if (p->uf_entry.robj) {
|
||||||
|
p->job->uf_bo = amdgpu_bo_ref(p->uf_entry.robj);
|
||||||
|
p->job->uf_offset = uf_offset;
|
||||||
|
}
|
||||||
|
|
||||||
kfree(chunk_array);
|
kfree(chunk_array);
|
||||||
return 0;
|
return 0;
|
||||||
|
@ -377,7 +378,7 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
|
||||||
INIT_LIST_HEAD(&duplicates);
|
INIT_LIST_HEAD(&duplicates);
|
||||||
amdgpu_vm_get_pd_bo(&fpriv->vm, &p->validated, &p->vm_pd);
|
amdgpu_vm_get_pd_bo(&fpriv->vm, &p->validated, &p->vm_pd);
|
||||||
|
|
||||||
if (p->job->uf.bo)
|
if (p->uf_entry.robj)
|
||||||
list_add(&p->uf_entry.tv.head, &p->validated);
|
list_add(&p->uf_entry.tv.head, &p->validated);
|
||||||
|
|
||||||
if (need_mmap_lock)
|
if (need_mmap_lock)
|
||||||
|
@ -760,18 +761,12 @@ static int amdgpu_cs_ib_fill(struct amdgpu_device *adev,
|
||||||
j++;
|
j++;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* wrap the last IB with user fence */
|
|
||||||
if (parser->job->uf.bo) {
|
|
||||||
struct amdgpu_ib *ib = &parser->job->ibs[parser->job->num_ibs - 1];
|
|
||||||
|
|
||||||
/* UVD & VCE fw doesn't support user fences */
|
/* UVD & VCE fw doesn't support user fences */
|
||||||
if (parser->job->ring->type == AMDGPU_RING_TYPE_UVD ||
|
if (parser->job->uf_bo && (
|
||||||
parser->job->ring->type == AMDGPU_RING_TYPE_VCE)
|
parser->job->ring->type == AMDGPU_RING_TYPE_UVD ||
|
||||||
|
parser->job->ring->type == AMDGPU_RING_TYPE_VCE))
|
||||||
return -EINVAL;
|
return -EINVAL;
|
||||||
|
|
||||||
ib->user = &parser->job->uf;
|
|
||||||
}
|
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -856,7 +851,7 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,
|
||||||
job->ctx = entity->fence_context;
|
job->ctx = entity->fence_context;
|
||||||
p->fence = fence_get(fence);
|
p->fence = fence_get(fence);
|
||||||
cs->out.handle = amdgpu_ctx_add_fence(p->ctx, ring, fence);
|
cs->out.handle = amdgpu_ctx_add_fence(p->ctx, ring, fence);
|
||||||
job->ibs[job->num_ibs - 1].sequence = cs->out.handle;
|
job->uf_sequence = cs->out.handle;
|
||||||
|
|
||||||
trace_amdgpu_cs_ioctl(job);
|
trace_amdgpu_cs_ioctl(job);
|
||||||
amd_sched_entity_push_job(&job->base);
|
amd_sched_entity_push_job(&job->base);
|
||||||
|
|
|
@ -203,10 +203,11 @@ int amdgpu_ib_schedule(struct amdgpu_ring *ring, unsigned num_ibs,
|
||||||
}
|
}
|
||||||
|
|
||||||
/* wrap the last IB with fence */
|
/* wrap the last IB with fence */
|
||||||
if (ib->user) {
|
if (job && job->uf_bo) {
|
||||||
uint64_t addr = amdgpu_bo_gpu_offset(ib->user->bo);
|
uint64_t addr = amdgpu_bo_gpu_offset(job->uf_bo);
|
||||||
addr += ib->user->offset;
|
|
||||||
amdgpu_ring_emit_fence(ring, addr, ib->sequence,
|
addr += job->uf_offset;
|
||||||
|
amdgpu_ring_emit_fence(ring, addr, job->uf_sequence,
|
||||||
AMDGPU_FENCE_FLAG_64BIT);
|
AMDGPU_FENCE_FLAG_64BIT);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -97,7 +97,7 @@ void amdgpu_job_free(struct amdgpu_job *job)
|
||||||
amdgpu_sa_bo_free(job->adev, &job->ibs[i].sa_bo, f);
|
amdgpu_sa_bo_free(job->adev, &job->ibs[i].sa_bo, f);
|
||||||
fence_put(job->fence);
|
fence_put(job->fence);
|
||||||
|
|
||||||
amdgpu_bo_unref(&job->uf.bo);
|
amdgpu_bo_unref(&job->uf_bo);
|
||||||
amdgpu_sync_free(&job->sync);
|
amdgpu_sync_free(&job->sync);
|
||||||
|
|
||||||
if (!job->base.use_sched)
|
if (!job->base.use_sched)
|
||||||
|
|
Loading…
Reference in New Issue