Commit d71518b5 authored by Christian König's avatar Christian König Committed by Alex Deucher

drm/amdgpu: cleanup in kernel job submission

Add a job_alloc_with_ib helper and proper job submission.
Signed-off-by: default avatarChristian König <christian.koenig@amd.com>
Reviewed-by: default avatarAlex Deucher <alexander.deucer@amd.com>
Signed-off-by: default avatarAlex Deucher <alexander.deucher@amd.com>
parent a0332b56
...@@ -797,14 +797,11 @@ extern struct amd_sched_backend_ops amdgpu_sched_ops; ...@@ -797,14 +797,11 @@ extern struct amd_sched_backend_ops amdgpu_sched_ops;
int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs, int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
struct amdgpu_job **job); struct amdgpu_job **job);
int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
struct amdgpu_job **job);
void amdgpu_job_free(struct amdgpu_job *job); void amdgpu_job_free(struct amdgpu_job *job);
int amdgpu_sched_ib_submit_kernel_helper(struct amdgpu_device *adev, int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
struct amdgpu_ring *ring, void *owner, struct fence **f);
struct amdgpu_ib *ibs,
unsigned num_ibs,
int (*free_job)(struct amdgpu_job *),
void *owner,
struct fence **fence);
struct amdgpu_ring { struct amdgpu_ring {
struct amdgpu_device *adev; struct amdgpu_device *adev;
...@@ -987,7 +984,6 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev, ...@@ -987,7 +984,6 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev,
uint64_t addr); uint64_t addr);
void amdgpu_vm_bo_rmv(struct amdgpu_device *adev, void amdgpu_vm_bo_rmv(struct amdgpu_device *adev,
struct amdgpu_bo_va *bo_va); struct amdgpu_bo_va *bo_va);
int amdgpu_vm_free_job(struct amdgpu_job *job);
/* /*
* context related structures * context related structures
...@@ -1244,7 +1240,6 @@ struct amdgpu_job { ...@@ -1244,7 +1240,6 @@ struct amdgpu_job {
uint32_t num_ibs; uint32_t num_ibs;
void *owner; void *owner;
struct amdgpu_user_fence uf; struct amdgpu_user_fence uf;
int (*free_job)(struct amdgpu_job *job);
}; };
#define to_amdgpu_job(sched_job) \ #define to_amdgpu_job(sched_job) \
container_of((sched_job), struct amdgpu_job, base) container_of((sched_job), struct amdgpu_job, base)
......
...@@ -752,12 +752,6 @@ static int amdgpu_cs_dependencies(struct amdgpu_device *adev, ...@@ -752,12 +752,6 @@ static int amdgpu_cs_dependencies(struct amdgpu_device *adev,
return 0; return 0;
} }
static int amdgpu_cs_free_job(struct amdgpu_job *job)
{
amdgpu_job_free(job);
return 0;
}
static int amdgpu_cs_submit(struct amdgpu_cs_parser *p, static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,
union drm_amdgpu_cs *cs) union drm_amdgpu_cs *cs)
{ {
...@@ -771,12 +765,10 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p, ...@@ -771,12 +765,10 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,
job->base.sched = &ring->sched; job->base.sched = &ring->sched;
job->base.s_entity = &p->ctx->rings[ring->idx].entity; job->base.s_entity = &p->ctx->rings[ring->idx].entity;
job->owner = p->filp; job->owner = p->filp;
job->free_job = amdgpu_cs_free_job;
fence = amd_sched_fence_create(job->base.s_entity, p->filp); fence = amd_sched_fence_create(job->base.s_entity, p->filp);
if (!fence) { if (!fence) {
amdgpu_cs_free_job(job); amdgpu_job_free(job);
kfree(job);
return -ENOMEM; return -ENOMEM;
} }
......
...@@ -45,11 +45,26 @@ int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs, ...@@ -45,11 +45,26 @@ int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
(*job)->adev = adev; (*job)->adev = adev;
(*job)->ibs = (void *)&(*job)[1]; (*job)->ibs = (void *)&(*job)[1];
(*job)->num_ibs = num_ibs; (*job)->num_ibs = num_ibs;
(*job)->free_job = NULL;
return 0; return 0;
} }
int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
struct amdgpu_job **job)
{
int r;
r = amdgpu_job_alloc(adev, 1, job);
if (r)
return r;
r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
if (r)
kfree(*job);
return r;
}
void amdgpu_job_free(struct amdgpu_job *job) void amdgpu_job_free(struct amdgpu_job *job)
{ {
unsigned i; unsigned i;
...@@ -58,7 +73,27 @@ void amdgpu_job_free(struct amdgpu_job *job) ...@@ -58,7 +73,27 @@ void amdgpu_job_free(struct amdgpu_job *job)
amdgpu_ib_free(job->adev, &job->ibs[i]); amdgpu_ib_free(job->adev, &job->ibs[i]);
amdgpu_bo_unref(&job->uf.bo); amdgpu_bo_unref(&job->uf.bo);
/* TODO: Free the job structure here as well */ kfree(job);
}
int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
void *owner, struct fence **f)
{
struct amdgpu_device *adev = job->adev;
job->ring = ring;
job->base.sched = &ring->sched;
job->base.s_entity = &adev->kernel_ctx.rings[ring->idx].entity;
job->base.s_fence = amd_sched_fence_create(job->base.s_entity, owner);
if (!job->base.s_fence)
return -ENOMEM;
*f = fence_get(&job->base.s_fence->base);
job->owner = owner;
amd_sched_entity_push_job(&job->base);
return 0;
} }
static struct fence *amdgpu_sched_dependency(struct amd_sched_job *sched_job) static struct fence *amdgpu_sched_dependency(struct amd_sched_job *sched_job)
...@@ -106,10 +141,7 @@ static struct fence *amdgpu_sched_run_job(struct amd_sched_job *sched_job) ...@@ -106,10 +141,7 @@ static struct fence *amdgpu_sched_run_job(struct amd_sched_job *sched_job)
} }
err: err:
if (job->free_job) amdgpu_job_free(job);
job->free_job(job);
kfree(job);
return fence; return fence;
} }
...@@ -117,35 +149,3 @@ struct amd_sched_backend_ops amdgpu_sched_ops = { ...@@ -117,35 +149,3 @@ struct amd_sched_backend_ops amdgpu_sched_ops = {
.dependency = amdgpu_sched_dependency, .dependency = amdgpu_sched_dependency,
.run_job = amdgpu_sched_run_job, .run_job = amdgpu_sched_run_job,
}; };
int amdgpu_sched_ib_submit_kernel_helper(struct amdgpu_device *adev,
struct amdgpu_ring *ring,
struct amdgpu_ib *ibs,
unsigned num_ibs,
int (*free_job)(struct amdgpu_job *),
void *owner,
struct fence **f)
{
struct amdgpu_job *job =
kzalloc(sizeof(struct amdgpu_job), GFP_KERNEL);
if (!job)
return -ENOMEM;
job->base.sched = &ring->sched;
job->base.s_entity = &adev->kernel_ctx.rings[ring->idx].entity;
job->base.s_fence = amd_sched_fence_create(job->base.s_entity, owner);
if (!job->base.s_fence) {
kfree(job);
return -ENOMEM;
}
*f = fence_get(&job->base.s_fence->base);
job->adev = adev;
job->ring = ring;
job->ibs = ibs;
job->num_ibs = num_ibs;
job->owner = owner;
job->free_job = free_job;
amd_sched_entity_push_job(&job->base);
return 0;
}
...@@ -1012,9 +1012,10 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring, ...@@ -1012,9 +1012,10 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring,
struct fence **fence) struct fence **fence)
{ {
struct amdgpu_device *adev = ring->adev; struct amdgpu_device *adev = ring->adev;
struct amdgpu_job *job;
uint32_t max_bytes; uint32_t max_bytes;
unsigned num_loops, num_dw; unsigned num_loops, num_dw;
struct amdgpu_ib *ib;
unsigned i; unsigned i;
int r; int r;
...@@ -1026,20 +1027,12 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring, ...@@ -1026,20 +1027,12 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring,
while (num_dw & 0x7) while (num_dw & 0x7)
num_dw++; num_dw++;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(adev, num_dw * 4, &job);
if (!ib) if (r)
return -ENOMEM;
r = amdgpu_ib_get(adev, NULL, num_dw * 4, ib);
if (r) {
kfree(ib);
return r; return r;
}
ib->length_dw = 0;
if (resv) { if (resv) {
r = amdgpu_sync_resv(adev, &ib->sync, resv, r = amdgpu_sync_resv(adev, &job->ibs[0].sync, resv,
AMDGPU_FENCE_OWNER_UNDEFINED); AMDGPU_FENCE_OWNER_UNDEFINED);
if (r) { if (r) {
DRM_ERROR("sync failed (%d).\n", r); DRM_ERROR("sync failed (%d).\n", r);
...@@ -1050,27 +1043,24 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring, ...@@ -1050,27 +1043,24 @@ int amdgpu_copy_buffer(struct amdgpu_ring *ring,
for (i = 0; i < num_loops; i++) { for (i = 0; i < num_loops; i++) {
uint32_t cur_size_in_bytes = min(byte_count, max_bytes); uint32_t cur_size_in_bytes = min(byte_count, max_bytes);
amdgpu_emit_copy_buffer(adev, ib, src_offset, dst_offset, amdgpu_emit_copy_buffer(adev, &job->ibs[0], src_offset,
cur_size_in_bytes); dst_offset, cur_size_in_bytes);
src_offset += cur_size_in_bytes; src_offset += cur_size_in_bytes;
dst_offset += cur_size_in_bytes; dst_offset += cur_size_in_bytes;
byte_count -= cur_size_in_bytes; byte_count -= cur_size_in_bytes;
} }
amdgpu_ring_pad_ib(ring, ib); amdgpu_ring_pad_ib(ring, &job->ibs[0]);
WARN_ON(ib->length_dw > num_dw); WARN_ON(job->ibs[0].length_dw > num_dw);
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_UNDEFINED, fence);
&amdgpu_vm_free_job,
AMDGPU_FENCE_OWNER_UNDEFINED,
fence);
if (r) if (r)
goto error_free; goto error_free;
return 0; return 0;
error_free: error_free:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
return r; return r;
} }
......
...@@ -823,14 +823,6 @@ int amdgpu_uvd_ring_parse_cs(struct amdgpu_cs_parser *parser, uint32_t ib_idx) ...@@ -823,14 +823,6 @@ int amdgpu_uvd_ring_parse_cs(struct amdgpu_cs_parser *parser, uint32_t ib_idx)
return 0; return 0;
} }
static int amdgpu_uvd_free_job(
struct amdgpu_job *job)
{
amdgpu_ib_free(job->adev, job->ibs);
kfree(job->ibs);
return 0;
}
static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring, static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring,
struct amdgpu_bo *bo, struct amdgpu_bo *bo,
struct fence **fence) struct fence **fence)
...@@ -838,7 +830,8 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring, ...@@ -838,7 +830,8 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring,
struct ttm_validate_buffer tv; struct ttm_validate_buffer tv;
struct ww_acquire_ctx ticket; struct ww_acquire_ctx ticket;
struct list_head head; struct list_head head;
struct amdgpu_ib *ib = NULL; struct amdgpu_job *job;
struct amdgpu_ib *ib;
struct fence *f = NULL; struct fence *f = NULL;
struct amdgpu_device *adev = ring->adev; struct amdgpu_device *adev = ring->adev;
uint64_t addr; uint64_t addr;
...@@ -862,15 +855,12 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring, ...@@ -862,15 +855,12 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring,
r = ttm_bo_validate(&bo->tbo, &bo->placement, true, false); r = ttm_bo_validate(&bo->tbo, &bo->placement, true, false);
if (r) if (r)
goto err; goto err;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL);
if (!ib) { r = amdgpu_job_alloc_with_ib(adev, 64, &job);
r = -ENOMEM;
goto err;
}
r = amdgpu_ib_get(adev, NULL, 64, ib);
if (r) if (r)
goto err1; goto err;
ib = &job->ibs[0];
addr = amdgpu_bo_gpu_offset(bo); addr = amdgpu_bo_gpu_offset(bo);
ib->ptr[0] = PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0); ib->ptr[0] = PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0);
ib->ptr[1] = addr; ib->ptr[1] = addr;
...@@ -882,12 +872,9 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring, ...@@ -882,12 +872,9 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring,
ib->ptr[i] = PACKET2(0); ib->ptr[i] = PACKET2(0);
ib->length_dw = 16; ib->length_dw = 16;
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_UNDEFINED, &f);
&amdgpu_uvd_free_job,
AMDGPU_FENCE_OWNER_UNDEFINED,
&f);
if (r) if (r)
goto err2; goto err_free;
ttm_eu_fence_buffer_objects(&ticket, &head, f); ttm_eu_fence_buffer_objects(&ticket, &head, f);
...@@ -897,10 +884,10 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring, ...@@ -897,10 +884,10 @@ static int amdgpu_uvd_send_msg(struct amdgpu_ring *ring,
fence_put(f); fence_put(f);
return 0; return 0;
err2:
amdgpu_ib_free(ring->adev, ib); err_free:
err1: amdgpu_job_free(job);
kfree(ib);
err: err:
ttm_eu_backoff_reservation(&ticket, &head); ttm_eu_backoff_reservation(&ticket, &head);
return r; return r;
......
...@@ -346,14 +346,6 @@ void amdgpu_vce_free_handles(struct amdgpu_device *adev, struct drm_file *filp) ...@@ -346,14 +346,6 @@ void amdgpu_vce_free_handles(struct amdgpu_device *adev, struct drm_file *filp)
} }
} }
static int amdgpu_vce_free_job(
struct amdgpu_job *job)
{
amdgpu_ib_free(job->adev, job->ibs);
kfree(job->ibs);
return 0;
}
/** /**
* amdgpu_vce_get_create_msg - generate a VCE create msg * amdgpu_vce_get_create_msg - generate a VCE create msg
* *
...@@ -368,21 +360,17 @@ int amdgpu_vce_get_create_msg(struct amdgpu_ring *ring, uint32_t handle, ...@@ -368,21 +360,17 @@ int amdgpu_vce_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
struct fence **fence) struct fence **fence)
{ {
const unsigned ib_size_dw = 1024; const unsigned ib_size_dw = 1024;
struct amdgpu_ib *ib = NULL; struct amdgpu_job *job;
struct amdgpu_ib *ib;
struct fence *f = NULL; struct fence *f = NULL;
struct amdgpu_device *adev = ring->adev;
uint64_t dummy; uint64_t dummy;
int i, r; int i, r;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
if (!ib) if (r)
return -ENOMEM;
r = amdgpu_ib_get(adev, NULL, ib_size_dw * 4, ib);
if (r) {
DRM_ERROR("amdgpu: failed to get ib (%d).\n", r);
kfree(ib);
return r; return r;
}
ib = &job->ibs[0];
dummy = ib->gpu_addr + 1024; dummy = ib->gpu_addr + 1024;
...@@ -423,19 +411,16 @@ int amdgpu_vce_get_create_msg(struct amdgpu_ring *ring, uint32_t handle, ...@@ -423,19 +411,16 @@ int amdgpu_vce_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
for (i = ib->length_dw; i < ib_size_dw; ++i) for (i = ib->length_dw; i < ib_size_dw; ++i)
ib->ptr[i] = 0x0; ib->ptr[i] = 0x0;
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_UNDEFINED, &f);
&amdgpu_vce_free_job,
AMDGPU_FENCE_OWNER_UNDEFINED,
&f);
if (r) if (r)
goto err; goto err;
if (fence) if (fence)
*fence = fence_get(f); *fence = fence_get(f);
fence_put(f); fence_put(f);
return 0; return 0;
err: err:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
return r; return r;
} }
...@@ -453,23 +438,17 @@ int amdgpu_vce_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle, ...@@ -453,23 +438,17 @@ int amdgpu_vce_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
struct fence **fence) struct fence **fence)
{ {
const unsigned ib_size_dw = 1024; const unsigned ib_size_dw = 1024;
struct amdgpu_ib *ib = NULL; struct amdgpu_job *job;
struct amdgpu_ib *ib;
struct fence *f = NULL; struct fence *f = NULL;
struct amdgpu_device *adev = ring->adev;
uint64_t dummy; uint64_t dummy;
int i, r; int i, r;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
if (!ib) if (r)
return -ENOMEM;
r = amdgpu_ib_get(adev, NULL, ib_size_dw * 4, ib);
if (r) {
kfree(ib);
DRM_ERROR("amdgpu: failed to get ib (%d).\n", r);
return r; return r;
}
ib = &job->ibs[0];
dummy = ib->gpu_addr + 1024; dummy = ib->gpu_addr + 1024;
/* stitch together an VCE destroy msg */ /* stitch together an VCE destroy msg */
...@@ -489,19 +468,16 @@ int amdgpu_vce_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle, ...@@ -489,19 +468,16 @@ int amdgpu_vce_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
for (i = ib->length_dw; i < ib_size_dw; ++i) for (i = ib->length_dw; i < ib_size_dw; ++i)
ib->ptr[i] = 0x0; ib->ptr[i] = 0x0;
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_UNDEFINED, &f);
&amdgpu_vce_free_job,
AMDGPU_FENCE_OWNER_UNDEFINED,
&f);
if (r) if (r)
goto err; goto err;
if (fence) if (fence)
*fence = fence_get(f); *fence = fence_get(f);
fence_put(f); fence_put(f);
return 0; return 0;
err: err:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
return r; return r;
} }
......
...@@ -313,15 +313,6 @@ static void amdgpu_vm_update_pages(struct amdgpu_device *adev, ...@@ -313,15 +313,6 @@ static void amdgpu_vm_update_pages(struct amdgpu_device *adev,
} }
} }
int amdgpu_vm_free_job(struct amdgpu_job *job)
{
int i;
for (i = 0; i < job->num_ibs; i++)
amdgpu_ib_free(job->adev, &job->ibs[i]);
kfree(job->ibs);
return 0;
}
/** /**
* amdgpu_vm_clear_bo - initially clear the page dir/table * amdgpu_vm_clear_bo - initially clear the page dir/table
* *
...@@ -335,7 +326,7 @@ static int amdgpu_vm_clear_bo(struct amdgpu_device *adev, ...@@ -335,7 +326,7 @@ static int amdgpu_vm_clear_bo(struct amdgpu_device *adev,
{ {
struct amdgpu_ring *ring = adev->vm_manager.vm_pte_funcs_ring; struct amdgpu_ring *ring = adev->vm_manager.vm_pte_funcs_ring;
struct fence *fence = NULL; struct fence *fence = NULL;
struct amdgpu_ib *ib; struct amdgpu_job *job;
unsigned entries; unsigned entries;
uint64_t addr; uint64_t addr;
int r; int r;
...@@ -351,32 +342,25 @@ static int amdgpu_vm_clear_bo(struct amdgpu_device *adev, ...@@ -351,32 +342,25 @@ static int amdgpu_vm_clear_bo(struct amdgpu_device *adev,
addr = amdgpu_bo_gpu_offset(bo); addr = amdgpu_bo_gpu_offset(bo);
entries = amdgpu_bo_size(bo) / 8; entries = amdgpu_bo_size(bo) / 8;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(adev, 64, &job);
if (!ib) if (r)
goto error; goto error;
r = amdgpu_ib_get(adev, NULL, 64, ib); amdgpu_vm_update_pages(adev, NULL, 0, &job->ibs[0], addr, 0, entries,
0, 0);
amdgpu_ring_pad_ib(ring, &job->ibs[0]);
WARN_ON(job->ibs[0].length_dw > 64);
r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_VM, &fence);
if (r) if (r)
goto error_free; goto error_free;
ib->length_dw = 0;
amdgpu_vm_update_pages(adev, NULL, 0, ib, addr, 0, entries, 0, 0);
amdgpu_ring_pad_ib(ring, ib);
WARN_ON(ib->length_dw > 64);
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1,
&amdgpu_vm_free_job,
AMDGPU_FENCE_OWNER_VM,
&fence);
if (!r)
amdgpu_bo_fence(bo, fence, true); amdgpu_bo_fence(bo, fence, true);
fence_put(fence); fence_put(fence);
return 0; return 0;
error_free: error_free:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
error: error:
return r; return r;
...@@ -433,6 +417,7 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev, ...@@ -433,6 +417,7 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev,
uint32_t incr = AMDGPU_VM_PTE_COUNT * 8; uint32_t incr = AMDGPU_VM_PTE_COUNT * 8;
uint64_t last_pde = ~0, last_pt = ~0; uint64_t last_pde = ~0, last_pt = ~0;
unsigned count = 0, pt_idx, ndw; unsigned count = 0, pt_idx, ndw;
struct amdgpu_job *job;
struct amdgpu_ib *ib; struct amdgpu_ib *ib;
struct fence *fence = NULL; struct fence *fence = NULL;
...@@ -444,16 +429,11 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev, ...@@ -444,16 +429,11 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev,
/* assume the worst case */ /* assume the worst case */
ndw += vm->max_pde_used * 6; ndw += vm->max_pde_used * 6;
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(adev, ndw * 4, &job);
if (!ib) if (r)
return -ENOMEM;
r = amdgpu_ib_get(adev, NULL, ndw * 4, ib);
if (r) {
kfree(ib);
return r; return r;
}
ib->length_dw = 0; ib = &job->ibs[0];
/* walk over the address space and update the page directory */ /* walk over the address space and update the page directory */
for (pt_idx = 0; pt_idx <= vm->max_pde_used; ++pt_idx) { for (pt_idx = 0; pt_idx <= vm->max_pde_used; ++pt_idx) {
...@@ -495,10 +475,7 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev, ...@@ -495,10 +475,7 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev,
amdgpu_ring_pad_ib(ring, ib); amdgpu_ring_pad_ib(ring, ib);
amdgpu_sync_resv(adev, &ib->sync, pd->tbo.resv, AMDGPU_FENCE_OWNER_VM); amdgpu_sync_resv(adev, &ib->sync, pd->tbo.resv, AMDGPU_FENCE_OWNER_VM);
WARN_ON(ib->length_dw > ndw); WARN_ON(ib->length_dw > ndw);
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_VM, &fence);
&amdgpu_vm_free_job,
AMDGPU_FENCE_OWNER_VM,
&fence);
if (r) if (r)
goto error_free; goto error_free;
...@@ -506,18 +483,15 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev, ...@@ -506,18 +483,15 @@ int amdgpu_vm_update_page_directory(struct amdgpu_device *adev,
fence_put(vm->page_directory_fence); fence_put(vm->page_directory_fence);
vm->page_directory_fence = fence_get(fence); vm->page_directory_fence = fence_get(fence);
fence_put(fence); fence_put(fence);
}
if (ib->length_dw == 0) { } else {
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
} }
return 0; return 0;
error_free: error_free:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
return r; return r;
} }
...@@ -695,6 +669,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, ...@@ -695,6 +669,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev,
struct amdgpu_ring *ring = adev->vm_manager.vm_pte_funcs_ring; struct amdgpu_ring *ring = adev->vm_manager.vm_pte_funcs_ring;
void *owner = AMDGPU_FENCE_OWNER_VM; void *owner = AMDGPU_FENCE_OWNER_VM;
unsigned nptes, ncmds, ndw; unsigned nptes, ncmds, ndw;
struct amdgpu_job *job;
struct amdgpu_ib *ib; struct amdgpu_ib *ib;
struct fence *f = NULL; struct fence *f = NULL;
int r; int r;
...@@ -733,15 +708,11 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, ...@@ -733,15 +708,11 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev,
ndw += 2 * 10; ndw += 2 * 10;
} }
ib = kzalloc(sizeof(struct amdgpu_ib), GFP_KERNEL); r = amdgpu_job_alloc_with_ib(adev, ndw * 4, &job);
if (!ib) if (r)
return -ENOMEM;
r = amdgpu_ib_get(adev, NULL, ndw * 4, ib);
if (r) {
kfree(ib);
return r; return r;
}
ib = &job->ibs[0];
r = amdgpu_sync_resv(adev, &ib->sync, vm->page_directory->tbo.resv, r = amdgpu_sync_resv(adev, &ib->sync, vm->page_directory->tbo.resv,
owner); owner);
...@@ -757,10 +728,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, ...@@ -757,10 +728,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev,
amdgpu_ring_pad_ib(ring, ib); amdgpu_ring_pad_ib(ring, ib);
WARN_ON(ib->length_dw > ndw); WARN_ON(ib->length_dw > ndw);
r = amdgpu_sched_ib_submit_kernel_helper(adev, ring, ib, 1, r = amdgpu_job_submit(job, ring, AMDGPU_FENCE_OWNER_VM, &f);
&amdgpu_vm_free_job,
AMDGPU_FENCE_OWNER_VM,
&f);
if (r) if (r)
goto error_free; goto error_free;
...@@ -773,8 +741,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, ...@@ -773,8 +741,7 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev,
return 0; return 0;
error_free: error_free:
amdgpu_ib_free(adev, ib); amdgpu_job_free(job);
kfree(ib);
return r; return r;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment