Commit 25ce7c50 authored by Brian Welty, committed by Matthew Brost

drm/xe: Finish refactoring of exec_queue_create

Setting of exec_queue user extensions is moved from the end of the ioctl
function to an earlier point, inside __xe_exec_queue_alloc().
This fixes a bug in which the USM attributes for access counters were
applied too late and were effectively ignored.

However, in order to apply user extensions this early, we can no longer
call q->ops functions.  Instead, use a simpler and more efficient approach:
the user extension functions just update the q->sched_props values, and the
backend applies them during q->ops->init().

v2: minor changes for readability (Matt)
Signed-off-by: Brian Welty <brian.welty@intel.com>
Signed-off-by: Matthew Brost <matthew.brost@intel.com>
Reviewed-by: Matthew Brost <matthew.brost@intel.com>
parent 6ae24344
...@@ -30,14 +30,18 @@ enum xe_exec_queue_sched_prop { ...@@ -30,14 +30,18 @@ enum xe_exec_queue_sched_prop {
XE_EXEC_QUEUE_SCHED_PROP_MAX = 3, XE_EXEC_QUEUE_SCHED_PROP_MAX = 3,
}; };
static int exec_queue_user_extensions(struct xe_device *xe, struct xe_exec_queue *q,
u64 extensions, int ext_number, bool create);
static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe, static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe,
struct xe_vm *vm, struct xe_vm *vm,
u32 logical_mask, u32 logical_mask,
u16 width, struct xe_hw_engine *hwe, u16 width, struct xe_hw_engine *hwe,
u32 flags) u32 flags, u64 extensions)
{ {
struct xe_exec_queue *q; struct xe_exec_queue *q;
struct xe_gt *gt = hwe->gt; struct xe_gt *gt = hwe->gt;
int err;
/* only kernel queues can be permanent */ /* only kernel queues can be permanent */
XE_WARN_ON((flags & EXEC_QUEUE_FLAG_PERMANENT) && !(flags & EXEC_QUEUE_FLAG_KERNEL)); XE_WARN_ON((flags & EXEC_QUEUE_FLAG_PERMANENT) && !(flags & EXEC_QUEUE_FLAG_KERNEL));
...@@ -50,8 +54,6 @@ static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe, ...@@ -50,8 +54,6 @@ static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe,
q->flags = flags; q->flags = flags;
q->hwe = hwe; q->hwe = hwe;
q->gt = gt; q->gt = gt;
if (vm)
q->vm = xe_vm_get(vm);
q->class = hwe->class; q->class = hwe->class;
q->width = width; q->width = width;
q->logical_mask = logical_mask; q->logical_mask = logical_mask;
...@@ -73,6 +75,21 @@ static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe, ...@@ -73,6 +75,21 @@ static struct xe_exec_queue *__xe_exec_queue_alloc(struct xe_device *xe,
else else
q->sched_props.priority = XE_EXEC_QUEUE_PRIORITY_NORMAL; q->sched_props.priority = XE_EXEC_QUEUE_PRIORITY_NORMAL;
if (extensions) {
/*
* may set q->usm, must come before xe_lrc_init(),
* may overwrite q->sched_props, must come before q->ops->init()
*/
err = exec_queue_user_extensions(xe, q, extensions, 0, true);
if (err) {
kfree(q);
return ERR_PTR(err);
}
}
if (vm)
q->vm = xe_vm_get(vm);
if (xe_exec_queue_is_parallel(q)) { if (xe_exec_queue_is_parallel(q)) {
q->parallel.composite_fence_ctx = dma_fence_context_alloc(1); q->parallel.composite_fence_ctx = dma_fence_context_alloc(1);
q->parallel.composite_fence_seqno = XE_FENCE_INITIAL_SEQNO; q->parallel.composite_fence_seqno = XE_FENCE_INITIAL_SEQNO;
...@@ -128,12 +145,14 @@ static int __xe_exec_queue_init(struct xe_exec_queue *q) ...@@ -128,12 +145,14 @@ static int __xe_exec_queue_init(struct xe_exec_queue *q)
struct xe_exec_queue *xe_exec_queue_create(struct xe_device *xe, struct xe_vm *vm, struct xe_exec_queue *xe_exec_queue_create(struct xe_device *xe, struct xe_vm *vm,
u32 logical_mask, u16 width, u32 logical_mask, u16 width,
struct xe_hw_engine *hwe, u32 flags) struct xe_hw_engine *hwe, u32 flags,
u64 extensions)
{ {
struct xe_exec_queue *q; struct xe_exec_queue *q;
int err; int err;
q = __xe_exec_queue_alloc(xe, vm, logical_mask, width, hwe, flags); q = __xe_exec_queue_alloc(xe, vm, logical_mask, width, hwe, flags,
extensions);
if (IS_ERR(q)) if (IS_ERR(q))
return q; return q;
...@@ -178,7 +197,7 @@ struct xe_exec_queue *xe_exec_queue_create_class(struct xe_device *xe, struct xe ...@@ -178,7 +197,7 @@ struct xe_exec_queue *xe_exec_queue_create_class(struct xe_device *xe, struct xe
if (!logical_mask) if (!logical_mask)
return ERR_PTR(-ENODEV); return ERR_PTR(-ENODEV);
return xe_exec_queue_create(xe, vm, logical_mask, 1, hwe0, flags); return xe_exec_queue_create(xe, vm, logical_mask, 1, hwe0, flags, 0);
} }
void xe_exec_queue_destroy(struct kref *ref) void xe_exec_queue_destroy(struct kref *ref)
...@@ -262,7 +281,11 @@ static int exec_queue_set_priority(struct xe_device *xe, struct xe_exec_queue *q ...@@ -262,7 +281,11 @@ static int exec_queue_set_priority(struct xe_device *xe, struct xe_exec_queue *q
if (XE_IOCTL_DBG(xe, value > xe_exec_queue_device_get_max_priority(xe))) if (XE_IOCTL_DBG(xe, value > xe_exec_queue_device_get_max_priority(xe)))
return -EPERM; return -EPERM;
if (!create)
return q->ops->set_priority(q, value); return q->ops->set_priority(q, value);
q->sched_props.priority = value;
return 0;
} }
static bool xe_exec_queue_enforce_schedule_limit(void) static bool xe_exec_queue_enforce_schedule_limit(void)
...@@ -329,7 +352,11 @@ static int exec_queue_set_timeslice(struct xe_device *xe, struct xe_exec_queue * ...@@ -329,7 +352,11 @@ static int exec_queue_set_timeslice(struct xe_device *xe, struct xe_exec_queue *
!xe_hw_engine_timeout_in_range(value, min, max)) !xe_hw_engine_timeout_in_range(value, min, max))
return -EINVAL; return -EINVAL;
if (!create)
return q->ops->set_timeslice(q, value); return q->ops->set_timeslice(q, value);
q->sched_props.timeslice_us = value;
return 0;
} }
static int exec_queue_set_preemption_timeout(struct xe_device *xe, static int exec_queue_set_preemption_timeout(struct xe_device *xe,
...@@ -345,7 +372,11 @@ static int exec_queue_set_preemption_timeout(struct xe_device *xe, ...@@ -345,7 +372,11 @@ static int exec_queue_set_preemption_timeout(struct xe_device *xe,
!xe_hw_engine_timeout_in_range(value, min, max)) !xe_hw_engine_timeout_in_range(value, min, max))
return -EINVAL; return -EINVAL;
if (!create)
return q->ops->set_preempt_timeout(q, value); return q->ops->set_preempt_timeout(q, value);
q->sched_props.preempt_timeout_us = value;
return 0;
} }
static int exec_queue_set_persistence(struct xe_device *xe, struct xe_exec_queue *q, static int exec_queue_set_persistence(struct xe_device *xe, struct xe_exec_queue *q,
...@@ -380,7 +411,9 @@ static int exec_queue_set_job_timeout(struct xe_device *xe, struct xe_exec_queue ...@@ -380,7 +411,9 @@ static int exec_queue_set_job_timeout(struct xe_device *xe, struct xe_exec_queue
!xe_hw_engine_timeout_in_range(value, min, max)) !xe_hw_engine_timeout_in_range(value, min, max))
return -EINVAL; return -EINVAL;
return q->ops->set_job_timeout(q, value); q->sched_props.job_timeout_ms = value;
return 0;
} }
static int exec_queue_set_acc_trigger(struct xe_device *xe, struct xe_exec_queue *q, static int exec_queue_set_acc_trigger(struct xe_device *xe, struct xe_exec_queue *q,
...@@ -655,6 +688,7 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data, ...@@ -655,6 +688,7 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data,
if (eci[0].engine_class == DRM_XE_ENGINE_CLASS_VM_BIND) { if (eci[0].engine_class == DRM_XE_ENGINE_CLASS_VM_BIND) {
for_each_gt(gt, xe, id) { for_each_gt(gt, xe, id) {
struct xe_exec_queue *new; struct xe_exec_queue *new;
u32 flags;
if (xe_gt_is_media_type(gt)) if (xe_gt_is_media_type(gt))
continue; continue;
...@@ -673,14 +707,13 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data, ...@@ -673,14 +707,13 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data,
/* The migration vm doesn't hold rpm ref */ /* The migration vm doesn't hold rpm ref */
xe_device_mem_access_get(xe); xe_device_mem_access_get(xe);
flags = EXEC_QUEUE_FLAG_PERSISTENT | EXEC_QUEUE_FLAG_VM |
(id ? EXEC_QUEUE_FLAG_BIND_ENGINE_CHILD : 0);
migrate_vm = xe_migrate_get_vm(gt_to_tile(gt)->migrate); migrate_vm = xe_migrate_get_vm(gt_to_tile(gt)->migrate);
new = xe_exec_queue_create(xe, migrate_vm, logical_mask, new = xe_exec_queue_create(xe, migrate_vm, logical_mask,
args->width, hwe, args->width, hwe, flags,
EXEC_QUEUE_FLAG_PERSISTENT | args->extensions);
EXEC_QUEUE_FLAG_VM |
(id ?
EXEC_QUEUE_FLAG_BIND_ENGINE_CHILD :
0));
xe_device_mem_access_put(xe); /* now held by engine */ xe_device_mem_access_put(xe); /* now held by engine */
...@@ -728,7 +761,8 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data, ...@@ -728,7 +761,8 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data,
q = xe_exec_queue_create(xe, vm, logical_mask, q = xe_exec_queue_create(xe, vm, logical_mask,
args->width, hwe, args->width, hwe,
xe_vm_in_lr_mode(vm) ? 0 : xe_vm_in_lr_mode(vm) ? 0 :
EXEC_QUEUE_FLAG_PERSISTENT); EXEC_QUEUE_FLAG_PERSISTENT,
args->extensions);
up_read(&vm->lock); up_read(&vm->lock);
xe_vm_put(vm); xe_vm_put(vm);
if (IS_ERR(q)) if (IS_ERR(q))
...@@ -744,12 +778,6 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data, ...@@ -744,12 +778,6 @@ int xe_exec_queue_create_ioctl(struct drm_device *dev, void *data,
} }
} }
if (args->extensions) {
err = exec_queue_user_extensions(xe, q, args->extensions, 0, true);
if (XE_IOCTL_DBG(xe, err))
goto kill_exec_queue;
}
q->persistent.xef = xef; q->persistent.xef = xef;
mutex_lock(&xef->exec_queue.lock); mutex_lock(&xef->exec_queue.lock);
......
...@@ -16,7 +16,8 @@ struct xe_file; ...@@ -16,7 +16,8 @@ struct xe_file;
struct xe_exec_queue *xe_exec_queue_create(struct xe_device *xe, struct xe_vm *vm, struct xe_exec_queue *xe_exec_queue_create(struct xe_device *xe, struct xe_vm *vm,
u32 logical_mask, u16 width, u32 logical_mask, u16 width,
struct xe_hw_engine *hw_engine, u32 flags); struct xe_hw_engine *hw_engine, u32 flags,
u64 extensions);
struct xe_exec_queue *xe_exec_queue_create_class(struct xe_device *xe, struct xe_gt *gt, struct xe_exec_queue *xe_exec_queue_create_class(struct xe_device *xe, struct xe_gt *gt,
struct xe_vm *vm, struct xe_vm *vm,
enum xe_engine_class class, u32 flags); enum xe_engine_class class, u32 flags);
......
...@@ -356,7 +356,7 @@ int xe_gsc_init_post_hwconfig(struct xe_gsc *gsc) ...@@ -356,7 +356,7 @@ int xe_gsc_init_post_hwconfig(struct xe_gsc *gsc)
q = xe_exec_queue_create(xe, NULL, q = xe_exec_queue_create(xe, NULL,
BIT(hwe->logical_instance), 1, hwe, BIT(hwe->logical_instance), 1, hwe,
EXEC_QUEUE_FLAG_KERNEL | EXEC_QUEUE_FLAG_KERNEL |
EXEC_QUEUE_FLAG_PERMANENT); EXEC_QUEUE_FLAG_PERMANENT, 0);
if (IS_ERR(q)) { if (IS_ERR(q)) {
xe_gt_err(gt, "Failed to create queue for GSC submission\n"); xe_gt_err(gt, "Failed to create queue for GSC submission\n");
err = PTR_ERR(q); err = PTR_ERR(q);
......
...@@ -235,7 +235,7 @@ int xe_gt_record_default_lrcs(struct xe_gt *gt) ...@@ -235,7 +235,7 @@ int xe_gt_record_default_lrcs(struct xe_gt *gt)
return -ENOMEM; return -ENOMEM;
q = xe_exec_queue_create(xe, NULL, BIT(hwe->logical_instance), 1, q = xe_exec_queue_create(xe, NULL, BIT(hwe->logical_instance), 1,
hwe, EXEC_QUEUE_FLAG_KERNEL); hwe, EXEC_QUEUE_FLAG_KERNEL, 0);
if (IS_ERR(q)) { if (IS_ERR(q)) {
err = PTR_ERR(q); err = PTR_ERR(q);
xe_gt_err(gt, "hwe %s: xe_exec_queue_create failed (%pe)\n", xe_gt_err(gt, "hwe %s: xe_exec_queue_create failed (%pe)\n",
...@@ -252,7 +252,7 @@ int xe_gt_record_default_lrcs(struct xe_gt *gt) ...@@ -252,7 +252,7 @@ int xe_gt_record_default_lrcs(struct xe_gt *gt)
} }
nop_q = xe_exec_queue_create(xe, NULL, BIT(hwe->logical_instance), nop_q = xe_exec_queue_create(xe, NULL, BIT(hwe->logical_instance),
1, hwe, EXEC_QUEUE_FLAG_KERNEL); 1, hwe, EXEC_QUEUE_FLAG_KERNEL, 0);
if (IS_ERR(nop_q)) { if (IS_ERR(nop_q)) {
err = PTR_ERR(nop_q); err = PTR_ERR(nop_q);
xe_gt_err(gt, "hwe %s: nop xe_exec_queue_create failed (%pe)\n", xe_gt_err(gt, "hwe %s: nop xe_exec_queue_create failed (%pe)\n",
......
...@@ -345,7 +345,7 @@ struct xe_migrate *xe_migrate_init(struct xe_tile *tile) ...@@ -345,7 +345,7 @@ struct xe_migrate *xe_migrate_init(struct xe_tile *tile)
m->q = xe_exec_queue_create(xe, vm, logical_mask, 1, hwe, m->q = xe_exec_queue_create(xe, vm, logical_mask, 1, hwe,
EXEC_QUEUE_FLAG_KERNEL | EXEC_QUEUE_FLAG_KERNEL |
EXEC_QUEUE_FLAG_PERMANENT | EXEC_QUEUE_FLAG_PERMANENT |
EXEC_QUEUE_FLAG_HIGH_PRIORITY); EXEC_QUEUE_FLAG_HIGH_PRIORITY, 0);
} else { } else {
m->q = xe_exec_queue_create_class(xe, primary_gt, vm, m->q = xe_exec_queue_create_class(xe, primary_gt, vm,
XE_ENGINE_CLASS_COPY, XE_ENGINE_CLASS_COPY,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment