Skip to content

Commit 70c96e3

Browse files
committed
drm/i915/gem: Take a copy of the engines for context_barrier_task
When applying the context-barrier, we only care about the current engines, as the next set of engines will naturally come after the barrier. So we can skip holding the ctx->engines_mutex while constructing the request by taking a sneaky reference to the i915_gem_engines instead.

Signed-off-by: Chris Wilson <[email protected]>
Cc: Maarten Lankhorst <[email protected]>
Reviewed-by: Maarten Lankhorst <[email protected]>
Link: https://patchwork.freedesktop.org/patch/msgid/[email protected]
1 parent c02aac2 commit 70c96e3

File tree

1 file changed

+77
-37
lines changed

1 file changed

+77
-37
lines changed

drivers/gpu/drm/i915/gem/i915_gem_context.c

Lines changed: 77 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -261,14 +261,54 @@ static void free_engines_rcu(struct rcu_head *rcu)
261261
free_engines(engines);
262262
}
263263

264+
static int __i915_sw_fence_call
265+
engines_notify(struct i915_sw_fence *fence, enum i915_sw_fence_notify state)
266+
{
267+
struct i915_gem_engines *engines =
268+
container_of(fence, typeof(*engines), fence);
269+
270+
switch (state) {
271+
case FENCE_COMPLETE:
272+
if (!list_empty(&engines->link)) {
273+
struct i915_gem_context *ctx = engines->ctx;
274+
unsigned long flags;
275+
276+
spin_lock_irqsave(&ctx->stale.lock, flags);
277+
list_del(&engines->link);
278+
spin_unlock_irqrestore(&ctx->stale.lock, flags);
279+
}
280+
i915_gem_context_put(engines->ctx);
281+
break;
282+
283+
case FENCE_FREE:
284+
init_rcu_head(&engines->rcu);
285+
call_rcu(&engines->rcu, free_engines_rcu);
286+
break;
287+
}
288+
289+
return NOTIFY_DONE;
290+
}
291+
292+
static struct i915_gem_engines *alloc_engines(unsigned int count)
293+
{
294+
struct i915_gem_engines *e;
295+
296+
e = kzalloc(struct_size(e, engines, count), GFP_KERNEL);
297+
if (!e)
298+
return NULL;
299+
300+
i915_sw_fence_init(&e->fence, engines_notify);
301+
return e;
302+
}
303+
264304
static struct i915_gem_engines *default_engines(struct i915_gem_context *ctx)
265305
{
266306
const struct intel_gt *gt = &ctx->i915->gt;
267307
struct intel_engine_cs *engine;
268308
struct i915_gem_engines *e;
269309
enum intel_engine_id id;
270310

271-
e = kzalloc(struct_size(e, engines, I915_NUM_ENGINES), GFP_KERNEL);
311+
e = alloc_engines(I915_NUM_ENGINES);
272312
if (!e)
273313
return ERR_PTR(-ENOMEM);
274314

@@ -519,41 +559,12 @@ static void kill_context(struct i915_gem_context *ctx)
519559
kill_stale_engines(ctx);
520560
}
521561

522-
/*
 * engines_notify - fence callback for a struct i915_gem_engines.
 *
 * Recovers the engines set that embeds @fence and acts on @state:
 * FENCE_COMPLETE unlinks the set (if linked) and puts engines->ctx;
 * FENCE_FREE queues the set for release through call_rcu().
 * Always returns NOTIFY_DONE.
 */
static int __i915_sw_fence_call
523-
engines_notify(struct i915_sw_fence *fence, enum i915_sw_fence_notify state)
524-
{
525-
struct i915_gem_engines *engines =
526-
container_of(fence, typeof(*engines), fence);
527-
528-
switch (state) {
529-
case FENCE_COMPLETE:
530-
/* Skip the lock entirely when the link is already empty. */
if (!list_empty(&engines->link)) {
531-
struct i915_gem_context *ctx = engines->ctx;
532-
unsigned long flags;
533-
534-
/* The unlink is done under ctx->stale.lock with IRQ state saved. */
spin_lock_irqsave(&ctx->stale.lock, flags);
535-
list_del(&engines->link);
536-
spin_unlock_irqrestore(&ctx->stale.lock, flags);
537-
}
538-
/* Put the context stored in engines->ctx. */
i915_gem_context_put(engines->ctx);
539-
break;
540-
541-
case FENCE_FREE:
542-
/* Defer the release: free_engines_rcu() runs as an RCU callback. */
init_rcu_head(&engines->rcu);
543-
call_rcu(&engines->rcu, free_engines_rcu);
544-
break;
545-
}
546-
547-
return NOTIFY_DONE;
548-
}
549-
550562
static void engines_idle_release(struct i915_gem_context *ctx,
551563
struct i915_gem_engines *engines)
552564
{
553565
struct i915_gem_engines_iter it;
554566
struct intel_context *ce;
555567

556-
i915_sw_fence_init(&engines->fence, engines_notify);
557568
INIT_LIST_HEAD(&engines->link);
558569

559570
engines->ctx = i915_gem_context_get(ctx);
@@ -1057,6 +1068,30 @@ static void cb_retire(struct i915_active *base)
10571068
kfree(cb);
10581069
}
10591070

1071+
/*
 * __context_engines_await - pin the context's current engines set
 * @ctx: context whose ctx->engines pointer is sampled
 *
 * Under rcu_read_lock(), repeatedly samples ctx->engines, takes an
 * await on that set's fence, and then re-reads ctx->engines to check
 * the pointer has not been replaced in the meantime. If it has, the
 * await is dropped again and the loop retries with the new pointer.
 *
 * Returns the engines set with an await held on its fence, or NULL if
 * ctx->engines was NULL. A non-NULL result must be balanced by the
 * caller with i915_sw_fence_complete(&engines->fence).
 */
static inline struct i915_gem_engines *
1072+
__context_engines_await(const struct i915_gem_context *ctx)
1073+
{
1074+
struct i915_gem_engines *engines;
1075+
1076+
rcu_read_lock();
1077+
do {
1078+
engines = rcu_dereference(ctx->engines);
1079+
/* No engines installed: give up and return NULL. */
if (unlikely(!engines))
1080+
break;
1081+
1082+
/*
 * Could not take an await on this set's fence; go round again and
 * re-sample ctx->engines.
 * NOTE(review): presumably the await fails once the fence has
 * already been signaled - confirm against i915_sw_fence_await().
 */
if (unlikely(!i915_sw_fence_await(&engines->fence)))
1083+
continue;
1084+
1085+
/* Pointer unchanged since we sampled it: keep the await and exit. */
if (likely(engines == rcu_access_pointer(ctx->engines)))
1086+
break;
1087+
1088+
/* ctx->engines was replaced under us: drop the await and retry. */
i915_sw_fence_complete(&engines->fence);
1089+
} while (1);
1090+
rcu_read_unlock();
1091+
1092+
return engines;
1093+
}
1094+
10601095
I915_SELFTEST_DECLARE(static intel_engine_mask_t context_barrier_inject_fault);
10611096
static int context_barrier_task(struct i915_gem_context *ctx,
10621097
intel_engine_mask_t engines,
@@ -1067,6 +1102,7 @@ static int context_barrier_task(struct i915_gem_context *ctx,
10671102
{
10681103
struct context_barrier_task *cb;
10691104
struct i915_gem_engines_iter it;
1105+
struct i915_gem_engines *e;
10701106
struct intel_context *ce;
10711107
int err = 0;
10721108

@@ -1083,7 +1119,13 @@ static int context_barrier_task(struct i915_gem_context *ctx,
10831119
return err;
10841120
}
10851121

1086-
for_each_gem_engine(ce, i915_gem_context_lock_engines(ctx), it) {
1122+
e = __context_engines_await(ctx);
1123+
if (!e) {
1124+
i915_active_release(&cb->base);
1125+
return -ENOENT;
1126+
}
1127+
1128+
for_each_gem_engine(ce, e, it) {
10871129
struct i915_request *rq;
10881130

10891131
if (I915_SELFTEST_ONLY(context_barrier_inject_fault &
@@ -1114,7 +1156,7 @@ static int context_barrier_task(struct i915_gem_context *ctx,
11141156
if (err)
11151157
break;
11161158
}
1117-
i915_gem_context_unlock_engines(ctx);
1159+
i915_sw_fence_complete(&e->fence);
11181160

11191161
cb->task = err ? NULL : task; /* caller needs to unwind instead */
11201162
cb->data = data;
@@ -1741,9 +1783,7 @@ set_engines(struct i915_gem_context *ctx,
17411783
* first 64 engines defined here.
17421784
*/
17431785
num_engines = (args->size - sizeof(*user)) / sizeof(*user->engines);
1744-
1745-
set.engines = kmalloc(struct_size(set.engines, engines, num_engines),
1746-
GFP_KERNEL);
1786+
set.engines = alloc_engines(num_engines);
17471787
if (!set.engines)
17481788
return -ENOMEM;
17491789

@@ -1823,7 +1863,7 @@ __copy_engines(struct i915_gem_engines *e)
18231863
struct i915_gem_engines *copy;
18241864
unsigned int n;
18251865

1826-
copy = kmalloc(struct_size(e, engines, e->num_engines), GFP_KERNEL);
1866+
copy = alloc_engines(e->num_engines);
18271867
if (!copy)
18281868
return ERR_PTR(-ENOMEM);
18291869

@@ -2084,7 +2124,7 @@ static int clone_engines(struct i915_gem_context *dst,
20842124
bool user_engines;
20852125
unsigned long n;
20862126

2087-
clone = kmalloc(struct_size(e, engines, e->num_engines), GFP_KERNEL);
2127+
clone = alloc_engines(e->num_engines);
20882128
if (!clone)
20892129
goto err_unlock;
20902130

0 commit comments

Comments
 (0)