Skip to content

Commit efab6d8

Browse files
ickledanvet
authored and committed
drm/i915: Use a separate slab for requests
Requests are even more frequently allocated than objects and equally benefit from having a dedicated slab. v2: Rebase. Signed-off-by: Chris Wilson <[email protected]>. Signed-off-by: Daniel Vetter <[email protected]>.
1 parent f1e2dae commit efab6d8

File tree

4 files changed

+35
-23
lines changed

4 files changed

+35
-23
lines changed

drivers/gpu/drm/i915/i915_dma.c

Lines changed: 8 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1006,8 +1006,10 @@ int i915_driver_load(struct drm_device *dev, unsigned long flags)
10061006
put_bridge:
10071007
pci_dev_put(dev_priv->bridge_dev);
10081008
free_priv:
1009-
if (dev_priv->slab)
1010-
kmem_cache_destroy(dev_priv->slab);
1009+
if (dev_priv->requests)
1010+
kmem_cache_destroy(dev_priv->requests);
1011+
if (dev_priv->objects)
1012+
kmem_cache_destroy(dev_priv->objects);
10111013
kfree(dev_priv);
10121014
return ret;
10131015
}
@@ -1090,8 +1092,10 @@ int i915_driver_unload(struct drm_device *dev)
10901092
if (dev_priv->regs != NULL)
10911093
pci_iounmap(dev->pdev, dev_priv->regs);
10921094

1093-
if (dev_priv->slab)
1094-
kmem_cache_destroy(dev_priv->slab);
1095+
if (dev_priv->requests)
1096+
kmem_cache_destroy(dev_priv->requests);
1097+
if (dev_priv->objects)
1098+
kmem_cache_destroy(dev_priv->objects);
10951099

10961100
pci_dev_put(dev_priv->bridge_dev);
10971101
kfree(dev_priv);

drivers/gpu/drm/i915/i915_drv.h

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1558,7 +1558,8 @@ struct i915_virtual_gpu {
15581558

15591559
struct drm_i915_private {
15601560
struct drm_device *dev;
1561-
struct kmem_cache *slab;
1561+
struct kmem_cache *objects;
1562+
struct kmem_cache *requests;
15621563

15631564
const struct intel_device_info info;
15641565

@@ -2044,6 +2045,7 @@ struct drm_i915_gem_request {
20442045
struct kref ref;
20452046

20462047
/** On Which ring this request was generated */
2048+
struct drm_i915_private *i915;
20472049
struct intel_engine_cs *ring;
20482050

20492051
/** GEM sequence number associated with this request. */

drivers/gpu/drm/i915/i915_gem.c

Lines changed: 24 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -378,13 +378,13 @@ i915_gem_phys_pwrite(struct drm_i915_gem_object *obj,
378378
void *i915_gem_object_alloc(struct drm_device *dev)
379379
{
380380
struct drm_i915_private *dev_priv = dev->dev_private;
381-
return kmem_cache_zalloc(dev_priv->slab, GFP_KERNEL);
381+
return kmem_cache_zalloc(dev_priv->objects, GFP_KERNEL);
382382
}
383383

384384
void i915_gem_object_free(struct drm_i915_gem_object *obj)
385385
{
386386
struct drm_i915_private *dev_priv = obj->base.dev->dev_private;
387-
kmem_cache_free(dev_priv->slab, obj);
387+
kmem_cache_free(dev_priv->objects, obj);
388388
}
389389

390390
static int
@@ -2506,43 +2506,45 @@ void i915_gem_request_free(struct kref *req_ref)
25062506
i915_gem_context_unreference(ctx);
25072507
}
25082508

2509-
kfree(req);
2509+
kmem_cache_free(req->i915->requests, req);
25102510
}
25112511

25122512
int i915_gem_request_alloc(struct intel_engine_cs *ring,
25132513
struct intel_context *ctx)
25142514
{
2515+
struct drm_i915_private *dev_priv = to_i915(ring->dev);
2516+
struct drm_i915_gem_request *rq;
25152517
int ret;
2516-
struct drm_i915_gem_request *request;
2517-
struct drm_i915_private *dev_private = ring->dev->dev_private;
25182518

25192519
if (ring->outstanding_lazy_request)
25202520
return 0;
25212521

2522-
request = kzalloc(sizeof(*request), GFP_KERNEL);
2523-
if (request == NULL)
2522+
rq = kmem_cache_zalloc(dev_priv->requests, GFP_KERNEL);
2523+
if (rq == NULL)
25242524
return -ENOMEM;
25252525

2526-
ret = i915_gem_get_seqno(ring->dev, &request->seqno);
2526+
kref_init(&rq->ref);
2527+
rq->i915 = dev_priv;
2528+
2529+
ret = i915_gem_get_seqno(ring->dev, &rq->seqno);
25272530
if (ret) {
2528-
kfree(request);
2531+
kfree(rq);
25292532
return ret;
25302533
}
25312534

2532-
kref_init(&request->ref);
2533-
request->ring = ring;
2534-
request->uniq = dev_private->request_uniq++;
2535+
rq->ring = ring;
2536+
rq->uniq = dev_priv->request_uniq++;
25352537

25362538
if (i915.enable_execlists)
2537-
ret = intel_logical_ring_alloc_request_extras(request, ctx);
2539+
ret = intel_logical_ring_alloc_request_extras(rq, ctx);
25382540
else
2539-
ret = intel_ring_alloc_request_extras(request);
2541+
ret = intel_ring_alloc_request_extras(rq);
25402542
if (ret) {
2541-
kfree(request);
2543+
kfree(rq);
25422544
return ret;
25432545
}
25442546

2545-
ring->outstanding_lazy_request = request;
2547+
ring->outstanding_lazy_request = rq;
25462548
return 0;
25472549
}
25482550

@@ -4984,11 +4986,16 @@ i915_gem_load(struct drm_device *dev)
49844986
struct drm_i915_private *dev_priv = dev->dev_private;
49854987
int i;
49864988

4987-
dev_priv->slab =
4989+
dev_priv->objects =
49884990
kmem_cache_create("i915_gem_object",
49894991
sizeof(struct drm_i915_gem_object), 0,
49904992
SLAB_HWCACHE_ALIGN,
49914993
NULL);
4994+
dev_priv->requests =
4995+
kmem_cache_create("i915_gem_request",
4996+
sizeof(struct drm_i915_gem_request), 0,
4997+
SLAB_HWCACHE_ALIGN,
4998+
NULL);
49924999

49935000
INIT_LIST_HEAD(&dev_priv->vm_list);
49945001
i915_init_vm(dev_priv, &dev_priv->gtt.base);

drivers/gpu/drm/i915/intel_ringbuffer.c

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2139,7 +2139,6 @@ int intel_ring_idle(struct intel_engine_cs *ring)
21392139
int intel_ring_alloc_request_extras(struct drm_i915_gem_request *request)
21402140
{
21412141
request->ringbuf = request->ring->buffer;
2142-
21432142
return 0;
21442143
}
21452144

0 commit comments

Comments
 (0)