Skip to content

Commit

Permalink
drm/i915: Parse command buffer earlier in eb_relocate(slow)
Browse files Browse the repository at this point in the history
We want to introduce backoff logic, but command parsing also needs
the pool object to be locked, so the engine pool object will need
backoff logic as well. To prepare for this, move the batch
validation up slightly into eb_lookup_vmas(), and put the actual
command parsing in a separate function that can be called from both
the fast path and the slow path of execbuf relocation.

Signed-off-by: Maarten Lankhorst <maarten.lankhorst@linux.intel.com>
Reviewed-by: Thomas Hellström <thomas.hellstrom@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20200819140904.1708856-8-maarten.lankhorst@linux.intel.com
Signed-off-by: Joonas Lahtinen <joonas.lahtinen@linux.intel.com>
  • Loading branch information
Maarten Lankhorst authored and Joonas Lahtinen committed Sep 7, 2020
1 parent 1af343c commit 8e4ba49
Showing 1 changed file with 37 additions and 31 deletions.
68 changes: 37 additions & 31 deletions drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
Original file line number Diff line number Diff line change
Expand Up @@ -296,6 +296,8 @@ struct i915_execbuffer {
unsigned long num_fences;
};

static int eb_parse(struct i915_execbuffer *eb);

static inline bool eb_use_cmdparser(const struct i915_execbuffer *eb)
{
return intel_engine_requires_cmd_parser(eb->engine) ||
Expand Down Expand Up @@ -843,6 +845,7 @@ static struct i915_vma *eb_lookup_vma(struct i915_execbuffer *eb, u32 handle)

static int eb_lookup_vmas(struct i915_execbuffer *eb)
{
struct drm_i915_private *i915 = eb->i915;
unsigned int batch = eb_batch_index(eb);
unsigned int i;
int err = 0;
Expand All @@ -856,18 +859,37 @@ static int eb_lookup_vmas(struct i915_execbuffer *eb)
vma = eb_lookup_vma(eb, eb->exec[i].handle);
if (IS_ERR(vma)) {
err = PTR_ERR(vma);
break;
goto err;
}

err = eb_validate_vma(eb, &eb->exec[i], vma);
if (unlikely(err)) {
i915_vma_put(vma);
break;
goto err;
}

eb_add_vma(eb, i, batch, vma);
}

if (unlikely(eb->batch->flags & EXEC_OBJECT_WRITE)) {
drm_dbg(&i915->drm,
"Attempting to use self-modifying batch buffer\n");
return -EINVAL;
}

if (range_overflows_t(u64,
eb->batch_start_offset, eb->batch_len,
eb->batch->vma->size)) {
drm_dbg(&i915->drm, "Attempting to use out-of-bounds batch\n");
return -EINVAL;
}

if (eb->batch_len == 0)
eb->batch_len = eb->batch->vma->size - eb->batch_start_offset;

return 0;

err:
eb->vma[i].vma = NULL;
return err;
}
Expand Down Expand Up @@ -1802,7 +1824,7 @@ static int eb_prefault_relocations(const struct i915_execbuffer *eb)
return 0;
}

static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
static noinline int eb_relocate_parse_slow(struct i915_execbuffer *eb)
{
bool have_copy = false;
struct eb_vma *ev;
Expand Down Expand Up @@ -1867,6 +1889,11 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
if (err)
goto err;

/* as last step, parse the command buffer */
err = eb_parse(eb);
if (err)
goto err;

/*
* Leave the user relocations as are, this is the painfully slow path,
* and we want to avoid the complication of dropping the lock whilst
Expand Down Expand Up @@ -1899,7 +1926,7 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
return err;
}

static int eb_relocate(struct i915_execbuffer *eb)
static int eb_relocate_parse(struct i915_execbuffer *eb)
{
int err;

Expand All @@ -1924,10 +1951,10 @@ static int eb_relocate(struct i915_execbuffer *eb)
}

if (err)
return eb_relocate_slow(eb);
return eb_relocate_parse_slow(eb);
}

return 0;
return eb_parse(eb);
}

static int eb_move_to_gpu(struct i915_execbuffer *eb)
Expand Down Expand Up @@ -3045,7 +3072,7 @@ i915_gem_do_execbuffer(struct drm_device *dev,
if (unlikely(err))
goto err_context;

err = eb_relocate(&eb);
err = eb_relocate_parse(&eb);
if (err) {
/*
* If the user expects the execobject.offset and
Expand All @@ -3058,33 +3085,10 @@ i915_gem_do_execbuffer(struct drm_device *dev,
goto err_vma;
}

if (unlikely(eb.batch->flags & EXEC_OBJECT_WRITE)) {
drm_dbg(&i915->drm,
"Attempting to use self-modifying batch buffer\n");
err = -EINVAL;
goto err_vma;
}

if (range_overflows_t(u64,
eb.batch_start_offset, eb.batch_len,
eb.batch->vma->size)) {
drm_dbg(&i915->drm, "Attempting to use out-of-bounds batch\n");
err = -EINVAL;
goto err_vma;
}

if (eb.batch_len == 0)
eb.batch_len = eb.batch->vma->size - eb.batch_start_offset;

err = eb_parse(&eb);
if (err)
goto err_vma;

/*
* snb/ivb/vlv conflate the "batch in ppgtt" bit with the "non-secure
* batch" bit. Hence we need to pin secure batches into the global gtt.
* hsw should have this fixed, but bdw mucks it up again. */
batch = eb.batch->vma;
if (eb.batch_flags & I915_DISPATCH_SECURE) {
struct i915_vma *vma;

Expand All @@ -3098,13 +3102,15 @@ i915_gem_do_execbuffer(struct drm_device *dev,
* fitting due to fragmentation.
* So this is actually safe.
*/
vma = i915_gem_object_ggtt_pin(batch->obj, NULL, 0, 0, 0);
vma = i915_gem_object_ggtt_pin(eb.batch->vma->obj, NULL, 0, 0, 0);
if (IS_ERR(vma)) {
err = PTR_ERR(vma);
goto err_parse;
}

batch = vma;
} else {
batch = eb.batch->vma;
}

/* All GPU relocation batches must be submitted prior to the user rq */
Expand Down

0 comments on commit 8e4ba49

Please sign in to comment.