Commit 27173f1f authored by Ben Widawsky's avatar Ben Widawsky Committed by Daniel Vetter

drm/i915: Convert execbuf code to use vmas

In order to transition more of our code over to using a VMA instead of
an <OBJ, VM> pair - we must have the vma accessible at execbuf time. Up
until now, we've only had a VMA when actually binding an object.

The previous patch helped handle the distinction on bound vs. unbound.
This patch will help us catch leaks, and other issues before we actually
shuffle a bunch of stuff around.

This attempts to convert all the execbuf code to speak in vmas. Since
the execbuf code is very self contained it was a nice isolated
conversion.

The meat of the code is about turning eb_objects into eb_vma, and then
wiring up the rest of the code to use vmas instead of obj, vm pairs.

Unfortunately, to do this, we must move the exec_list link from the obj
structure. This list is reused in the eviction code, so we must also
modify the eviction code to make this work.

WARNING: This patch makes an already hotly profiled path slower. The cost is
unavoidable. In reply to this mail, I will attach the extra data.

v2: Release table lock early, and two a 2 phase vma lookup to avoid
having to use a GFP_ATOMIC. (Chris)

v3: s/obj_exec_list/obj_exec_link/
Updates to address
commit 6d2b8885
Author: Chris Wilson <chris@chris-wilson.co.uk>
Date:   Wed Aug 7 18:30:54 2013 +0100

    drm/i915: List objects allocated from stolen memory in debugfs

v4: Use obj = vma->obj for neatness in some places (Chris)
need_reloc_mappable() should return false if ppgtt (Chris)
Signed-off-by: default avatarBen Widawsky <ben@bwidawsk.net>
[danvet: Split out prep patches. Also remove a FIXME comment which is
now taken care of.]
Signed-off-by: default avatarDaniel Vetter <daniel.vetter@ffwll.ch>
parent a2dc53e7
...@@ -568,6 +568,13 @@ struct i915_vma { ...@@ -568,6 +568,13 @@ struct i915_vma {
/** This vma's place in the batchbuffer or on the eviction list */ /** This vma's place in the batchbuffer or on the eviction list */
struct list_head exec_list; struct list_head exec_list;
/**
* Used for performing relocations during execbuffer insertion.
*/
struct hlist_node exec_node;
unsigned long exec_handle;
struct drm_i915_gem_exec_object2 *exec_entry;
}; };
struct i915_ctx_hang_stats { struct i915_ctx_hang_stats {
...@@ -1398,8 +1405,6 @@ struct drm_i915_gem_object { ...@@ -1398,8 +1405,6 @@ struct drm_i915_gem_object {
struct list_head ring_list; struct list_head ring_list;
/** Used in execbuf to temporarily hold a ref */ /** Used in execbuf to temporarily hold a ref */
struct list_head obj_exec_link; struct list_head obj_exec_link;
/** This object's place in the batchbuffer or on the eviction list */
struct list_head exec_list;
/** /**
* This is set if the object is on the active lists (has pending * This is set if the object is on the active lists (has pending
...@@ -1485,13 +1490,6 @@ struct drm_i915_gem_object { ...@@ -1485,13 +1490,6 @@ struct drm_i915_gem_object {
void *dma_buf_vmapping; void *dma_buf_vmapping;
int vmapping_count; int vmapping_count;
/**
* Used for performing relocations during execbuffer insertion.
*/
struct hlist_node exec_node;
unsigned long exec_handle;
struct drm_i915_gem_exec_object2 *exec_entry;
struct intel_ring_buffer *ring; struct intel_ring_buffer *ring;
/** Breadcrumb of last rendering to the buffer. */ /** Breadcrumb of last rendering to the buffer. */
......
...@@ -3978,7 +3978,6 @@ void i915_gem_object_init(struct drm_i915_gem_object *obj, ...@@ -3978,7 +3978,6 @@ void i915_gem_object_init(struct drm_i915_gem_object *obj,
{ {
INIT_LIST_HEAD(&obj->global_list); INIT_LIST_HEAD(&obj->global_list);
INIT_LIST_HEAD(&obj->ring_list); INIT_LIST_HEAD(&obj->ring_list);
INIT_LIST_HEAD(&obj->exec_list);
INIT_LIST_HEAD(&obj->obj_exec_link); INIT_LIST_HEAD(&obj->obj_exec_link);
INIT_LIST_HEAD(&obj->vma_list); INIT_LIST_HEAD(&obj->vma_list);
......
...@@ -33,24 +33,24 @@ ...@@ -33,24 +33,24 @@
#include "intel_drv.h" #include "intel_drv.h"
#include <linux/dma_remapping.h> #include <linux/dma_remapping.h>
struct eb_objects { struct eb_vmas {
struct list_head objects; struct list_head vmas;
int and; int and;
union { union {
struct drm_i915_gem_object *lut[0]; struct i915_vma *lut[0];
struct hlist_head buckets[0]; struct hlist_head buckets[0];
}; };
}; };
static struct eb_objects * static struct eb_vmas *
eb_create(struct drm_i915_gem_execbuffer2 *args) eb_create(struct drm_i915_gem_execbuffer2 *args, struct i915_address_space *vm)
{ {
struct eb_objects *eb = NULL; struct eb_vmas *eb = NULL;
if (args->flags & I915_EXEC_HANDLE_LUT) { if (args->flags & I915_EXEC_HANDLE_LUT) {
int size = args->buffer_count; int size = args->buffer_count;
size *= sizeof(struct drm_i915_gem_object *); size *= sizeof(struct i915_vma *);
size += sizeof(struct eb_objects); size += sizeof(struct eb_vmas);
eb = kmalloc(size, GFP_TEMPORARY | __GFP_NOWARN | __GFP_NORETRY); eb = kmalloc(size, GFP_TEMPORARY | __GFP_NOWARN | __GFP_NORETRY);
} }
...@@ -61,7 +61,7 @@ eb_create(struct drm_i915_gem_execbuffer2 *args) ...@@ -61,7 +61,7 @@ eb_create(struct drm_i915_gem_execbuffer2 *args)
while (count > 2*size) while (count > 2*size)
count >>= 1; count >>= 1;
eb = kzalloc(count*sizeof(struct hlist_head) + eb = kzalloc(count*sizeof(struct hlist_head) +
sizeof(struct eb_objects), sizeof(struct eb_vmas),
GFP_TEMPORARY); GFP_TEMPORARY);
if (eb == NULL) if (eb == NULL)
return eb; return eb;
...@@ -70,64 +70,97 @@ eb_create(struct drm_i915_gem_execbuffer2 *args) ...@@ -70,64 +70,97 @@ eb_create(struct drm_i915_gem_execbuffer2 *args)
} else } else
eb->and = -args->buffer_count; eb->and = -args->buffer_count;
INIT_LIST_HEAD(&eb->objects); INIT_LIST_HEAD(&eb->vmas);
return eb; return eb;
} }
static void static void
eb_reset(struct eb_objects *eb) eb_reset(struct eb_vmas *eb)
{ {
if (eb->and >= 0) if (eb->and >= 0)
memset(eb->buckets, 0, (eb->and+1)*sizeof(struct hlist_head)); memset(eb->buckets, 0, (eb->and+1)*sizeof(struct hlist_head));
} }
static int static int
eb_lookup_objects(struct eb_objects *eb, eb_lookup_vmas(struct eb_vmas *eb,
struct drm_i915_gem_exec_object2 *exec, struct drm_i915_gem_exec_object2 *exec,
const struct drm_i915_gem_execbuffer2 *args, const struct drm_i915_gem_execbuffer2 *args,
struct i915_address_space *vm,
struct drm_file *file) struct drm_file *file)
{ {
int i; struct drm_i915_gem_object *obj;
struct list_head objects;
int i, ret = 0;
INIT_LIST_HEAD(&objects);
spin_lock(&file->table_lock); spin_lock(&file->table_lock);
/* Grab a reference to the object and release the lock so we can lookup
* or create the VMA without using GFP_ATOMIC */
for (i = 0; i < args->buffer_count; i++) { for (i = 0; i < args->buffer_count; i++) {
struct drm_i915_gem_object *obj;
obj = to_intel_bo(idr_find(&file->object_idr, exec[i].handle)); obj = to_intel_bo(idr_find(&file->object_idr, exec[i].handle));
if (obj == NULL) { if (obj == NULL) {
spin_unlock(&file->table_lock); spin_unlock(&file->table_lock);
DRM_DEBUG("Invalid object handle %d at index %d\n", DRM_DEBUG("Invalid object handle %d at index %d\n",
exec[i].handle, i); exec[i].handle, i);
return -ENOENT; ret = -ENOENT;
goto out;
} }
if (!list_empty(&obj->exec_list)) { if (!list_empty(&obj->obj_exec_link)) {
spin_unlock(&file->table_lock); spin_unlock(&file->table_lock);
DRM_DEBUG("Object %p [handle %d, index %d] appears more than once in object list\n", DRM_DEBUG("Object %p [handle %d, index %d] appears more than once in object list\n",
obj, exec[i].handle, i); obj, exec[i].handle, i);
return -EINVAL; ret = -EINVAL;
goto out;
} }
drm_gem_object_reference(&obj->base); drm_gem_object_reference(&obj->base);
list_add_tail(&obj->exec_list, &eb->objects); list_add_tail(&obj->obj_exec_link, &objects);
}
spin_unlock(&file->table_lock);
i = 0;
list_for_each_entry(obj, &objects, obj_exec_link) {
struct i915_vma *vma;
obj->exec_entry = &exec[i]; vma = i915_gem_obj_lookup_or_create_vma(obj, vm);
if (IS_ERR(vma)) {
/* XXX: We don't need an error path fro vma because if
* the vma was created just for this execbuf, object
* unreference should kill it off.*/
DRM_DEBUG("Failed to lookup VMA\n");
ret = PTR_ERR(vma);
goto out;
}
list_add_tail(&vma->exec_list, &eb->vmas);
vma->exec_entry = &exec[i];
if (eb->and < 0) { if (eb->and < 0) {
eb->lut[i] = obj; eb->lut[i] = vma;
} else { } else {
uint32_t handle = args->flags & I915_EXEC_HANDLE_LUT ? i : exec[i].handle; uint32_t handle = args->flags & I915_EXEC_HANDLE_LUT ? i : exec[i].handle;
obj->exec_handle = handle; vma->exec_handle = handle;
hlist_add_head(&obj->exec_node, hlist_add_head(&vma->exec_node,
&eb->buckets[handle & eb->and]); &eb->buckets[handle & eb->and]);
} }
++i;
} }
spin_unlock(&file->table_lock);
return 0;
out:
while (!list_empty(&objects)) {
obj = list_first_entry(&objects,
struct drm_i915_gem_object,
obj_exec_link);
list_del_init(&obj->obj_exec_link);
if (ret)
drm_gem_object_unreference(&obj->base);
}
return ret;
} }
static struct drm_i915_gem_object * static struct i915_vma *eb_get_vma(struct eb_vmas *eb, unsigned long handle)
eb_get_object(struct eb_objects *eb, unsigned long handle)
{ {
if (eb->and < 0) { if (eb->and < 0) {
if (handle >= -eb->and) if (handle >= -eb->and)
...@@ -139,27 +172,25 @@ eb_get_object(struct eb_objects *eb, unsigned long handle) ...@@ -139,27 +172,25 @@ eb_get_object(struct eb_objects *eb, unsigned long handle)
head = &eb->buckets[handle & eb->and]; head = &eb->buckets[handle & eb->and];
hlist_for_each(node, head) { hlist_for_each(node, head) {
struct drm_i915_gem_object *obj; struct i915_vma *vma;
obj = hlist_entry(node, struct drm_i915_gem_object, exec_node); vma = hlist_entry(node, struct i915_vma, exec_node);
if (obj->exec_handle == handle) if (vma->exec_handle == handle)
return obj; return vma;
} }
return NULL; return NULL;
} }
} }
static void static void eb_destroy(struct eb_vmas *eb) {
eb_destroy(struct eb_objects *eb) while (!list_empty(&eb->vmas)) {
{ struct i915_vma *vma;
while (!list_empty(&eb->objects)) {
struct drm_i915_gem_object *obj;
obj = list_first_entry(&eb->objects, vma = list_first_entry(&eb->vmas,
struct drm_i915_gem_object, struct i915_vma,
exec_list); exec_list);
list_del_init(&obj->exec_list); list_del_init(&vma->exec_list);
drm_gem_object_unreference(&obj->base); drm_gem_object_unreference(&vma->obj->base);
} }
kfree(eb); kfree(eb);
} }
...@@ -223,22 +254,24 @@ relocate_entry_gtt(struct drm_i915_gem_object *obj, ...@@ -223,22 +254,24 @@ relocate_entry_gtt(struct drm_i915_gem_object *obj,
static int static int
i915_gem_execbuffer_relocate_entry(struct drm_i915_gem_object *obj, i915_gem_execbuffer_relocate_entry(struct drm_i915_gem_object *obj,
struct eb_objects *eb, struct eb_vmas *eb,
struct drm_i915_gem_relocation_entry *reloc, struct drm_i915_gem_relocation_entry *reloc,
struct i915_address_space *vm) struct i915_address_space *vm)
{ {
struct drm_device *dev = obj->base.dev; struct drm_device *dev = obj->base.dev;
struct drm_gem_object *target_obj; struct drm_gem_object *target_obj;
struct drm_i915_gem_object *target_i915_obj; struct drm_i915_gem_object *target_i915_obj;
struct i915_vma *target_vma;
uint32_t target_offset; uint32_t target_offset;
int ret = -EINVAL; int ret = -EINVAL;
/* we've already hold a reference to all valid objects */ /* we've already hold a reference to all valid objects */
target_obj = &eb_get_object(eb, reloc->target_handle)->base; target_vma = eb_get_vma(eb, reloc->target_handle);
if (unlikely(target_obj == NULL)) if (unlikely(target_vma == NULL))
return -ENOENT; return -ENOENT;
target_i915_obj = target_vma->obj;
target_obj = &target_vma->obj->base;
target_i915_obj = to_intel_bo(target_obj);
target_offset = i915_gem_obj_ggtt_offset(target_i915_obj); target_offset = i915_gem_obj_ggtt_offset(target_i915_obj);
/* Sandybridge PPGTT errata: We need a global gtt mapping for MI and /* Sandybridge PPGTT errata: We need a global gtt mapping for MI and
...@@ -320,14 +353,13 @@ i915_gem_execbuffer_relocate_entry(struct drm_i915_gem_object *obj, ...@@ -320,14 +353,13 @@ i915_gem_execbuffer_relocate_entry(struct drm_i915_gem_object *obj,
} }
static int static int
i915_gem_execbuffer_relocate_object(struct drm_i915_gem_object *obj, i915_gem_execbuffer_relocate_vma(struct i915_vma *vma,
struct eb_objects *eb, struct eb_vmas *eb)
struct i915_address_space *vm)
{ {
#define N_RELOC(x) ((x) / sizeof(struct drm_i915_gem_relocation_entry)) #define N_RELOC(x) ((x) / sizeof(struct drm_i915_gem_relocation_entry))
struct drm_i915_gem_relocation_entry stack_reloc[N_RELOC(512)]; struct drm_i915_gem_relocation_entry stack_reloc[N_RELOC(512)];
struct drm_i915_gem_relocation_entry __user *user_relocs; struct drm_i915_gem_relocation_entry __user *user_relocs;
struct drm_i915_gem_exec_object2 *entry = obj->exec_entry; struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
int remain, ret; int remain, ret;
user_relocs = to_user_ptr(entry->relocs_ptr); user_relocs = to_user_ptr(entry->relocs_ptr);
...@@ -346,8 +378,8 @@ i915_gem_execbuffer_relocate_object(struct drm_i915_gem_object *obj, ...@@ -346,8 +378,8 @@ i915_gem_execbuffer_relocate_object(struct drm_i915_gem_object *obj,
do { do {
u64 offset = r->presumed_offset; u64 offset = r->presumed_offset;
ret = i915_gem_execbuffer_relocate_entry(obj, eb, r, ret = i915_gem_execbuffer_relocate_entry(vma->obj, eb, r,
vm); vma->vm);
if (ret) if (ret)
return ret; return ret;
...@@ -368,17 +400,16 @@ i915_gem_execbuffer_relocate_object(struct drm_i915_gem_object *obj, ...@@ -368,17 +400,16 @@ i915_gem_execbuffer_relocate_object(struct drm_i915_gem_object *obj,
} }
static int static int
i915_gem_execbuffer_relocate_object_slow(struct drm_i915_gem_object *obj, i915_gem_execbuffer_relocate_vma_slow(struct i915_vma *vma,
struct eb_objects *eb, struct eb_vmas *eb,
struct drm_i915_gem_relocation_entry *relocs, struct drm_i915_gem_relocation_entry *relocs)
struct i915_address_space *vm)
{ {
const struct drm_i915_gem_exec_object2 *entry = obj->exec_entry; const struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
int i, ret; int i, ret;
for (i = 0; i < entry->relocation_count; i++) { for (i = 0; i < entry->relocation_count; i++) {
ret = i915_gem_execbuffer_relocate_entry(obj, eb, &relocs[i], ret = i915_gem_execbuffer_relocate_entry(vma->obj, eb, &relocs[i],
vm); vma->vm);
if (ret) if (ret)
return ret; return ret;
} }
...@@ -387,10 +418,10 @@ i915_gem_execbuffer_relocate_object_slow(struct drm_i915_gem_object *obj, ...@@ -387,10 +418,10 @@ i915_gem_execbuffer_relocate_object_slow(struct drm_i915_gem_object *obj,
} }
static int static int
i915_gem_execbuffer_relocate(struct eb_objects *eb, i915_gem_execbuffer_relocate(struct eb_vmas *eb,
struct i915_address_space *vm) struct i915_address_space *vm)
{ {
struct drm_i915_gem_object *obj; struct i915_vma *vma;
int ret = 0; int ret = 0;
/* This is the fast path and we cannot handle a pagefault whilst /* This is the fast path and we cannot handle a pagefault whilst
...@@ -401,8 +432,8 @@ i915_gem_execbuffer_relocate(struct eb_objects *eb, ...@@ -401,8 +432,8 @@ i915_gem_execbuffer_relocate(struct eb_objects *eb,
* lockdep complains vehemently. * lockdep complains vehemently.
*/ */
pagefault_disable(); pagefault_disable();
list_for_each_entry(obj, &eb->objects, exec_list) { list_for_each_entry(vma, &eb->vmas, exec_list) {
ret = i915_gem_execbuffer_relocate_object(obj, eb, vm); ret = i915_gem_execbuffer_relocate_vma(vma, eb);
if (ret) if (ret)
break; break;
} }
...@@ -415,31 +446,32 @@ i915_gem_execbuffer_relocate(struct eb_objects *eb, ...@@ -415,31 +446,32 @@ i915_gem_execbuffer_relocate(struct eb_objects *eb,
#define __EXEC_OBJECT_HAS_FENCE (1<<30) #define __EXEC_OBJECT_HAS_FENCE (1<<30)
static int static int
need_reloc_mappable(struct drm_i915_gem_object *obj) need_reloc_mappable(struct i915_vma *vma)
{ {
struct drm_i915_gem_exec_object2 *entry = obj->exec_entry; struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
return entry->relocation_count && !use_cpu_reloc(obj); return entry->relocation_count && !use_cpu_reloc(vma->obj) &&
i915_is_ggtt(vma->vm);
} }
static int static int
i915_gem_execbuffer_reserve_object(struct drm_i915_gem_object *obj, i915_gem_execbuffer_reserve_vma(struct i915_vma *vma,
struct intel_ring_buffer *ring, struct intel_ring_buffer *ring,
struct i915_address_space *vm,
bool *need_reloc) bool *need_reloc)
{ {
struct drm_i915_private *dev_priv = obj->base.dev->dev_private; struct drm_i915_private *dev_priv = ring->dev->dev_private;
struct drm_i915_gem_exec_object2 *entry = obj->exec_entry; struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4; bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4;
bool need_fence, need_mappable; bool need_fence, need_mappable;
struct drm_i915_gem_object *obj = vma->obj;
int ret; int ret;
need_fence = need_fence =
has_fenced_gpu_access && has_fenced_gpu_access &&
entry->flags & EXEC_OBJECT_NEEDS_FENCE && entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
obj->tiling_mode != I915_TILING_NONE; obj->tiling_mode != I915_TILING_NONE;
need_mappable = need_fence || need_reloc_mappable(obj); need_mappable = need_fence || need_reloc_mappable(vma);
ret = i915_gem_object_pin(obj, vm, entry->alignment, need_mappable, ret = i915_gem_object_pin(obj, vma->vm, entry->alignment, need_mappable,
false); false);
if (ret) if (ret)
return ret; return ret;
...@@ -467,8 +499,8 @@ i915_gem_execbuffer_reserve_object(struct drm_i915_gem_object *obj, ...@@ -467,8 +499,8 @@ i915_gem_execbuffer_reserve_object(struct drm_i915_gem_object *obj,
obj->has_aliasing_ppgtt_mapping = 1; obj->has_aliasing_ppgtt_mapping = 1;
} }
if (entry->offset != i915_gem_obj_offset(obj, vm)) { if (entry->offset != vma->node.start) {
entry->offset = i915_gem_obj_offset(obj, vm); entry->offset = vma->node.start;
*need_reloc = true; *need_reloc = true;
} }
...@@ -485,14 +517,15 @@ i915_gem_execbuffer_reserve_object(struct drm_i915_gem_object *obj, ...@@ -485,14 +517,15 @@ i915_gem_execbuffer_reserve_object(struct drm_i915_gem_object *obj,
} }
static void static void
i915_gem_execbuffer_unreserve_object(struct drm_i915_gem_object *obj) i915_gem_execbuffer_unreserve_vma(struct i915_vma *vma)
{ {
struct drm_i915_gem_exec_object2 *entry; struct drm_i915_gem_exec_object2 *entry;
struct drm_i915_gem_object *obj = vma->obj;
if (!i915_gem_obj_bound_any(obj)) if (!drm_mm_node_allocated(&vma->node))
return; return;
entry = obj->exec_entry; entry = vma->exec_entry;
if (entry->flags & __EXEC_OBJECT_HAS_FENCE) if (entry->flags & __EXEC_OBJECT_HAS_FENCE)
i915_gem_object_unpin_fence(obj); i915_gem_object_unpin_fence(obj);
...@@ -505,41 +538,40 @@ i915_gem_execbuffer_unreserve_object(struct drm_i915_gem_object *obj) ...@@ -505,41 +538,40 @@ i915_gem_execbuffer_unreserve_object(struct drm_i915_gem_object *obj)
static int static int
i915_gem_execbuffer_reserve(struct intel_ring_buffer *ring, i915_gem_execbuffer_reserve(struct intel_ring_buffer *ring,
struct list_head *objects, struct list_head *vmas,
struct i915_address_space *vm,
bool *need_relocs) bool *need_relocs)
{ {
struct drm_i915_gem_object *obj; struct drm_i915_gem_object *obj;
struct list_head ordered_objects; struct i915_vma *vma;
struct list_head ordered_vmas;
bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4; bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4;
int retry; int retry;
INIT_LIST_HEAD(&ordered_objects); INIT_LIST_HEAD(&ordered_vmas);
while (!list_empty(objects)) { while (!list_empty(vmas)) {
struct drm_i915_gem_exec_object2 *entry; struct drm_i915_gem_exec_object2 *entry;
bool need_fence, need_mappable; bool need_fence, need_mappable;
obj = list_first_entry(objects, vma = list_first_entry(vmas, struct i915_vma, exec_list);
struct drm_i915_gem_object, obj = vma->obj;
exec_list); entry = vma->exec_entry;
entry = obj->exec_entry;
need_fence = need_fence =
has_fenced_gpu_access && has_fenced_gpu_access &&
entry->flags & EXEC_OBJECT_NEEDS_FENCE && entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
obj->tiling_mode != I915_TILING_NONE; obj->tiling_mode != I915_TILING_NONE;
need_mappable = need_fence || need_reloc_mappable(obj); need_mappable = need_fence || need_reloc_mappable(vma);
if (need_mappable) if (need_mappable)
list_move(&obj->exec_list, &ordered_objects); list_move(&vma->exec_list, &ordered_vmas);
else else
list_move_tail(&obj->exec_list, &ordered_objects); list_move_tail(&vma->exec_list, &ordered_vmas);
obj->base.pending_read_domains = I915_GEM_GPU_DOMAINS & ~I915_GEM_DOMAIN_COMMAND; obj->base.pending_read_domains = I915_GEM_GPU_DOMAINS & ~I915_GEM_DOMAIN_COMMAND;
obj->base.pending_write_domain = 0; obj->base.pending_write_domain = 0;
obj->pending_fenced_gpu_access = false; obj->pending_fenced_gpu_access = false;
} }
list_splice(&ordered_objects, objects); list_splice(&ordered_vmas, vmas);
/* Attempt to pin all of the buffers into the GTT. /* Attempt to pin all of the buffers into the GTT.
* This is done in 3 phases: * This is done in 3 phases:
...@@ -558,47 +590,47 @@ i915_gem_execbuffer_reserve(struct intel_ring_buffer *ring, ...@@ -558,47 +590,47 @@ i915_gem_execbuffer_reserve(struct intel_ring_buffer *ring,
int ret = 0; int ret = 0;
/* Unbind any ill-fitting objects or pin. */ /* Unbind any ill-fitting objects or pin. */
list_for_each_entry(obj, objects, exec_list) { list_for_each_entry(vma, vmas, exec_list) {
struct drm_i915_gem_exec_object2 *entry = obj->exec_entry; struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
bool need_fence, need_mappable; bool need_fence, need_mappable;
u32 obj_offset;
if (!i915_gem_obj_bound(obj, vm)) obj = vma->obj;
if (!drm_mm_node_allocated(&vma->node))
continue; continue;
obj_offset = i915_gem_obj_offset(obj, vm);
need_fence = need_fence =
has_fenced_gpu_access && has_fenced_gpu_access &&
entry->flags & EXEC_OBJECT_NEEDS_FENCE && entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
obj->tiling_mode != I915_TILING_NONE; obj->tiling_mode != I915_TILING_NONE;
need_mappable = need_fence || need_reloc_mappable(obj); need_mappable = need_fence || need_reloc_mappable(vma);
WARN_ON((need_mappable || need_fence) && WARN_ON((need_mappable || need_fence) &&
!i915_is_ggtt(vm)); !i915_is_ggtt(vma->vm));
if ((entry->alignment && if ((entry->alignment &&
obj_offset & (entry->alignment - 1)) || vma->node.start & (entry->alignment - 1)) ||
(need_mappable && !obj->map_and_fenceable)) (need_mappable && !obj->map_and_fenceable))
ret = i915_vma_unbind(i915_gem_obj_to_vma(obj, vm)); ret = i915_vma_unbind(vma);
else else
ret = i915_gem_execbuffer_reserve_object(obj, ring, vm, need_relocs); ret = i915_gem_execbuffer_reserve_vma(vma, ring, need_relocs);
if (ret) if (ret)
goto err; goto err;
} }
/* Bind fresh objects */ /* Bind fresh objects */
list_for_each_entry(obj, objects, exec_list) { list_for_each_entry(vma, vmas, exec_list) {
if (i915_gem_obj_bound(obj, vm)) if (drm_mm_node_allocated(&vma->node))
continue; continue;
ret = i915_gem_execbuffer_reserve_object(obj, ring, vm, need_relocs); ret = i915_gem_execbuffer_reserve_vma(vma, ring, need_relocs);
if (ret) if (ret)
goto err; goto err;
} }
err: /* Decrement pin count for bound objects */ err: /* Decrement pin count for bound objects */
list_for_each_entry(obj, objects, exec_list) list_for_each_entry(vma, vmas, exec_list)
i915_gem_execbuffer_unreserve_object(obj); i915_gem_execbuffer_unreserve_vma(vma);
if (ret != -ENOSPC || retry++) if (ret != -ENOSPC || retry++)
return ret; return ret;
...@@ -614,24 +646,27 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev, ...@@ -614,24 +646,27 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev,
struct drm_i915_gem_execbuffer2 *args, struct drm_i915_gem_execbuffer2 *args,
struct drm_file *file, struct drm_file *file,
struct intel_ring_buffer *ring, struct intel_ring_buffer *ring,
struct eb_objects *eb, struct eb_vmas *eb,
struct drm_i915_gem_exec_object2 *exec, struct drm_i915_gem_exec_object2 *exec)
struct i915_address_space *vm)
{ {
struct drm_i915_gem_relocation_entry *reloc; struct drm_i915_gem_relocation_entry *reloc;
struct drm_i915_gem_object *obj; struct i915_address_space *vm;
struct i915_vma *vma;
bool need_relocs; bool need_relocs;
int *reloc_offset; int *reloc_offset;
int i, total, ret; int i, total, ret;
int count = args->buffer_count; int count = args->buffer_count;
if (WARN_ON(list_empty(&eb->vmas)))
return 0;
vm = list_first_entry(&eb->vmas, struct i915_vma, exec_list)->vm;
/* We may process another execbuffer during the unlock... */ /* We may process another execbuffer during the unlock... */
while (!list_empty(&eb->objects)) { while (!list_empty(&eb->vmas)) {
obj = list_first_entry(&eb->objects, vma = list_first_entry(&eb->vmas, struct i915_vma, exec_list);
struct drm_i915_gem_object, list_del_init(&vma->exec_list);
exec_list); drm_gem_object_unreference(&vma->obj->base);
list_del_init(&obj->exec_list);
drm_gem_object_unreference(&obj->base);
} }
mutex_unlock(&dev->struct_mutex); mutex_unlock(&dev->struct_mutex);
...@@ -695,20 +730,19 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev, ...@@ -695,20 +730,19 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev,
/* reacquire the objects */ /* reacquire the objects */
eb_reset(eb); eb_reset(eb);
ret = eb_lookup_objects(eb, exec, args, file); ret = eb_lookup_vmas(eb, exec, args, vm, file);
if (ret) if (ret)
goto err; goto err;
need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0; need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0;
ret = i915_gem_execbuffer_reserve(ring, &eb->objects, vm, &need_relocs); ret = i915_gem_execbuffer_reserve(ring, &eb->vmas, &need_relocs);
if (ret) if (ret)
goto err; goto err;
list_for_each_entry(obj, &eb->objects, exec_list) { list_for_each_entry(vma, &eb->vmas, exec_list) {
int offset = obj->exec_entry - exec; int offset = vma->exec_entry - exec;
ret = i915_gem_execbuffer_relocate_object_slow(obj, eb, ret = i915_gem_execbuffer_relocate_vma_slow(vma, eb,
reloc + reloc_offset[offset], reloc + reloc_offset[offset]);
vm);
if (ret) if (ret)
goto err; goto err;
} }
...@@ -727,14 +761,15 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev, ...@@ -727,14 +761,15 @@ i915_gem_execbuffer_relocate_slow(struct drm_device *dev,
static int static int
i915_gem_execbuffer_move_to_gpu(struct intel_ring_buffer *ring, i915_gem_execbuffer_move_to_gpu(struct intel_ring_buffer *ring,
struct list_head *objects) struct list_head *vmas)
{ {
struct drm_i915_gem_object *obj; struct i915_vma *vma;
uint32_t flush_domains = 0; uint32_t flush_domains = 0;
bool flush_chipset = false; bool flush_chipset = false;
int ret; int ret;
list_for_each_entry(obj, objects, exec_list) { list_for_each_entry(vma, vmas, exec_list) {
struct drm_i915_gem_object *obj = vma->obj;
ret = i915_gem_object_sync(obj, ring); ret = i915_gem_object_sync(obj, ring);
if (ret) if (ret)
return ret; return ret;
...@@ -809,13 +844,13 @@ validate_exec_list(struct drm_i915_gem_exec_object2 *exec, ...@@ -809,13 +844,13 @@ validate_exec_list(struct drm_i915_gem_exec_object2 *exec,
} }
static void static void
i915_gem_execbuffer_move_to_active(struct list_head *objects, i915_gem_execbuffer_move_to_active(struct list_head *vmas,
struct i915_address_space *vm,
struct intel_ring_buffer *ring) struct intel_ring_buffer *ring)
{ {
struct drm_i915_gem_object *obj; struct i915_vma *vma;
list_for_each_entry(obj, objects, exec_list) { list_for_each_entry(vma, vmas, exec_list) {
struct drm_i915_gem_object *obj = vma->obj;
u32 old_read = obj->base.read_domains; u32 old_read = obj->base.read_domains;
u32 old_write = obj->base.write_domain; u32 old_write = obj->base.write_domain;
...@@ -825,8 +860,7 @@ i915_gem_execbuffer_move_to_active(struct list_head *objects, ...@@ -825,8 +860,7 @@ i915_gem_execbuffer_move_to_active(struct list_head *objects,
obj->base.read_domains = obj->base.pending_read_domains; obj->base.read_domains = obj->base.pending_read_domains;
obj->fenced_gpu_access = obj->pending_fenced_gpu_access; obj->fenced_gpu_access = obj->pending_fenced_gpu_access;
/* FIXME: This lookup gets fixed later <-- danvet */ list_move_tail(&vma->mm_list, &vma->vm->active_list);
list_move_tail(&i915_gem_obj_to_vma(obj, vm)->mm_list, &vm->active_list);
i915_gem_object_move_to_active(obj, ring); i915_gem_object_move_to_active(obj, ring);
if (obj->base.write_domain) { if (obj->base.write_domain) {
obj->dirty = 1; obj->dirty = 1;
...@@ -885,7 +919,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -885,7 +919,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
struct i915_address_space *vm) struct i915_address_space *vm)
{ {
drm_i915_private_t *dev_priv = dev->dev_private; drm_i915_private_t *dev_priv = dev->dev_private;
struct eb_objects *eb; struct eb_vmas *eb;
struct drm_i915_gem_object *batch_obj; struct drm_i915_gem_object *batch_obj;
struct drm_clip_rect *cliprects = NULL; struct drm_clip_rect *cliprects = NULL;
struct intel_ring_buffer *ring; struct intel_ring_buffer *ring;
...@@ -1025,7 +1059,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -1025,7 +1059,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
goto pre_mutex_err; goto pre_mutex_err;
} }
eb = eb_create(args); eb = eb_create(args, vm);
if (eb == NULL) { if (eb == NULL) {
mutex_unlock(&dev->struct_mutex); mutex_unlock(&dev->struct_mutex);
ret = -ENOMEM; ret = -ENOMEM;
...@@ -1033,18 +1067,16 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -1033,18 +1067,16 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
} }
/* Look up object handles */ /* Look up object handles */
ret = eb_lookup_objects(eb, exec, args, file); ret = eb_lookup_vmas(eb, exec, args, vm, file);
if (ret) if (ret)
goto err; goto err;
/* take note of the batch buffer before we might reorder the lists */ /* take note of the batch buffer before we might reorder the lists */
batch_obj = list_entry(eb->objects.prev, batch_obj = list_entry(eb->vmas.prev, struct i915_vma, exec_list)->obj;
struct drm_i915_gem_object,
exec_list);
/* Move the objects en-masse into the GTT, evicting if necessary. */ /* Move the objects en-masse into the GTT, evicting if necessary. */
need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0; need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0;
ret = i915_gem_execbuffer_reserve(ring, &eb->objects, vm, &need_relocs); ret = i915_gem_execbuffer_reserve(ring, &eb->vmas, &need_relocs);
if (ret) if (ret)
goto err; goto err;
...@@ -1054,7 +1086,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -1054,7 +1086,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
if (ret) { if (ret) {
if (ret == -EFAULT) { if (ret == -EFAULT) {
ret = i915_gem_execbuffer_relocate_slow(dev, args, file, ring, ret = i915_gem_execbuffer_relocate_slow(dev, args, file, ring,
eb, exec, vm); eb, exec);
BUG_ON(!mutex_is_locked(&dev->struct_mutex)); BUG_ON(!mutex_is_locked(&dev->struct_mutex));
} }
if (ret) if (ret)
...@@ -1076,7 +1108,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -1076,7 +1108,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
if (flags & I915_DISPATCH_SECURE && !batch_obj->has_global_gtt_mapping) if (flags & I915_DISPATCH_SECURE && !batch_obj->has_global_gtt_mapping)
i915_gem_gtt_bind_object(batch_obj, batch_obj->cache_level); i915_gem_gtt_bind_object(batch_obj, batch_obj->cache_level);
ret = i915_gem_execbuffer_move_to_gpu(ring, &eb->objects); ret = i915_gem_execbuffer_move_to_gpu(ring, &eb->vmas);
if (ret) if (ret)
goto err; goto err;
...@@ -1131,7 +1163,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data, ...@@ -1131,7 +1163,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, void *data,
trace_i915_gem_ring_dispatch(ring, intel_ring_get_seqno(ring), flags); trace_i915_gem_ring_dispatch(ring, intel_ring_get_seqno(ring), flags);
i915_gem_execbuffer_move_to_active(&eb->objects, vm, ring); i915_gem_execbuffer_move_to_active(&eb->vmas, ring);
i915_gem_execbuffer_retire_commands(dev, file, ring, batch_obj); i915_gem_execbuffer_retire_commands(dev, file, ring, batch_obj);
err: err:
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment