forked from Minki/linux
drm/amdgpu: use a fence array for VMID management
Just wait for any fence to become available, instead of waiting for the last entry of the LRU.

Acked-by: Alex Deucher <alexander.deucher@amd.com>
Signed-off-by: Christian König <christian.koenig@amd.com>
Acked-by: Chunming Zhou <david1.zhou@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
This commit is contained in:
parent
8d76001e00
commit
1fbb2e9299
@ -597,10 +597,8 @@ int amdgpu_sync_resv(struct amdgpu_device *adev,
|
|||||||
struct amdgpu_sync *sync,
|
struct amdgpu_sync *sync,
|
||||||
struct reservation_object *resv,
|
struct reservation_object *resv,
|
||||||
void *owner);
|
void *owner);
|
||||||
bool amdgpu_sync_is_idle(struct amdgpu_sync *sync,
|
struct fence *amdgpu_sync_peek_fence(struct amdgpu_sync *sync,
|
||||||
struct amdgpu_ring *ring);
|
struct amdgpu_ring *ring);
|
||||||
int amdgpu_sync_cycle_fences(struct amdgpu_sync *dst, struct amdgpu_sync *src,
|
|
||||||
struct fence *fence);
|
|
||||||
struct fence *amdgpu_sync_get_fence(struct amdgpu_sync *sync);
|
struct fence *amdgpu_sync_get_fence(struct amdgpu_sync *sync);
|
||||||
void amdgpu_sync_free(struct amdgpu_sync *sync);
|
void amdgpu_sync_free(struct amdgpu_sync *sync);
|
||||||
int amdgpu_sync_init(void);
|
int amdgpu_sync_init(void);
|
||||||
@ -909,6 +907,10 @@ struct amdgpu_vm_manager {
|
|||||||
struct list_head ids_lru;
|
struct list_head ids_lru;
|
||||||
struct amdgpu_vm_id ids[AMDGPU_NUM_VM];
|
struct amdgpu_vm_id ids[AMDGPU_NUM_VM];
|
||||||
|
|
||||||
|
/* Handling of VM fences */
|
||||||
|
u64 fence_context;
|
||||||
|
unsigned seqno[AMDGPU_MAX_RINGS];
|
||||||
|
|
||||||
uint32_t max_pfn;
|
uint32_t max_pfn;
|
||||||
/* vram base address for page table entry */
|
/* vram base address for page table entry */
|
||||||
u64 vram_base_offset;
|
u64 vram_base_offset;
|
||||||
|
@ -166,7 +166,7 @@ static struct fence *amdgpu_job_run(struct amd_sched_job *sched_job)
|
|||||||
}
|
}
|
||||||
job = to_amdgpu_job(sched_job);
|
job = to_amdgpu_job(sched_job);
|
||||||
|
|
||||||
BUG_ON(!amdgpu_sync_is_idle(&job->sync, NULL));
|
BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL));
|
||||||
|
|
||||||
trace_amdgpu_sched_run_job(job);
|
trace_amdgpu_sched_run_job(job);
|
||||||
r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs,
|
r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs,
|
||||||
|
@ -223,16 +223,16 @@ int amdgpu_sync_resv(struct amdgpu_device *adev,
|
|||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* amdgpu_sync_is_idle - test if all fences are signaled
|
* amdgpu_sync_peek_fence - get the next fence not signaled yet
|
||||||
*
|
*
|
||||||
* @sync: the sync object
|
* @sync: the sync object
|
||||||
* @ring: optional ring to use for test
|
* @ring: optional ring to use for test
|
||||||
*
|
*
|
||||||
* Returns true if all fences in the sync object are signaled or scheduled to
|
* Returns the next fence not signaled yet without removing it from the sync
|
||||||
* the ring (if provided).
|
* object.
|
||||||
*/
|
*/
|
||||||
bool amdgpu_sync_is_idle(struct amdgpu_sync *sync,
|
struct fence *amdgpu_sync_peek_fence(struct amdgpu_sync *sync,
|
||||||
struct amdgpu_ring *ring)
|
struct amdgpu_ring *ring)
|
||||||
{
|
{
|
||||||
struct amdgpu_sync_entry *e;
|
struct amdgpu_sync_entry *e;
|
||||||
struct hlist_node *tmp;
|
struct hlist_node *tmp;
|
||||||
@ -246,9 +246,12 @@ bool amdgpu_sync_is_idle(struct amdgpu_sync *sync,
|
|||||||
/* For fences from the same ring it is sufficient
|
/* For fences from the same ring it is sufficient
|
||||||
* when they are scheduled.
|
* when they are scheduled.
|
||||||
*/
|
*/
|
||||||
if (s_fence->sched == &ring->sched &&
|
if (s_fence->sched == &ring->sched) {
|
||||||
fence_is_signaled(&s_fence->scheduled))
|
if (fence_is_signaled(&s_fence->scheduled))
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
|
return &s_fence->scheduled;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if (fence_is_signaled(f)) {
|
if (fence_is_signaled(f)) {
|
||||||
@ -258,56 +261,10 @@ bool amdgpu_sync_is_idle(struct amdgpu_sync *sync,
|
|||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
return false;
|
return f;
|
||||||
}
|
}
|
||||||
|
|
||||||
return true;
|
return NULL;
|
||||||
}
|
|
||||||
|
|
||||||
/**
|
|
||||||
* amdgpu_sync_cycle_fences - move fences from one sync object into another
|
|
||||||
*
|
|
||||||
* @dst: the destination sync object
|
|
||||||
* @src: the source sync object
|
|
||||||
* @fence: fence to add to source
|
|
||||||
*
|
|
||||||
* Remove all fences from source and put them into destination and add
|
|
||||||
* fence as new one into source.
|
|
||||||
*/
|
|
||||||
int amdgpu_sync_cycle_fences(struct amdgpu_sync *dst, struct amdgpu_sync *src,
|
|
||||||
struct fence *fence)
|
|
||||||
{
|
|
||||||
struct amdgpu_sync_entry *e, *newone;
|
|
||||||
struct hlist_node *tmp;
|
|
||||||
int i;
|
|
||||||
|
|
||||||
/* Allocate the new entry before moving the old ones */
|
|
||||||
newone = kmem_cache_alloc(amdgpu_sync_slab, GFP_KERNEL);
|
|
||||||
if (!newone)
|
|
||||||
return -ENOMEM;
|
|
||||||
|
|
||||||
hash_for_each_safe(src->fences, i, tmp, e, node) {
|
|
||||||
struct fence *f = e->fence;
|
|
||||||
|
|
||||||
hash_del(&e->node);
|
|
||||||
if (fence_is_signaled(f)) {
|
|
||||||
fence_put(f);
|
|
||||||
kmem_cache_free(amdgpu_sync_slab, e);
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (amdgpu_sync_add_later(dst, f)) {
|
|
||||||
kmem_cache_free(amdgpu_sync_slab, e);
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
hash_add(dst->fences, &e->node, f->context);
|
|
||||||
}
|
|
||||||
|
|
||||||
hash_add(src->fences, &newone->node, fence->context);
|
|
||||||
newone->fence = fence_get(fence);
|
|
||||||
|
|
||||||
return 0;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -25,6 +25,7 @@
|
|||||||
* Alex Deucher
|
* Alex Deucher
|
||||||
* Jerome Glisse
|
* Jerome Glisse
|
||||||
*/
|
*/
|
||||||
|
#include <linux/fence-array.h>
|
||||||
#include <drm/drmP.h>
|
#include <drm/drmP.h>
|
||||||
#include <drm/amdgpu_drm.h>
|
#include <drm/amdgpu_drm.h>
|
||||||
#include "amdgpu.h"
|
#include "amdgpu.h"
|
||||||
@ -180,82 +181,116 @@ int amdgpu_vm_grab_id(struct amdgpu_vm *vm, struct amdgpu_ring *ring,
|
|||||||
struct amdgpu_device *adev = ring->adev;
|
struct amdgpu_device *adev = ring->adev;
|
||||||
struct fence *updates = sync->last_vm_update;
|
struct fence *updates = sync->last_vm_update;
|
||||||
struct amdgpu_vm_id *id, *idle;
|
struct amdgpu_vm_id *id, *idle;
|
||||||
unsigned i = ring->idx;
|
struct fence **fences;
|
||||||
int r;
|
unsigned i;
|
||||||
|
int r = 0;
|
||||||
|
|
||||||
|
fences = kmalloc_array(sizeof(void *), adev->vm_manager.num_ids,
|
||||||
|
GFP_KERNEL);
|
||||||
|
if (!fences)
|
||||||
|
return -ENOMEM;
|
||||||
|
|
||||||
mutex_lock(&adev->vm_manager.lock);
|
mutex_lock(&adev->vm_manager.lock);
|
||||||
|
|
||||||
/* Check if we have an idle VMID */
|
/* Check if we have an idle VMID */
|
||||||
|
i = 0;
|
||||||
list_for_each_entry(idle, &adev->vm_manager.ids_lru, list) {
|
list_for_each_entry(idle, &adev->vm_manager.ids_lru, list) {
|
||||||
if (amdgpu_sync_is_idle(&idle->active, ring))
|
fences[i] = amdgpu_sync_peek_fence(&idle->active, ring);
|
||||||
|
if (!fences[i])
|
||||||
break;
|
break;
|
||||||
|
++i;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* If we can't find a idle VMID to use, just wait for the oldest */
|
/* If we can't find an idle VMID to use, wait till one becomes available */
|
||||||
if (&idle->list == &adev->vm_manager.ids_lru) {
|
if (&idle->list == &adev->vm_manager.ids_lru) {
|
||||||
id = list_first_entry(&adev->vm_manager.ids_lru,
|
u64 fence_context = adev->vm_manager.fence_context + ring->idx;
|
||||||
struct amdgpu_vm_id,
|
unsigned seqno = ++adev->vm_manager.seqno[ring->idx];
|
||||||
list);
|
struct fence_array *array;
|
||||||
} else {
|
unsigned j;
|
||||||
/* Check if we can use a VMID already assigned to this VM */
|
|
||||||
do {
|
|
||||||
struct fence *flushed;
|
|
||||||
|
|
||||||
id = vm->ids[i++];
|
for (j = 0; j < i; ++j)
|
||||||
if (i == AMDGPU_MAX_RINGS)
|
fence_get(fences[j]);
|
||||||
i = 0;
|
|
||||||
|
|
||||||
/* Check all the prerequisites to using this VMID */
|
array = fence_array_create(i, fences, fence_context,
|
||||||
if (!id)
|
seqno, true);
|
||||||
continue;
|
if (!array) {
|
||||||
|
for (j = 0; j < i; ++j)
|
||||||
|
fence_put(fences[j]);
|
||||||
|
kfree(fences);
|
||||||
|
r = -ENOMEM;
|
||||||
|
goto error;
|
||||||
|
}
|
||||||
|
|
||||||
if (atomic64_read(&id->owner) != vm->client_id)
|
|
||||||
continue;
|
|
||||||
|
|
||||||
if (pd_addr != id->pd_gpu_addr)
|
r = amdgpu_sync_fence(ring->adev, sync, &array->base);
|
||||||
continue;
|
fence_put(&array->base);
|
||||||
|
if (r)
|
||||||
|
goto error;
|
||||||
|
|
||||||
if (id->last_user != ring && (!id->last_flush ||
|
mutex_unlock(&adev->vm_manager.lock);
|
||||||
!fence_is_signaled(id->last_flush)))
|
return 0;
|
||||||
continue;
|
|
||||||
|
|
||||||
flushed = id->flushed_updates;
|
}
|
||||||
if (updates && (!flushed ||
|
kfree(fences);
|
||||||
fence_is_later(updates, flushed)))
|
|
||||||
continue;
|
|
||||||
|
|
||||||
/* Good we can use this VMID */
|
/* Check if we can use a VMID already assigned to this VM */
|
||||||
if (id->last_user == ring) {
|
i = ring->idx;
|
||||||
r = amdgpu_sync_fence(ring->adev, sync,
|
do {
|
||||||
id->first);
|
struct fence *flushed;
|
||||||
if (r)
|
|
||||||
goto error;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* And remember this submission as user of the VMID */
|
id = vm->ids[i++];
|
||||||
r = amdgpu_sync_fence(ring->adev, &id->active, fence);
|
if (i == AMDGPU_MAX_RINGS)
|
||||||
|
i = 0;
|
||||||
|
|
||||||
|
/* Check all the prerequisites to using this VMID */
|
||||||
|
if (!id)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
if (atomic64_read(&id->owner) != vm->client_id)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
if (pd_addr != id->pd_gpu_addr)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
if (id->last_user != ring &&
|
||||||
|
(!id->last_flush || !fence_is_signaled(id->last_flush)))
|
||||||
|
continue;
|
||||||
|
|
||||||
|
flushed = id->flushed_updates;
|
||||||
|
if (updates &&
|
||||||
|
(!flushed || fence_is_later(updates, flushed)))
|
||||||
|
continue;
|
||||||
|
|
||||||
|
/* Good we can use this VMID */
|
||||||
|
if (id->last_user == ring) {
|
||||||
|
r = amdgpu_sync_fence(ring->adev, sync,
|
||||||
|
id->first);
|
||||||
if (r)
|
if (r)
|
||||||
goto error;
|
goto error;
|
||||||
|
}
|
||||||
|
|
||||||
list_move_tail(&id->list, &adev->vm_manager.ids_lru);
|
/* And remember this submission as user of the VMID */
|
||||||
vm->ids[ring->idx] = id;
|
r = amdgpu_sync_fence(ring->adev, &id->active, fence);
|
||||||
|
if (r)
|
||||||
|
goto error;
|
||||||
|
|
||||||
*vm_id = id - adev->vm_manager.ids;
|
list_move_tail(&id->list, &adev->vm_manager.ids_lru);
|
||||||
*vm_pd_addr = AMDGPU_VM_NO_FLUSH;
|
vm->ids[ring->idx] = id;
|
||||||
trace_amdgpu_vm_grab_id(vm, ring->idx, *vm_id,
|
|
||||||
*vm_pd_addr);
|
|
||||||
|
|
||||||
mutex_unlock(&adev->vm_manager.lock);
|
*vm_id = id - adev->vm_manager.ids;
|
||||||
return 0;
|
*vm_pd_addr = AMDGPU_VM_NO_FLUSH;
|
||||||
|
trace_amdgpu_vm_grab_id(vm, ring->idx, *vm_id, *vm_pd_addr);
|
||||||
|
|
||||||
} while (i != ring->idx);
|
mutex_unlock(&adev->vm_manager.lock);
|
||||||
|
return 0;
|
||||||
|
|
||||||
/* Still no ID to use? Then use the idle one found earlier */
|
} while (i != ring->idx);
|
||||||
id = idle;
|
|
||||||
}
|
|
||||||
|
|
||||||
r = amdgpu_sync_cycle_fences(sync, &id->active, fence);
|
/* Still no ID to use? Then use the idle one found earlier */
|
||||||
|
id = idle;
|
||||||
|
|
||||||
|
/* Remember this submission as user of the VMID */
|
||||||
|
r = amdgpu_sync_fence(ring->adev, &id->active, fence);
|
||||||
if (r)
|
if (r)
|
||||||
goto error;
|
goto error;
|
||||||
|
|
||||||
@ -1515,6 +1550,10 @@ void amdgpu_vm_manager_init(struct amdgpu_device *adev)
|
|||||||
&adev->vm_manager.ids_lru);
|
&adev->vm_manager.ids_lru);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
adev->vm_manager.fence_context = fence_context_alloc(AMDGPU_MAX_RINGS);
|
||||||
|
for (i = 0; i < AMDGPU_MAX_RINGS; ++i)
|
||||||
|
adev->vm_manager.seqno[i] = 0;
|
||||||
|
|
||||||
atomic_set(&adev->vm_manager.vm_pte_next_ring, 0);
|
atomic_set(&adev->vm_manager.vm_pte_next_ring, 0);
|
||||||
atomic64_set(&adev->vm_manager.client_counter, 0);
|
atomic64_set(&adev->vm_manager.client_counter, 0);
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user