Commit 7fc11959 authored by Christian König, committed by Alex Deucher

drm/amdgpu: stop using addr to check for BO move v3

It is theoretically possible that a swapped out BO gets the
same GTT address, but different backing pages while being swapped in.

Instead just use another VA state to note updated areas.
Ported from the not-yet-upstream radeon commit with the same name.

v2: fix some bugs in the original implementation found in the radeon code.
v3: squash in VCE/UVD fix
Signed-off-by: Christian König <christian.koenig@amd.com>
Reviewed-by: Alex Deucher <alexander.deucher@amd.com>
parent 7f06c236
...@@ -539,14 +539,16 @@ struct amdgpu_bo_va_mapping { ...@@ -539,14 +539,16 @@ struct amdgpu_bo_va_mapping {
struct amdgpu_bo_va { struct amdgpu_bo_va {
/* protected by bo being reserved */ /* protected by bo being reserved */
struct list_head bo_list; struct list_head bo_list;
uint64_t addr;
struct amdgpu_fence *last_pt_update; struct amdgpu_fence *last_pt_update;
unsigned ref_count; unsigned ref_count;
/* protected by vm mutex */ /* protected by vm mutex and spinlock */
struct list_head mappings;
struct list_head vm_status; struct list_head vm_status;
/* mappings for this bo_va */
struct list_head invalids;
struct list_head valids;
/* constant after initialization */ /* constant after initialization */
struct amdgpu_vm *vm; struct amdgpu_vm *vm;
struct amdgpu_bo *bo; struct amdgpu_bo *bo;
...@@ -964,13 +966,16 @@ struct amdgpu_vm { ...@@ -964,13 +966,16 @@ struct amdgpu_vm {
struct rb_root va; struct rb_root va;
/* protecting invalidated and freed */ /* protecting invalidated */
spinlock_t status_lock; spinlock_t status_lock;
/* BOs moved, but not yet updated in the PT */ /* BOs moved, but not yet updated in the PT */
struct list_head invalidated; struct list_head invalidated;
/* BOs freed, but not yet updated in the PT */ /* BOs cleared in the PT because of a move */
struct list_head cleared;
/* BO mappings freed, but not yet updated in the PT */
struct list_head freed; struct list_head freed;
/* contains the page directory */ /* contains the page directory */
......
...@@ -1009,7 +1009,16 @@ amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser, ...@@ -1009,7 +1009,16 @@ amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser,
if (!reloc->bo_va) if (!reloc->bo_va)
continue; continue;
list_for_each_entry(mapping, &reloc->bo_va->mappings, list) { list_for_each_entry(mapping, &reloc->bo_va->valids, list) {
if (mapping->it.start > addr ||
addr > mapping->it.last)
continue;
*bo = reloc->bo_va->bo;
return mapping;
}
list_for_each_entry(mapping, &reloc->bo_va->invalids, list) {
if (mapping->it.start > addr || if (mapping->it.start > addr ||
addr > mapping->it.last) addr > mapping->it.last)
continue; continue;
......
...@@ -951,21 +951,24 @@ int amdgpu_vm_bo_update(struct amdgpu_device *adev, ...@@ -951,21 +951,24 @@ int amdgpu_vm_bo_update(struct amdgpu_device *adev,
addr = 0; addr = 0;
} }
if (addr == bo_va->addr)
return 0;
flags = amdgpu_ttm_tt_pte_flags(adev, bo_va->bo->tbo.ttm, mem); flags = amdgpu_ttm_tt_pte_flags(adev, bo_va->bo->tbo.ttm, mem);
list_for_each_entry(mapping, &bo_va->mappings, list) { spin_lock(&vm->status_lock);
if (!list_empty(&bo_va->vm_status))
list_splice_init(&bo_va->valids, &bo_va->invalids);
spin_unlock(&vm->status_lock);
list_for_each_entry(mapping, &bo_va->invalids, list) {
r = amdgpu_vm_bo_update_mapping(adev, vm, mapping, addr, r = amdgpu_vm_bo_update_mapping(adev, vm, mapping, addr,
flags, &bo_va->last_pt_update); flags, &bo_va->last_pt_update);
if (r) if (r)
return r; return r;
} }
bo_va->addr = addr;
spin_lock(&vm->status_lock); spin_lock(&vm->status_lock);
list_del_init(&bo_va->vm_status); list_del_init(&bo_va->vm_status);
if (!mem)
list_add(&bo_va->vm_status, &vm->cleared);
spin_unlock(&vm->status_lock); spin_unlock(&vm->status_lock);
return 0; return 0;
...@@ -1065,10 +1068,10 @@ struct amdgpu_bo_va *amdgpu_vm_bo_add(struct amdgpu_device *adev, ...@@ -1065,10 +1068,10 @@ struct amdgpu_bo_va *amdgpu_vm_bo_add(struct amdgpu_device *adev,
} }
bo_va->vm = vm; bo_va->vm = vm;
bo_va->bo = bo; bo_va->bo = bo;
bo_va->addr = 0;
bo_va->ref_count = 1; bo_va->ref_count = 1;
INIT_LIST_HEAD(&bo_va->bo_list); INIT_LIST_HEAD(&bo_va->bo_list);
INIT_LIST_HEAD(&bo_va->mappings); INIT_LIST_HEAD(&bo_va->valids);
INIT_LIST_HEAD(&bo_va->invalids);
INIT_LIST_HEAD(&bo_va->vm_status); INIT_LIST_HEAD(&bo_va->vm_status);
mutex_lock(&vm->mutex); mutex_lock(&vm->mutex);
...@@ -1157,12 +1160,10 @@ int amdgpu_vm_bo_map(struct amdgpu_device *adev, ...@@ -1157,12 +1160,10 @@ int amdgpu_vm_bo_map(struct amdgpu_device *adev,
mapping->offset = offset; mapping->offset = offset;
mapping->flags = flags; mapping->flags = flags;
list_add(&mapping->list, &bo_va->mappings); list_add(&mapping->list, &bo_va->invalids);
interval_tree_insert(&mapping->it, &vm->va); interval_tree_insert(&mapping->it, &vm->va);
trace_amdgpu_vm_bo_map(bo_va, mapping); trace_amdgpu_vm_bo_map(bo_va, mapping);
bo_va->addr = 0;
/* Make sure the page tables are allocated */ /* Make sure the page tables are allocated */
saddr >>= amdgpu_vm_block_size; saddr >>= amdgpu_vm_block_size;
eaddr >>= amdgpu_vm_block_size; eaddr >>= amdgpu_vm_block_size;
...@@ -1243,17 +1244,27 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev, ...@@ -1243,17 +1244,27 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev,
{ {
struct amdgpu_bo_va_mapping *mapping; struct amdgpu_bo_va_mapping *mapping;
struct amdgpu_vm *vm = bo_va->vm; struct amdgpu_vm *vm = bo_va->vm;
bool valid = true;
saddr /= AMDGPU_GPU_PAGE_SIZE; saddr /= AMDGPU_GPU_PAGE_SIZE;
list_for_each_entry(mapping, &bo_va->mappings, list) { list_for_each_entry(mapping, &bo_va->valids, list) {
if (mapping->it.start == saddr) if (mapping->it.start == saddr)
break; break;
} }
if (&mapping->list == &bo_va->mappings) { if (&mapping->list == &bo_va->valids) {
amdgpu_bo_unreserve(bo_va->bo); valid = false;
return -ENOENT;
list_for_each_entry(mapping, &bo_va->invalids, list) {
if (mapping->it.start == saddr)
break;
}
if (&mapping->list == &bo_va->invalids) {
amdgpu_bo_unreserve(bo_va->bo);
return -ENOENT;
}
} }
mutex_lock(&vm->mutex); mutex_lock(&vm->mutex);
...@@ -1261,12 +1272,10 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev, ...@@ -1261,12 +1272,10 @@ int amdgpu_vm_bo_unmap(struct amdgpu_device *adev,
interval_tree_remove(&mapping->it, &vm->va); interval_tree_remove(&mapping->it, &vm->va);
trace_amdgpu_vm_bo_unmap(bo_va, mapping); trace_amdgpu_vm_bo_unmap(bo_va, mapping);
if (bo_va->addr) { if (valid)
/* clear the old address */
list_add(&mapping->list, &vm->freed); list_add(&mapping->list, &vm->freed);
} else { else
kfree(mapping); kfree(mapping);
}
mutex_unlock(&vm->mutex); mutex_unlock(&vm->mutex);
amdgpu_bo_unreserve(bo_va->bo); amdgpu_bo_unreserve(bo_va->bo);
...@@ -1297,15 +1306,18 @@ void amdgpu_vm_bo_rmv(struct amdgpu_device *adev, ...@@ -1297,15 +1306,18 @@ void amdgpu_vm_bo_rmv(struct amdgpu_device *adev,
list_del(&bo_va->vm_status); list_del(&bo_va->vm_status);
spin_unlock(&vm->status_lock); spin_unlock(&vm->status_lock);
list_for_each_entry_safe(mapping, next, &bo_va->mappings, list) { list_for_each_entry_safe(mapping, next, &bo_va->valids, list) {
list_del(&mapping->list); list_del(&mapping->list);
interval_tree_remove(&mapping->it, &vm->va); interval_tree_remove(&mapping->it, &vm->va);
trace_amdgpu_vm_bo_unmap(bo_va, mapping); trace_amdgpu_vm_bo_unmap(bo_va, mapping);
if (bo_va->addr) list_add(&mapping->list, &vm->freed);
list_add(&mapping->list, &vm->freed); }
else list_for_each_entry_safe(mapping, next, &bo_va->invalids, list) {
kfree(mapping); list_del(&mapping->list);
interval_tree_remove(&mapping->it, &vm->va);
kfree(mapping);
} }
amdgpu_fence_unref(&bo_va->last_pt_update); amdgpu_fence_unref(&bo_va->last_pt_update);
kfree(bo_va); kfree(bo_va);
...@@ -1327,12 +1339,10 @@ void amdgpu_vm_bo_invalidate(struct amdgpu_device *adev, ...@@ -1327,12 +1339,10 @@ void amdgpu_vm_bo_invalidate(struct amdgpu_device *adev,
struct amdgpu_bo_va *bo_va; struct amdgpu_bo_va *bo_va;
list_for_each_entry(bo_va, &bo->va, bo_list) { list_for_each_entry(bo_va, &bo->va, bo_list) {
if (bo_va->addr) { spin_lock(&bo_va->vm->status_lock);
spin_lock(&bo_va->vm->status_lock); if (list_empty(&bo_va->vm_status))
list_del(&bo_va->vm_status);
list_add(&bo_va->vm_status, &bo_va->vm->invalidated); list_add(&bo_va->vm_status, &bo_va->vm->invalidated);
spin_unlock(&bo_va->vm->status_lock); spin_unlock(&bo_va->vm->status_lock);
}
} }
} }
...@@ -1360,6 +1370,7 @@ int amdgpu_vm_init(struct amdgpu_device *adev, struct amdgpu_vm *vm) ...@@ -1360,6 +1370,7 @@ int amdgpu_vm_init(struct amdgpu_device *adev, struct amdgpu_vm *vm)
vm->va = RB_ROOT; vm->va = RB_ROOT;
spin_lock_init(&vm->status_lock); spin_lock_init(&vm->status_lock);
INIT_LIST_HEAD(&vm->invalidated); INIT_LIST_HEAD(&vm->invalidated);
INIT_LIST_HEAD(&vm->cleared);
INIT_LIST_HEAD(&vm->freed); INIT_LIST_HEAD(&vm->freed);
pd_size = amdgpu_vm_directory_size(adev); pd_size = amdgpu_vm_directory_size(adev);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment