drm/i915: Use the vma resource as argument for gtt binding / unbinding
When introducing asynchronous unbinding, the vma itself may no longer be alive when the actual binding or unbinding takes place. Update the gtt i915_vma_ops accordingly to take a struct i915_vma_resource instead of a struct i915_vma for the bind_vma() and unbind_vma() ops. Similarly change the insert_entries() op for struct i915_address_space. Replace a couple of i915_vma_snapshot members with their newly introduced i915_vma_resource counterparts, since they have the same lifetime. Also make sure to avoid changing the struct i915_vma_flags (in particular the bind flags) async. That should now only be done sync under the vm mutex. v2: - Update the vma_res::bound_flags when binding to the aliased ggtt v6: - Remove I915_VMA_ALLOC_BIT (Matthew Auld) - Change some members of struct i915_vma_resource from unsigned long to u64 (Matthew Auld) v7: - Fix vma resource size parameters to be u64 rather than unsigned long (Matthew Auld) Signed-off-by: Thomas Hellström <thomas.hellstrom@linux.intel.com> Reviewed-by: Matthew Auld <matthew.auld@intel.com> Link: https://patchwork.freedesktop.org/patch/msgid/20220110172219.107131-3-thomas.hellstrom@linux.intel.com
This commit is contained in:
parent
e1a4bbb6e8
commit
39a2bd34c9
@ -48,7 +48,7 @@ static void dpt_insert_page(struct i915_address_space *vm,
|
||||
}
|
||||
|
||||
static void dpt_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level level,
|
||||
u32 flags)
|
||||
{
|
||||
@ -64,8 +64,8 @@ static void dpt_insert_entries(struct i915_address_space *vm,
|
||||
* not to allow the user to override access to a read only page.
|
||||
*/
|
||||
|
||||
i = vma->node.start / I915_GTT_PAGE_SIZE;
|
||||
for_each_sgt_daddr(addr, sgt_iter, vma->pages)
|
||||
i = vma_res->start / I915_GTT_PAGE_SIZE;
|
||||
for_each_sgt_daddr(addr, sgt_iter, vma_res->bi.pages)
|
||||
gen8_set_pte(&base[i++], pte_encode | addr);
|
||||
}
|
||||
|
||||
@ -76,35 +76,38 @@ static void dpt_clear_range(struct i915_address_space *vm,
|
||||
|
||||
static void dpt_bind_vma(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
struct drm_i915_gem_object *obj = vma->obj;
|
||||
u32 pte_flags;
|
||||
|
||||
if (vma_res->bound_flags)
|
||||
return;
|
||||
|
||||
/* Applicable to VLV (gen8+ do not support RO in the GGTT) */
|
||||
pte_flags = 0;
|
||||
if (vma->vm->has_read_only && i915_gem_object_is_readonly(obj))
|
||||
if (vm->has_read_only && vma_res->bi.readonly)
|
||||
pte_flags |= PTE_READ_ONLY;
|
||||
if (i915_gem_object_is_lmem(obj))
|
||||
if (vma_res->bi.lmem)
|
||||
pte_flags |= PTE_LM;
|
||||
|
||||
vma->vm->insert_entries(vma->vm, vma, cache_level, pte_flags);
|
||||
vm->insert_entries(vm, vma_res, cache_level, pte_flags);
|
||||
|
||||
vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
|
||||
vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
|
||||
|
||||
/*
|
||||
* Without aliasing PPGTT there's no difference between
|
||||
* GLOBAL/LOCAL_BIND, it's all the same ptes. Hence unconditionally
|
||||
* upgrade to both bound if we bind either to avoid double-binding.
|
||||
*/
|
||||
atomic_or(I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND, &vma->flags);
|
||||
vma_res->bound_flags = I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND;
|
||||
}
|
||||
|
||||
static void dpt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
|
||||
static void dpt_unbind_vma(struct i915_address_space *vm,
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
vm->clear_range(vm, vma->node.start, vma->size);
|
||||
vm->clear_range(vm, vma_res->start, vma_res->vma_size);
|
||||
}
|
||||
|
||||
static void dpt_cleanup(struct i915_address_space *vm)
|
||||
|
@ -15,6 +15,7 @@
|
||||
|
||||
#include "i915_active.h"
|
||||
#include "i915_selftest.h"
|
||||
#include "i915_vma_resource.h"
|
||||
|
||||
struct drm_i915_gem_object;
|
||||
struct intel_fronbuffer;
|
||||
@ -566,31 +567,7 @@ struct drm_i915_gem_object {
|
||||
struct sg_table *pages;
|
||||
void *mapping;
|
||||
|
||||
struct i915_page_sizes {
|
||||
/**
|
||||
* The sg mask of the pages sg_table. i.e the mask of
|
||||
* of the lengths for each sg entry.
|
||||
*/
|
||||
unsigned int phys;
|
||||
|
||||
/**
|
||||
* The gtt page sizes we are allowed to use given the
|
||||
* sg mask and the supported page sizes. This will
|
||||
* express the smallest unit we can use for the whole
|
||||
* object, as well as the larger sizes we may be able
|
||||
* to use opportunistically.
|
||||
*/
|
||||
unsigned int sg;
|
||||
|
||||
/**
|
||||
* The actual gtt page size usage. Since we can have
|
||||
* multiple vma associated with this object we need to
|
||||
* prevent any trampling of state, hence a copy of this
|
||||
* struct also lives in each vma, therefore the gtt
|
||||
* value here should only be read/write through the vma.
|
||||
*/
|
||||
unsigned int gtt;
|
||||
} page_sizes;
|
||||
struct i915_page_sizes page_sizes;
|
||||
|
||||
I915_SELFTEST_DECLARE(unsigned int page_mask);
|
||||
|
||||
|
@ -370,9 +370,9 @@ static int igt_check_page_sizes(struct i915_vma *vma)
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
if (!HAS_PAGE_SIZES(i915, vma->page_sizes.gtt)) {
|
||||
if (!HAS_PAGE_SIZES(i915, vma->resource->page_sizes_gtt)) {
|
||||
pr_err("unsupported page_sizes.gtt=%u, supported=%u\n",
|
||||
vma->page_sizes.gtt & ~supported, supported);
|
||||
vma->resource->page_sizes_gtt & ~supported, supported);
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
@ -403,15 +403,9 @@ static int igt_check_page_sizes(struct i915_vma *vma)
|
||||
if (i915_gem_object_is_lmem(obj) &&
|
||||
IS_ALIGNED(vma->node.start, SZ_2M) &&
|
||||
vma->page_sizes.sg & SZ_2M &&
|
||||
vma->page_sizes.gtt < SZ_2M) {
|
||||
vma->resource->page_sizes_gtt < SZ_2M) {
|
||||
pr_err("gtt pages mismatch for LMEM, expected 2M GTT pages, sg(%u), gtt(%u)\n",
|
||||
vma->page_sizes.sg, vma->page_sizes.gtt);
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
if (obj->mm.page_sizes.gtt) {
|
||||
pr_err("obj->page_sizes.gtt(%u) should never be set\n",
|
||||
obj->mm.page_sizes.gtt);
|
||||
vma->page_sizes.sg, vma->resource->page_sizes_gtt);
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
@ -547,9 +541,9 @@ static int igt_mock_memory_region_huge_pages(void *arg)
|
||||
goto out_unpin;
|
||||
}
|
||||
|
||||
if (vma->page_sizes.gtt != page_size) {
|
||||
if (vma->resource->page_sizes_gtt != page_size) {
|
||||
pr_err("%s page_sizes.gtt=%u, expected=%u\n",
|
||||
__func__, vma->page_sizes.gtt,
|
||||
__func__, vma->resource->page_sizes_gtt,
|
||||
page_size);
|
||||
err = -EINVAL;
|
||||
goto out_unpin;
|
||||
@ -630,9 +624,9 @@ static int igt_mock_ppgtt_misaligned_dma(void *arg)
|
||||
|
||||
err = igt_check_page_sizes(vma);
|
||||
|
||||
if (vma->page_sizes.gtt != page_size) {
|
||||
if (vma->resource->page_sizes_gtt != page_size) {
|
||||
pr_err("page_sizes.gtt=%u, expected %u\n",
|
||||
vma->page_sizes.gtt, page_size);
|
||||
vma->resource->page_sizes_gtt, page_size);
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
@ -657,9 +651,10 @@ static int igt_mock_ppgtt_misaligned_dma(void *arg)
|
||||
|
||||
err = igt_check_page_sizes(vma);
|
||||
|
||||
if (vma->page_sizes.gtt != I915_GTT_PAGE_SIZE_4K) {
|
||||
if (vma->resource->page_sizes_gtt != I915_GTT_PAGE_SIZE_4K) {
|
||||
pr_err("page_sizes.gtt=%u, expected %llu\n",
|
||||
vma->page_sizes.gtt, I915_GTT_PAGE_SIZE_4K);
|
||||
vma->resource->page_sizes_gtt,
|
||||
I915_GTT_PAGE_SIZE_4K);
|
||||
err = -EINVAL;
|
||||
}
|
||||
|
||||
@ -805,9 +800,9 @@ static int igt_mock_ppgtt_huge_fill(void *arg)
|
||||
}
|
||||
}
|
||||
|
||||
if (vma->page_sizes.gtt != expected_gtt) {
|
||||
if (vma->resource->page_sizes_gtt != expected_gtt) {
|
||||
pr_err("gtt=%u, expected=%u, size=%zd, single=%s\n",
|
||||
vma->page_sizes.gtt, expected_gtt,
|
||||
vma->resource->page_sizes_gtt, expected_gtt,
|
||||
obj->base.size, yesno(!!single));
|
||||
err = -EINVAL;
|
||||
break;
|
||||
@ -961,10 +956,10 @@ static int igt_mock_ppgtt_64K(void *arg)
|
||||
}
|
||||
}
|
||||
|
||||
if (vma->page_sizes.gtt != expected_gtt) {
|
||||
if (vma->resource->page_sizes_gtt != expected_gtt) {
|
||||
pr_err("gtt=%u, expected=%u, i=%d, single=%s\n",
|
||||
vma->page_sizes.gtt, expected_gtt, i,
|
||||
yesno(!!single));
|
||||
vma->resource->page_sizes_gtt,
|
||||
expected_gtt, i, yesno(!!single));
|
||||
err = -EINVAL;
|
||||
goto out_vma_unpin;
|
||||
}
|
||||
|
@ -104,17 +104,17 @@ static void gen6_ppgtt_clear_range(struct i915_address_space *vm,
|
||||
}
|
||||
|
||||
static void gen6_ppgtt_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
struct i915_ppgtt *ppgtt = i915_vm_to_ppgtt(vm);
|
||||
struct i915_page_directory * const pd = ppgtt->pd;
|
||||
unsigned int first_entry = vma->node.start / I915_GTT_PAGE_SIZE;
|
||||
unsigned int first_entry = vma_res->start / I915_GTT_PAGE_SIZE;
|
||||
unsigned int act_pt = first_entry / GEN6_PTES;
|
||||
unsigned int act_pte = first_entry % GEN6_PTES;
|
||||
const u32 pte_encode = vm->pte_encode(0, cache_level, flags);
|
||||
struct sgt_dma iter = sgt_dma(vma);
|
||||
struct sgt_dma iter = sgt_dma(vma_res);
|
||||
gen6_pte_t *vaddr;
|
||||
|
||||
GEM_BUG_ON(!pd->entry[act_pt]);
|
||||
@ -140,7 +140,7 @@ static void gen6_ppgtt_insert_entries(struct i915_address_space *vm,
|
||||
}
|
||||
} while (1);
|
||||
|
||||
vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
|
||||
vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
|
||||
}
|
||||
|
||||
static void gen6_flush_pd(struct gen6_ppgtt *ppgtt, u64 start, u64 end)
|
||||
@ -271,13 +271,13 @@ static void gen6_ppgtt_cleanup(struct i915_address_space *vm)
|
||||
|
||||
static void pd_vma_bind(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 unused)
|
||||
{
|
||||
struct i915_ggtt *ggtt = i915_vm_to_ggtt(vm);
|
||||
struct gen6_ppgtt *ppgtt = vma->private;
|
||||
u32 ggtt_offset = i915_ggtt_offset(vma) / I915_GTT_PAGE_SIZE;
|
||||
struct gen6_ppgtt *ppgtt = vma_res->private;
|
||||
u32 ggtt_offset = vma_res->start / I915_GTT_PAGE_SIZE;
|
||||
|
||||
ppgtt->pp_dir = ggtt_offset * sizeof(gen6_pte_t) << 10;
|
||||
ppgtt->pd_addr = (gen6_pte_t __iomem *)ggtt->gsm + ggtt_offset;
|
||||
@ -285,9 +285,10 @@ static void pd_vma_bind(struct i915_address_space *vm,
|
||||
gen6_flush_pd(ppgtt, 0, ppgtt->base.vm.total);
|
||||
}
|
||||
|
||||
static void pd_vma_unbind(struct i915_address_space *vm, struct i915_vma *vma)
|
||||
static void pd_vma_unbind(struct i915_address_space *vm,
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
struct gen6_ppgtt *ppgtt = vma->private;
|
||||
struct gen6_ppgtt *ppgtt = vma_res->private;
|
||||
struct i915_page_directory * const pd = ppgtt->base.pd;
|
||||
struct i915_page_table *pt;
|
||||
unsigned int pde;
|
||||
|
@ -453,20 +453,21 @@ gen8_ppgtt_insert_pte(struct i915_ppgtt *ppgtt,
|
||||
return idx;
|
||||
}
|
||||
|
||||
static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
static void gen8_ppgtt_insert_huge(struct i915_address_space *vm,
|
||||
struct i915_vma_resource *vma_res,
|
||||
struct sgt_dma *iter,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
const gen8_pte_t pte_encode = gen8_pte_encode(0, cache_level, flags);
|
||||
unsigned int rem = sg_dma_len(iter->sg);
|
||||
u64 start = vma->node.start;
|
||||
u64 start = vma_res->start;
|
||||
|
||||
GEM_BUG_ON(!i915_vm_is_4lvl(vma->vm));
|
||||
GEM_BUG_ON(!i915_vm_is_4lvl(vm));
|
||||
|
||||
do {
|
||||
struct i915_page_directory * const pdp =
|
||||
gen8_pdp_for_page_address(vma->vm, start);
|
||||
gen8_pdp_for_page_address(vm, start);
|
||||
struct i915_page_directory * const pd =
|
||||
i915_pd_entry(pdp, __gen8_pte_index(start, 2));
|
||||
gen8_pte_t encode = pte_encode;
|
||||
@ -475,7 +476,7 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
gen8_pte_t *vaddr;
|
||||
u16 index;
|
||||
|
||||
if (vma->page_sizes.sg & I915_GTT_PAGE_SIZE_2M &&
|
||||
if (vma_res->bi.page_sizes.sg & I915_GTT_PAGE_SIZE_2M &&
|
||||
IS_ALIGNED(iter->dma, I915_GTT_PAGE_SIZE_2M) &&
|
||||
rem >= I915_GTT_PAGE_SIZE_2M &&
|
||||
!__gen8_pte_index(start, 0)) {
|
||||
@ -492,7 +493,7 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
page_size = I915_GTT_PAGE_SIZE;
|
||||
|
||||
if (!index &&
|
||||
vma->page_sizes.sg & I915_GTT_PAGE_SIZE_64K &&
|
||||
vma_res->bi.page_sizes.sg & I915_GTT_PAGE_SIZE_64K &&
|
||||
IS_ALIGNED(iter->dma, I915_GTT_PAGE_SIZE_64K) &&
|
||||
(IS_ALIGNED(rem, I915_GTT_PAGE_SIZE_64K) ||
|
||||
rem >= (I915_PDES - index) * I915_GTT_PAGE_SIZE))
|
||||
@ -541,9 +542,9 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
*/
|
||||
if (maybe_64K != -1 &&
|
||||
(index == I915_PDES ||
|
||||
(i915_vm_has_scratch_64K(vma->vm) &&
|
||||
!iter->sg && IS_ALIGNED(vma->node.start +
|
||||
vma->node.size,
|
||||
(i915_vm_has_scratch_64K(vm) &&
|
||||
!iter->sg && IS_ALIGNED(vma_res->start +
|
||||
vma_res->node_size,
|
||||
I915_GTT_PAGE_SIZE_2M)))) {
|
||||
vaddr = px_vaddr(pd);
|
||||
vaddr[maybe_64K] |= GEN8_PDE_IPS_64K;
|
||||
@ -559,10 +560,10 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
* instead - which we detect as missing results during
|
||||
* selftests.
|
||||
*/
|
||||
if (I915_SELFTEST_ONLY(vma->vm->scrub_64K)) {
|
||||
if (I915_SELFTEST_ONLY(vm->scrub_64K)) {
|
||||
u16 i;
|
||||
|
||||
encode = vma->vm->scratch[0]->encode;
|
||||
encode = vm->scratch[0]->encode;
|
||||
vaddr = px_vaddr(i915_pt_entry(pd, maybe_64K));
|
||||
|
||||
for (i = 1; i < index; i += 16)
|
||||
@ -572,22 +573,22 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
|
||||
}
|
||||
}
|
||||
|
||||
vma->page_sizes.gtt |= page_size;
|
||||
vma_res->page_sizes_gtt |= page_size;
|
||||
} while (iter->sg && sg_dma_len(iter->sg));
|
||||
}
|
||||
|
||||
static void gen8_ppgtt_insert(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
struct i915_ppgtt * const ppgtt = i915_vm_to_ppgtt(vm);
|
||||
struct sgt_dma iter = sgt_dma(vma);
|
||||
struct sgt_dma iter = sgt_dma(vma_res);
|
||||
|
||||
if (vma->page_sizes.sg > I915_GTT_PAGE_SIZE) {
|
||||
gen8_ppgtt_insert_huge(vma, &iter, cache_level, flags);
|
||||
if (vma_res->bi.page_sizes.sg > I915_GTT_PAGE_SIZE) {
|
||||
gen8_ppgtt_insert_huge(vm, vma_res, &iter, cache_level, flags);
|
||||
} else {
|
||||
u64 idx = vma->node.start >> GEN8_PTE_SHIFT;
|
||||
u64 idx = vma_res->start >> GEN8_PTE_SHIFT;
|
||||
|
||||
do {
|
||||
struct i915_page_directory * const pdp =
|
||||
@ -597,7 +598,7 @@ static void gen8_ppgtt_insert(struct i915_address_space *vm,
|
||||
cache_level, flags);
|
||||
} while (idx);
|
||||
|
||||
vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
|
||||
vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -1718,8 +1718,8 @@ static void print_request_ring(struct drm_printer *m, struct i915_request *rq)
|
||||
drm_printf(m,
|
||||
"[head %04x, postfix %04x, tail %04x, batch 0x%08x_%08x]:\n",
|
||||
rq->head, rq->postfix, rq->tail,
|
||||
vsnap ? upper_32_bits(vsnap->gtt_offset) : ~0u,
|
||||
vsnap ? lower_32_bits(vsnap->gtt_offset) : ~0u);
|
||||
vsnap ? upper_32_bits(vsnap->vma_resource->start) : ~0u,
|
||||
vsnap ? lower_32_bits(vsnap->vma_resource->start) : ~0u);
|
||||
|
||||
size = rq->tail - rq->head;
|
||||
if (rq->tail < rq->head)
|
||||
|
@ -218,7 +218,7 @@ static void gen8_ggtt_insert_page(struct i915_address_space *vm,
|
||||
}
|
||||
|
||||
static void gen8_ggtt_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level level,
|
||||
u32 flags)
|
||||
{
|
||||
@ -235,10 +235,10 @@ static void gen8_ggtt_insert_entries(struct i915_address_space *vm,
|
||||
*/
|
||||
|
||||
gte = (gen8_pte_t __iomem *)ggtt->gsm;
|
||||
gte += vma->node.start / I915_GTT_PAGE_SIZE;
|
||||
end = gte + vma->node.size / I915_GTT_PAGE_SIZE;
|
||||
gte += vma_res->start / I915_GTT_PAGE_SIZE;
|
||||
end = gte + vma_res->node_size / I915_GTT_PAGE_SIZE;
|
||||
|
||||
for_each_sgt_daddr(addr, iter, vma->pages)
|
||||
for_each_sgt_daddr(addr, iter, vma_res->bi.pages)
|
||||
gen8_set_pte(gte++, pte_encode | addr);
|
||||
GEM_BUG_ON(gte > end);
|
||||
|
||||
@ -275,7 +275,7 @@ static void gen6_ggtt_insert_page(struct i915_address_space *vm,
|
||||
* through the GMADR mapped BAR (i915->mm.gtt->gtt).
|
||||
*/
|
||||
static void gen6_ggtt_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level level,
|
||||
u32 flags)
|
||||
{
|
||||
@ -286,10 +286,10 @@ static void gen6_ggtt_insert_entries(struct i915_address_space *vm,
|
||||
dma_addr_t addr;
|
||||
|
||||
gte = (gen6_pte_t __iomem *)ggtt->gsm;
|
||||
gte += vma->node.start / I915_GTT_PAGE_SIZE;
|
||||
end = gte + vma->node.size / I915_GTT_PAGE_SIZE;
|
||||
gte += vma_res->start / I915_GTT_PAGE_SIZE;
|
||||
end = gte + vma_res->node_size / I915_GTT_PAGE_SIZE;
|
||||
|
||||
for_each_sgt_daddr(addr, iter, vma->pages)
|
||||
for_each_sgt_daddr(addr, iter, vma_res->bi.pages)
|
||||
iowrite32(vm->pte_encode(addr, level, flags), gte++);
|
||||
GEM_BUG_ON(gte > end);
|
||||
|
||||
@ -372,7 +372,7 @@ static void bxt_vtd_ggtt_insert_page__BKL(struct i915_address_space *vm,
|
||||
|
||||
struct insert_entries {
|
||||
struct i915_address_space *vm;
|
||||
struct i915_vma *vma;
|
||||
struct i915_vma_resource *vma_res;
|
||||
enum i915_cache_level level;
|
||||
u32 flags;
|
||||
};
|
||||
@ -381,18 +381,18 @@ static int bxt_vtd_ggtt_insert_entries__cb(void *_arg)
|
||||
{
|
||||
struct insert_entries *arg = _arg;
|
||||
|
||||
gen8_ggtt_insert_entries(arg->vm, arg->vma, arg->level, arg->flags);
|
||||
gen8_ggtt_insert_entries(arg->vm, arg->vma_res, arg->level, arg->flags);
|
||||
bxt_vtd_ggtt_wa(arg->vm);
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void bxt_vtd_ggtt_insert_entries__BKL(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level level,
|
||||
u32 flags)
|
||||
{
|
||||
struct insert_entries arg = { vm, vma, level, flags };
|
||||
struct insert_entries arg = { vm, vma_res, level, flags };
|
||||
|
||||
stop_machine(bxt_vtd_ggtt_insert_entries__cb, &arg, NULL);
|
||||
}
|
||||
@ -431,14 +431,14 @@ static void i915_ggtt_insert_page(struct i915_address_space *vm,
|
||||
}
|
||||
|
||||
static void i915_ggtt_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 unused)
|
||||
{
|
||||
unsigned int flags = (cache_level == I915_CACHE_NONE) ?
|
||||
AGP_USER_MEMORY : AGP_USER_CACHED_MEMORY;
|
||||
|
||||
intel_gtt_insert_sg_entries(vma->pages, vma->node.start >> PAGE_SHIFT,
|
||||
intel_gtt_insert_sg_entries(vma_res->bi.pages, vma_res->start >> PAGE_SHIFT,
|
||||
flags);
|
||||
}
|
||||
|
||||
@ -450,30 +450,32 @@ static void i915_ggtt_clear_range(struct i915_address_space *vm,
|
||||
|
||||
static void ggtt_bind_vma(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
struct drm_i915_gem_object *obj = vma->obj;
|
||||
u32 pte_flags;
|
||||
|
||||
if (i915_vma_is_bound(vma, ~flags & I915_VMA_BIND_MASK))
|
||||
if (vma_res->bound_flags & (~flags & I915_VMA_BIND_MASK))
|
||||
return;
|
||||
|
||||
vma_res->bound_flags |= flags;
|
||||
|
||||
/* Applicable to VLV (gen8+ do not support RO in the GGTT) */
|
||||
pte_flags = 0;
|
||||
if (i915_gem_object_is_readonly(obj))
|
||||
if (vma_res->bi.readonly)
|
||||
pte_flags |= PTE_READ_ONLY;
|
||||
if (i915_gem_object_is_lmem(obj))
|
||||
if (vma_res->bi.lmem)
|
||||
pte_flags |= PTE_LM;
|
||||
|
||||
vm->insert_entries(vm, vma, cache_level, pte_flags);
|
||||
vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
|
||||
vm->insert_entries(vm, vma_res, cache_level, pte_flags);
|
||||
vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
|
||||
}
|
||||
|
||||
static void ggtt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
|
||||
static void ggtt_unbind_vma(struct i915_address_space *vm,
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
vm->clear_range(vm, vma->node.start, vma->size);
|
||||
vm->clear_range(vm, vma_res->start, vma_res->vma_size);
|
||||
}
|
||||
|
||||
static int ggtt_reserve_guc_top(struct i915_ggtt *ggtt)
|
||||
@ -606,7 +608,7 @@ err:
|
||||
|
||||
static void aliasing_gtt_bind_vma(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
@ -614,25 +616,27 @@ static void aliasing_gtt_bind_vma(struct i915_address_space *vm,
|
||||
|
||||
/* Currently applicable only to VLV */
|
||||
pte_flags = 0;
|
||||
if (i915_gem_object_is_readonly(vma->obj))
|
||||
if (vma_res->bi.readonly)
|
||||
pte_flags |= PTE_READ_ONLY;
|
||||
|
||||
if (flags & I915_VMA_LOCAL_BIND)
|
||||
ppgtt_bind_vma(&i915_vm_to_ggtt(vm)->alias->vm,
|
||||
stash, vma, cache_level, flags);
|
||||
stash, vma_res, cache_level, flags);
|
||||
|
||||
if (flags & I915_VMA_GLOBAL_BIND)
|
||||
vm->insert_entries(vm, vma, cache_level, pte_flags);
|
||||
vm->insert_entries(vm, vma_res, cache_level, pte_flags);
|
||||
|
||||
vma_res->bound_flags |= flags;
|
||||
}
|
||||
|
||||
static void aliasing_gtt_unbind_vma(struct i915_address_space *vm,
|
||||
struct i915_vma *vma)
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
if (i915_vma_is_bound(vma, I915_VMA_GLOBAL_BIND))
|
||||
vm->clear_range(vm, vma->node.start, vma->size);
|
||||
if (vma_res->bound_flags & I915_VMA_GLOBAL_BIND)
|
||||
vm->clear_range(vm, vma_res->start, vma_res->vma_size);
|
||||
|
||||
if (i915_vma_is_bound(vma, I915_VMA_LOCAL_BIND))
|
||||
ppgtt_unbind_vma(&i915_vm_to_ggtt(vm)->alias->vm, vma);
|
||||
if (vma_res->bound_flags & I915_VMA_LOCAL_BIND)
|
||||
ppgtt_unbind_vma(&i915_vm_to_ggtt(vm)->alias->vm, vma_res);
|
||||
}
|
||||
|
||||
static int init_aliasing_ppgtt(struct i915_ggtt *ggtt)
|
||||
@ -1253,7 +1257,7 @@ void i915_ggtt_resume(struct i915_ggtt *ggtt)
|
||||
atomic_read(&vma->flags) & I915_VMA_BIND_MASK;
|
||||
|
||||
GEM_BUG_ON(!was_bound);
|
||||
vma->ops->bind_vma(&ggtt->vm, NULL, vma,
|
||||
vma->ops->bind_vma(&ggtt->vm, NULL, vma->resource,
|
||||
obj ? obj->cache_level : 0,
|
||||
was_bound);
|
||||
if (obj) { /* only used during resume => exclusive access */
|
||||
|
@ -27,6 +27,7 @@
|
||||
|
||||
#include "gt/intel_reset.h"
|
||||
#include "i915_selftest.h"
|
||||
#include "i915_vma_resource.h"
|
||||
#include "i915_vma_types.h"
|
||||
|
||||
#define I915_GFP_ALLOW_FAIL (GFP_KERNEL | __GFP_RETRY_MAYFAIL | __GFP_NOWARN)
|
||||
@ -200,7 +201,7 @@ struct i915_vma_ops {
|
||||
/* Map an object into an address space with the given cache flags. */
|
||||
void (*bind_vma)(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags);
|
||||
/*
|
||||
@ -208,7 +209,8 @@ struct i915_vma_ops {
|
||||
* setting the valid PTE entries to a reserved scratch page.
|
||||
*/
|
||||
void (*unbind_vma)(struct i915_address_space *vm,
|
||||
struct i915_vma *vma);
|
||||
struct i915_vma_resource *vma_res);
|
||||
|
||||
};
|
||||
|
||||
struct i915_address_space {
|
||||
@ -285,7 +287,7 @@ struct i915_address_space {
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags);
|
||||
void (*insert_entries)(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags);
|
||||
void (*cleanup)(struct i915_address_space *vm);
|
||||
@ -598,11 +600,11 @@ void gen6_ggtt_invalidate(struct i915_ggtt *ggtt);
|
||||
|
||||
void ppgtt_bind_vma(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags);
|
||||
void ppgtt_unbind_vma(struct i915_address_space *vm,
|
||||
struct i915_vma *vma);
|
||||
struct i915_vma_resource *vma_res);
|
||||
|
||||
void gtt_write_workarounds(struct intel_gt *gt);
|
||||
|
||||
@ -625,8 +627,8 @@ __vm_create_scratch_for_read_pinned(struct i915_address_space *vm, unsigned long
|
||||
static inline struct sgt_dma {
|
||||
struct scatterlist *sg;
|
||||
dma_addr_t dma, max;
|
||||
} sgt_dma(struct i915_vma *vma) {
|
||||
struct scatterlist *sg = vma->pages->sgl;
|
||||
} sgt_dma(struct i915_vma_resource *vma_res) {
|
||||
struct scatterlist *sg = vma_res->bi.pages->sgl;
|
||||
dma_addr_t addr = sg_dma_address(sg);
|
||||
|
||||
return (struct sgt_dma){ sg, addr, addr + sg_dma_len(sg) };
|
||||
|
@ -179,32 +179,34 @@ struct i915_ppgtt *i915_ppgtt_create(struct intel_gt *gt,
|
||||
|
||||
void ppgtt_bind_vma(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
u32 pte_flags;
|
||||
|
||||
if (!test_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma))) {
|
||||
vm->allocate_va_range(vm, stash, vma->node.start, vma->size);
|
||||
set_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma));
|
||||
if (!vma_res->allocated) {
|
||||
vm->allocate_va_range(vm, stash, vma_res->start,
|
||||
vma_res->vma_size);
|
||||
vma_res->allocated = true;
|
||||
}
|
||||
|
||||
/* Applicable to VLV, and gen8+ */
|
||||
pte_flags = 0;
|
||||
if (i915_gem_object_is_readonly(vma->obj))
|
||||
if (vma_res->bi.readonly)
|
||||
pte_flags |= PTE_READ_ONLY;
|
||||
if (i915_gem_object_is_lmem(vma->obj))
|
||||
if (vma_res->bi.lmem)
|
||||
pte_flags |= PTE_LM;
|
||||
|
||||
vm->insert_entries(vm, vma, cache_level, pte_flags);
|
||||
vm->insert_entries(vm, vma_res, cache_level, pte_flags);
|
||||
wmb();
|
||||
}
|
||||
|
||||
void ppgtt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
|
||||
void ppgtt_unbind_vma(struct i915_address_space *vm,
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
if (test_and_clear_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma)))
|
||||
vm->clear_range(vm, vma->node.start, vma->size);
|
||||
if (vma_res->allocated)
|
||||
vm->clear_range(vm, vma_res->start, vma_res->vma_size);
|
||||
}
|
||||
|
||||
static unsigned long pd_count(u64 size, int shift)
|
||||
|
@ -448,20 +448,19 @@ static void uc_fw_bind_ggtt(struct intel_uc_fw *uc_fw)
|
||||
{
|
||||
struct drm_i915_gem_object *obj = uc_fw->obj;
|
||||
struct i915_ggtt *ggtt = __uc_fw_to_gt(uc_fw)->ggtt;
|
||||
struct i915_vma *dummy = &uc_fw->dummy;
|
||||
struct i915_vma_resource *dummy = &uc_fw->dummy;
|
||||
u32 pte_flags = 0;
|
||||
|
||||
dummy->node.start = uc_fw_ggtt_offset(uc_fw);
|
||||
dummy->node.size = obj->base.size;
|
||||
dummy->pages = obj->mm.pages;
|
||||
dummy->vm = &ggtt->vm;
|
||||
dummy->start = uc_fw_ggtt_offset(uc_fw);
|
||||
dummy->node_size = obj->base.size;
|
||||
dummy->bi.pages = obj->mm.pages;
|
||||
|
||||
GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
|
||||
GEM_BUG_ON(dummy->node.size > ggtt->uc_fw.size);
|
||||
GEM_BUG_ON(dummy->node_size > ggtt->uc_fw.size);
|
||||
|
||||
/* uc_fw->obj cache domains were not controlled across suspend */
|
||||
if (i915_gem_object_has_struct_page(obj))
|
||||
drm_clflush_sg(dummy->pages);
|
||||
drm_clflush_sg(dummy->bi.pages);
|
||||
|
||||
if (i915_gem_object_is_lmem(obj))
|
||||
pte_flags |= PTE_LM;
|
||||
|
@ -85,7 +85,7 @@ struct intel_uc_fw {
|
||||
* threaded as it done during driver load (inherently single threaded)
|
||||
* or during a GT reset (mutex guarantees single threaded).
|
||||
*/
|
||||
struct i915_vma dummy;
|
||||
struct i915_vma_resource dummy;
|
||||
struct i915_vma *rsa_data;
|
||||
|
||||
/*
|
||||
|
@ -171,7 +171,8 @@ i915_debugfs_describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
|
||||
seq_printf(m, " (%s offset: %08llx, size: %08llx, pages: %s",
|
||||
stringify_vma_type(vma),
|
||||
vma->node.start, vma->node.size,
|
||||
stringify_page_sizes(vma->page_sizes.gtt, NULL, 0));
|
||||
stringify_page_sizes(vma->resource->page_sizes_gtt,
|
||||
NULL, 0));
|
||||
if (i915_vma_is_ggtt(vma) || i915_vma_is_dpt(vma)) {
|
||||
switch (vma->ggtt_view.type) {
|
||||
case I915_GGTT_VIEW_NORMAL:
|
||||
|
@ -1040,9 +1040,9 @@ i915_vma_coredump_create(const struct intel_gt *gt,
|
||||
strcpy(dst->name, vsnap->name);
|
||||
dst->next = NULL;
|
||||
|
||||
dst->gtt_offset = vsnap->gtt_offset;
|
||||
dst->gtt_size = vsnap->gtt_size;
|
||||
dst->gtt_page_sizes = vsnap->page_sizes;
|
||||
dst->gtt_offset = vsnap->vma_resource->start;
|
||||
dst->gtt_size = vsnap->vma_resource->node_size;
|
||||
dst->gtt_page_sizes = vsnap->vma_resource->page_sizes_gtt;
|
||||
dst->unused = 0;
|
||||
|
||||
ret = -EINVAL;
|
||||
|
@ -298,7 +298,7 @@ static void __vma_bind(struct dma_fence_work *work)
|
||||
struct i915_vma *vma = vw->vma;
|
||||
|
||||
vma->ops->bind_vma(vw->vm, &vw->stash,
|
||||
vma, vw->cache_level, vw->flags);
|
||||
vma->resource, vw->cache_level, vw->flags);
|
||||
}
|
||||
|
||||
static void __vma_release(struct dma_fence_work *work)
|
||||
@ -375,6 +375,21 @@ static int i915_vma_verify_bind_complete(struct i915_vma *vma)
|
||||
#define i915_vma_verify_bind_complete(_vma) 0
|
||||
#endif
|
||||
|
||||
I915_SELFTEST_EXPORT void
|
||||
i915_vma_resource_init_from_vma(struct i915_vma_resource *vma_res,
|
||||
struct i915_vma *vma)
|
||||
{
|
||||
struct drm_i915_gem_object *obj = vma->obj;
|
||||
|
||||
i915_vma_resource_init(vma_res, vma->pages, &vma->page_sizes,
|
||||
i915_gem_object_is_readonly(obj),
|
||||
i915_gem_object_is_lmem(obj),
|
||||
vma->private,
|
||||
vma->node.start,
|
||||
vma->node.size,
|
||||
vma->size);
|
||||
}
|
||||
|
||||
/**
|
||||
* i915_vma_bind - Sets up PTEs for an VMA in it's corresponding address space.
|
||||
* @vma: VMA to map
|
||||
@ -432,7 +447,7 @@ int i915_vma_bind(struct i915_vma *vma,
|
||||
GEM_WARN_ON(!vma_flags);
|
||||
kfree(vma_res);
|
||||
} else {
|
||||
i915_vma_resource_init(vma_res);
|
||||
i915_vma_resource_init_from_vma(vma_res, vma);
|
||||
vma->resource = vma_res;
|
||||
}
|
||||
trace_i915_vma_bind(vma, bind_flags);
|
||||
@ -472,7 +487,8 @@ int i915_vma_bind(struct i915_vma *vma,
|
||||
if (ret)
|
||||
return ret;
|
||||
}
|
||||
vma->ops->bind_vma(vma->vm, NULL, vma, cache_level, bind_flags);
|
||||
vma->ops->bind_vma(vma->vm, NULL, vma->resource, cache_level,
|
||||
bind_flags);
|
||||
}
|
||||
|
||||
atomic_or(bind_flags, &vma->flags);
|
||||
@ -1723,7 +1739,7 @@ void __i915_vma_evict(struct i915_vma *vma)
|
||||
|
||||
if (likely(atomic_read(&vma->vm->open))) {
|
||||
trace_i915_vma_unbind(vma);
|
||||
vma->ops->unbind_vma(vma->vm, vma);
|
||||
vma->ops->unbind_vma(vma->vm, vma->resource);
|
||||
}
|
||||
atomic_and(~(I915_VMA_BIND_MASK | I915_VMA_ERROR | I915_VMA_GGTT_WRITE),
|
||||
&vma->flags);
|
||||
|
@ -339,12 +339,6 @@ void __iomem *i915_vma_pin_iomap(struct i915_vma *vma);
|
||||
*/
|
||||
void i915_vma_unpin_iomap(struct i915_vma *vma);
|
||||
|
||||
static inline struct page *i915_vma_first_page(struct i915_vma *vma)
|
||||
{
|
||||
GEM_BUG_ON(!vma->pages);
|
||||
return sg_page(vma->pages->sgl);
|
||||
}
|
||||
|
||||
/**
|
||||
* i915_vma_pin_fence - pin fencing state
|
||||
* @vma: vma to pin fencing for
|
||||
@ -445,6 +439,11 @@ i915_vma_get_current_resource(struct i915_vma *vma)
|
||||
return i915_vma_resource_get(vma->resource);
|
||||
}
|
||||
|
||||
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
|
||||
void i915_vma_resource_init_from_vma(struct i915_vma_resource *vma_res,
|
||||
struct i915_vma *vma);
|
||||
#endif
|
||||
|
||||
void i915_vma_module_exit(void);
|
||||
int i915_vma_module_init(void);
|
||||
|
||||
|
@ -23,15 +23,12 @@ static struct dma_fence_ops unbind_fence_ops = {
|
||||
};
|
||||
|
||||
/**
|
||||
* i915_vma_resource_init - Initialize a vma resource.
|
||||
* __i915_vma_resource_init - Initialize a vma resource.
|
||||
* @vma_res: The vma resource to initialize
|
||||
*
|
||||
* Initializes a vma resource allocated using i915_vma_resource_alloc().
|
||||
* The reason for having separate allocate and initialize function is that
|
||||
* initialization may need to be performed from under a lock where
|
||||
* allocation is not allowed.
|
||||
* Initializes the private members of a vma resource.
|
||||
*/
|
||||
void i915_vma_resource_init(struct i915_vma_resource *vma_res)
|
||||
void __i915_vma_resource_init(struct i915_vma_resource *vma_res)
|
||||
{
|
||||
spin_lock_init(&vma_res->lock);
|
||||
dma_fence_init(&vma_res->unbind_fence, &unbind_fence_ops,
|
||||
|
@ -9,6 +9,25 @@
|
||||
#include <linux/dma-fence.h>
|
||||
#include <linux/refcount.h>
|
||||
|
||||
#include "i915_gem.h"
|
||||
|
||||
struct i915_page_sizes {
|
||||
/**
|
||||
* The sg mask of the pages sg_table. i.e the mask of
|
||||
* the lengths for each sg entry.
|
||||
*/
|
||||
unsigned int phys;
|
||||
|
||||
/**
|
||||
* The gtt page sizes we are allowed to use given the
|
||||
* sg mask and the supported page sizes. This will
|
||||
* express the smallest unit we can use for the whole
|
||||
* object, as well as the larger sizes we may be able
|
||||
* to use opportunistically.
|
||||
*/
|
||||
unsigned int sg;
|
||||
};
|
||||
|
||||
/**
|
||||
* struct i915_vma_resource - Snapshotted unbind information.
|
||||
* @unbind_fence: Fence to mark unbinding complete. Note that this fence
|
||||
@ -19,6 +38,13 @@
|
||||
* @hold_count: Number of holders blocking the fence from finishing.
|
||||
* The vma itself is keeping a hold, which is released when unbind
|
||||
* is scheduled.
|
||||
* @private: Bind backend private info.
|
||||
* @start: Offset into the address space of bind range start.
|
||||
* @node_size: Size of the allocated range manager node.
|
||||
* @vma_size: Bind size.
|
||||
* @page_sizes_gtt: Resulting page sizes from the bind operation.
|
||||
* @bound_flags: Flags indicating binding status.
|
||||
* @allocated: Backend private data. TODO: Should move into @private.
|
||||
*
|
||||
* The lifetime of a struct i915_vma_resource is from a binding request to
|
||||
* the actual possible asynchronous unbind has completed.
|
||||
@ -28,6 +54,32 @@ struct i915_vma_resource {
|
||||
/* See above for description of the lock. */
|
||||
spinlock_t lock;
|
||||
refcount_t hold_count;
|
||||
|
||||
/**
|
||||
* struct i915_vma_bindinfo - Information needed for async bind
|
||||
* only but that can be dropped after the bind has taken place.
|
||||
* Consider making this a separate argument to the bind_vma
|
||||
* op, coalescing with other arguments like vm, stash, cache_level
|
||||
* and flags
|
||||
* @pages: The pages sg-table.
|
||||
* @page_sizes: Page sizes of the pages.
|
||||
* @readonly: Whether the vma should be bound read-only.
|
||||
* @lmem: Whether the vma points to lmem.
|
||||
*/
|
||||
struct i915_vma_bindinfo {
|
||||
struct sg_table *pages;
|
||||
struct i915_page_sizes page_sizes;
|
||||
bool readonly:1;
|
||||
bool lmem:1;
|
||||
} bi;
|
||||
|
||||
void *private;
|
||||
u64 start;
|
||||
u64 node_size;
|
||||
u64 vma_size;
|
||||
u32 page_sizes_gtt;
|
||||
u32 bound_flags;
|
||||
bool allocated:1;
|
||||
};
|
||||
|
||||
bool i915_vma_resource_hold(struct i915_vma_resource *vma_res,
|
||||
@ -40,6 +92,8 @@ struct i915_vma_resource *i915_vma_resource_alloc(void);
|
||||
|
||||
struct dma_fence *i915_vma_resource_unbind(struct i915_vma_resource *vma_res);
|
||||
|
||||
void __i915_vma_resource_init(struct i915_vma_resource *vma_res);
|
||||
|
||||
/**
|
||||
* i915_vma_resource_get - Take a reference on a vma resource
|
||||
* @vma_res: The vma resource on which to take a reference.
|
||||
@ -62,8 +116,47 @@ static inline void i915_vma_resource_put(struct i915_vma_resource *vma_res)
|
||||
dma_fence_put(&vma_res->unbind_fence);
|
||||
}
|
||||
|
||||
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
|
||||
void i915_vma_resource_init(struct i915_vma_resource *vma_res);
|
||||
#endif
|
||||
/**
|
||||
* i915_vma_resource_init - Initialize a vma resource.
|
||||
* @vma_res: The vma resource to initialize
|
||||
* @pages: The pages sg-table.
|
||||
* @page_sizes: Page sizes of the pages.
|
||||
* @readonly: Whether the vma should be bound read-only.
|
||||
* @lmem: Whether the vma points to lmem.
|
||||
* @private: Bind backend private info.
|
||||
* @start: Offset into the address space of bind range start.
|
||||
* @node_size: Size of the allocated range manager node.
|
||||
* @size: Bind size.
|
||||
*
|
||||
* Initializes a vma resource allocated using i915_vma_resource_alloc().
|
||||
* The reason for having separate allocate and initialize function is that
|
||||
* initialization may need to be performed from under a lock where
|
||||
* allocation is not allowed.
|
||||
*/
|
||||
static inline void i915_vma_resource_init(struct i915_vma_resource *vma_res,
|
||||
struct sg_table *pages,
|
||||
const struct i915_page_sizes *page_sizes,
|
||||
bool readonly,
|
||||
bool lmem,
|
||||
void *private,
|
||||
u64 start,
|
||||
u64 node_size,
|
||||
u64 size)
|
||||
{
|
||||
__i915_vma_resource_init(vma_res);
|
||||
vma_res->bi.pages = pages;
|
||||
vma_res->bi.page_sizes = *page_sizes;
|
||||
vma_res->bi.readonly = readonly;
|
||||
vma_res->bi.lmem = lmem;
|
||||
vma_res->private = private;
|
||||
vma_res->start = start;
|
||||
vma_res->node_size = node_size;
|
||||
vma_res->vma_size = size;
|
||||
}
|
||||
|
||||
static inline void i915_vma_resource_fini(struct i915_vma_resource *vma_res)
|
||||
{
|
||||
GEM_BUG_ON(refcount_read(&vma_res->hold_count) != 1);
|
||||
}
|
||||
|
||||
#endif
|
||||
|
@ -24,11 +24,7 @@ void i915_vma_snapshot_init(struct i915_vma_snapshot *vsnap,
|
||||
assert_object_held(vma->obj);
|
||||
|
||||
vsnap->name = name;
|
||||
vsnap->size = vma->size;
|
||||
vsnap->obj_size = vma->obj->base.size;
|
||||
vsnap->gtt_offset = vma->node.start;
|
||||
vsnap->gtt_size = vma->node.size;
|
||||
vsnap->page_sizes = vma->page_sizes.gtt;
|
||||
vsnap->pages = vma->pages;
|
||||
vsnap->pages_rsgt = NULL;
|
||||
vsnap->mr = NULL;
|
||||
|
@ -23,31 +23,23 @@ struct sg_table;
|
||||
|
||||
/**
|
||||
* struct i915_vma_snapshot - Snapshot of vma metadata.
|
||||
* @size: The vma size in bytes.
|
||||
* @obj_size: The size of the underlying object in bytes.
|
||||
* @gtt_offset: The gtt offset the vma is bound to.
|
||||
* @gtt_size: The size in bytes allocated for the vma in the GTT.
|
||||
* @pages: The struct sg_table pointing to the pages bound.
|
||||
* @pages_rsgt: The refcounted sg_table holding the reference for @pages if any.
|
||||
* @mr: The memory region pointed for the pages bound.
|
||||
* @kref: Reference for this structure.
|
||||
* @vma_resource: Pointer to the vma resource representing the vma binding.
|
||||
* @page_sizes: The vma GTT page sizes information.
|
||||
* @onstack: Whether the structure shouldn't be freed on final put.
|
||||
* @present: Whether the structure is present and initialized.
|
||||
*/
|
||||
struct i915_vma_snapshot {
|
||||
const char *name;
|
||||
size_t size;
|
||||
size_t obj_size;
|
||||
size_t gtt_offset;
|
||||
size_t gtt_size;
|
||||
struct sg_table *pages;
|
||||
struct i915_refct_sgt *pages_rsgt;
|
||||
struct intel_memory_region *mr;
|
||||
struct kref kref;
|
||||
struct i915_vma_resource *vma_resource;
|
||||
u32 page_sizes;
|
||||
bool onstack:1;
|
||||
bool present:1;
|
||||
};
|
||||
|
@ -240,22 +240,20 @@ struct i915_vma {
|
||||
|
||||
#define I915_VMA_BIND_MASK (I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND)
|
||||
|
||||
#define I915_VMA_ALLOC_BIT 12
|
||||
|
||||
#define I915_VMA_ERROR_BIT 13
|
||||
#define I915_VMA_ERROR_BIT 12
|
||||
#define I915_VMA_ERROR ((int)BIT(I915_VMA_ERROR_BIT))
|
||||
|
||||
#define I915_VMA_GGTT_BIT 14
|
||||
#define I915_VMA_CAN_FENCE_BIT 15
|
||||
#define I915_VMA_USERFAULT_BIT 16
|
||||
#define I915_VMA_GGTT_WRITE_BIT 17
|
||||
#define I915_VMA_GGTT_BIT 13
|
||||
#define I915_VMA_CAN_FENCE_BIT 14
|
||||
#define I915_VMA_USERFAULT_BIT 15
|
||||
#define I915_VMA_GGTT_WRITE_BIT 16
|
||||
|
||||
#define I915_VMA_GGTT ((int)BIT(I915_VMA_GGTT_BIT))
|
||||
#define I915_VMA_CAN_FENCE ((int)BIT(I915_VMA_CAN_FENCE_BIT))
|
||||
#define I915_VMA_USERFAULT ((int)BIT(I915_VMA_USERFAULT_BIT))
|
||||
#define I915_VMA_GGTT_WRITE ((int)BIT(I915_VMA_GGTT_WRITE_BIT))
|
||||
|
||||
#define I915_VMA_SCANOUT_BIT 18
|
||||
#define I915_VMA_SCANOUT_BIT 17
|
||||
#define I915_VMA_SCANOUT ((int)BIT(I915_VMA_SCANOUT_BIT))
|
||||
|
||||
struct i915_active active;
|
||||
|
@ -239,11 +239,11 @@ static int lowlevel_hole(struct i915_address_space *vm,
|
||||
unsigned long end_time)
|
||||
{
|
||||
I915_RND_STATE(seed_prng);
|
||||
struct i915_vma *mock_vma;
|
||||
struct i915_vma_resource *mock_vma_res;
|
||||
unsigned int size;
|
||||
|
||||
mock_vma = kzalloc(sizeof(*mock_vma), GFP_KERNEL);
|
||||
if (!mock_vma)
|
||||
mock_vma_res = kzalloc(sizeof(*mock_vma_res), GFP_KERNEL);
|
||||
if (!mock_vma_res)
|
||||
return -ENOMEM;
|
||||
|
||||
/* Keep creating larger objects until one cannot fit into the hole */
|
||||
@ -269,7 +269,7 @@ static int lowlevel_hole(struct i915_address_space *vm,
|
||||
break;
|
||||
} while (count >>= 1);
|
||||
if (!count) {
|
||||
kfree(mock_vma);
|
||||
kfree(mock_vma_res);
|
||||
return -ENOMEM;
|
||||
}
|
||||
GEM_BUG_ON(!order);
|
||||
@ -343,12 +343,12 @@ alloc_vm_end:
|
||||
break;
|
||||
}
|
||||
|
||||
mock_vma->pages = obj->mm.pages;
|
||||
mock_vma->node.size = BIT_ULL(size);
|
||||
mock_vma->node.start = addr;
|
||||
mock_vma_res->bi.pages = obj->mm.pages;
|
||||
mock_vma_res->node_size = BIT_ULL(size);
|
||||
mock_vma_res->start = addr;
|
||||
|
||||
with_intel_runtime_pm(vm->gt->uncore->rpm, wakeref)
|
||||
vm->insert_entries(vm, mock_vma,
|
||||
vm->insert_entries(vm, mock_vma_res,
|
||||
I915_CACHE_NONE, 0);
|
||||
}
|
||||
count = n;
|
||||
@ -371,7 +371,7 @@ alloc_vm_end:
|
||||
cleanup_freed_objects(vm->i915);
|
||||
}
|
||||
|
||||
kfree(mock_vma);
|
||||
kfree(mock_vma_res);
|
||||
return 0;
|
||||
}
|
||||
|
||||
@ -1280,6 +1280,7 @@ static void track_vma_bind(struct i915_vma *vma)
|
||||
atomic_set(&vma->pages_count, I915_VMA_PAGES_ACTIVE);
|
||||
__i915_gem_object_pin_pages(obj);
|
||||
vma->pages = obj->mm.pages;
|
||||
vma->resource->bi.pages = vma->pages;
|
||||
|
||||
mutex_lock(&vma->vm->mutex);
|
||||
list_add_tail(&vma->vm_link, &vma->vm->bound_list);
|
||||
@ -1354,7 +1355,7 @@ static int reserve_gtt_with_resource(struct i915_vma *vma, u64 offset)
|
||||
obj->cache_level,
|
||||
0);
|
||||
if (!err) {
|
||||
i915_vma_resource_init(vma_res);
|
||||
i915_vma_resource_init_from_vma(vma_res, vma);
|
||||
vma->resource = vma_res;
|
||||
} else {
|
||||
kfree(vma_res);
|
||||
@ -1533,7 +1534,7 @@ static int insert_gtt_with_resource(struct i915_vma *vma)
|
||||
err = i915_gem_gtt_insert(vm, &vma->node, obj->base.size, 0,
|
||||
obj->cache_level, 0, vm->total, 0);
|
||||
if (!err) {
|
||||
i915_vma_resource_init(vma_res);
|
||||
i915_vma_resource_init_from_vma(vma_res, vma);
|
||||
vma->resource = vma_res;
|
||||
} else {
|
||||
kfree(vma_res);
|
||||
@ -1960,6 +1961,7 @@ static int igt_cs_tlb(void *arg)
|
||||
struct i915_vm_pt_stash stash = {};
|
||||
struct i915_request *rq;
|
||||
struct i915_gem_ww_ctx ww;
|
||||
struct i915_vma_resource *vma_res;
|
||||
u64 offset;
|
||||
|
||||
offset = igt_random_offset(&prng,
|
||||
@ -1980,6 +1982,13 @@ static int igt_cs_tlb(void *arg)
|
||||
if (err)
|
||||
goto end;
|
||||
|
||||
vma_res = i915_vma_resource_alloc();
|
||||
if (IS_ERR(vma_res)) {
|
||||
i915_vma_put_pages(vma);
|
||||
err = PTR_ERR(vma_res);
|
||||
goto end;
|
||||
}
|
||||
|
||||
i915_gem_ww_ctx_init(&ww, false);
|
||||
retry:
|
||||
err = i915_vm_lock_objects(vm, &ww);
|
||||
@ -2001,33 +2010,41 @@ end_ww:
|
||||
goto retry;
|
||||
}
|
||||
i915_gem_ww_ctx_fini(&ww);
|
||||
if (err)
|
||||
if (err) {
|
||||
kfree(vma_res);
|
||||
goto end;
|
||||
}
|
||||
|
||||
i915_vma_resource_init_from_vma(vma_res, vma);
|
||||
/* Prime the TLB with the dummy pages */
|
||||
for (i = 0; i < count; i++) {
|
||||
vma->node.start = offset + i * PAGE_SIZE;
|
||||
vm->insert_entries(vm, vma, I915_CACHE_NONE, 0);
|
||||
vma_res->start = offset + i * PAGE_SIZE;
|
||||
vm->insert_entries(vm, vma_res, I915_CACHE_NONE,
|
||||
0);
|
||||
|
||||
rq = submit_batch(ce, vma->node.start);
|
||||
rq = submit_batch(ce, vma_res->start);
|
||||
if (IS_ERR(rq)) {
|
||||
err = PTR_ERR(rq);
|
||||
i915_vma_resource_fini(vma_res);
|
||||
kfree(vma_res);
|
||||
goto end;
|
||||
}
|
||||
i915_request_put(rq);
|
||||
}
|
||||
|
||||
i915_vma_resource_fini(vma_res);
|
||||
i915_vma_put_pages(vma);
|
||||
|
||||
err = context_sync(ce);
|
||||
if (err) {
|
||||
pr_err("%s: dummy setup timed out\n",
|
||||
ce->engine->name);
|
||||
kfree(vma_res);
|
||||
goto end;
|
||||
}
|
||||
|
||||
vma = i915_vma_instance(act, vm, NULL);
|
||||
if (IS_ERR(vma)) {
|
||||
kfree(vma_res);
|
||||
err = PTR_ERR(vma);
|
||||
goto end;
|
||||
}
|
||||
@ -2035,19 +2052,22 @@ end_ww:
|
||||
i915_gem_object_lock(act, NULL);
|
||||
err = i915_vma_get_pages(vma);
|
||||
i915_gem_object_unlock(act);
|
||||
if (err)
|
||||
if (err) {
|
||||
kfree(vma_res);
|
||||
goto end;
|
||||
}
|
||||
|
||||
i915_vma_resource_init_from_vma(vma_res, vma);
|
||||
/* Replace the TLB with target batches */
|
||||
for (i = 0; i < count; i++) {
|
||||
struct i915_request *rq;
|
||||
u32 *cs = batch + i * 64 / sizeof(*cs);
|
||||
u64 addr;
|
||||
|
||||
vma->node.start = offset + i * PAGE_SIZE;
|
||||
vm->insert_entries(vm, vma, I915_CACHE_NONE, 0);
|
||||
vma_res->start = offset + i * PAGE_SIZE;
|
||||
vm->insert_entries(vm, vma_res, I915_CACHE_NONE, 0);
|
||||
|
||||
addr = vma->node.start + i * 64;
|
||||
addr = vma_res->start + i * 64;
|
||||
cs[4] = MI_NOOP;
|
||||
cs[6] = lower_32_bits(addr);
|
||||
cs[7] = upper_32_bits(addr);
|
||||
@ -2056,6 +2076,8 @@ end_ww:
|
||||
rq = submit_batch(ce, addr);
|
||||
if (IS_ERR(rq)) {
|
||||
err = PTR_ERR(rq);
|
||||
i915_vma_resource_fini(vma_res);
|
||||
kfree(vma_res);
|
||||
goto end;
|
||||
}
|
||||
|
||||
@ -2072,6 +2094,8 @@ end_ww:
|
||||
}
|
||||
end_spin(batch, count - 1);
|
||||
|
||||
i915_vma_resource_fini(vma_res);
|
||||
kfree(vma_res);
|
||||
i915_vma_put_pages(vma);
|
||||
|
||||
err = context_sync(ce);
|
||||
|
@ -33,23 +33,23 @@ static void mock_insert_page(struct i915_address_space *vm,
|
||||
}
|
||||
|
||||
static void mock_insert_entries(struct i915_address_space *vm,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level level, u32 flags)
|
||||
{
|
||||
}
|
||||
|
||||
static void mock_bind_ppgtt(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
GEM_BUG_ON(flags & I915_VMA_GLOBAL_BIND);
|
||||
set_bit(I915_VMA_LOCAL_BIND_BIT, __i915_vma_flags(vma));
|
||||
vma_res->bound_flags |= flags;
|
||||
}
|
||||
|
||||
static void mock_unbind_ppgtt(struct i915_address_space *vm,
|
||||
struct i915_vma *vma)
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
}
|
||||
|
||||
@ -93,14 +93,14 @@ struct i915_ppgtt *mock_ppgtt(struct drm_i915_private *i915, const char *name)
|
||||
|
||||
static void mock_bind_ggtt(struct i915_address_space *vm,
|
||||
struct i915_vm_pt_stash *stash,
|
||||
struct i915_vma *vma,
|
||||
struct i915_vma_resource *vma_res,
|
||||
enum i915_cache_level cache_level,
|
||||
u32 flags)
|
||||
{
|
||||
}
|
||||
|
||||
static void mock_unbind_ggtt(struct i915_address_space *vm,
|
||||
struct i915_vma *vma)
|
||||
struct i915_vma_resource *vma_res)
|
||||
{
|
||||
}
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user