[+Kent, Yong, Harish] This means updating page tables can invalidate page directories. You prepared amdgpu_cs for this. On our amd-kfd-staging branch amdgpu_amdkfd_gpuvm.c we will need an equivalent change when we pick up this patch. Currently we update page directories in vm_validate_pt_pd_bos. We'll have to split page directory update out of this function and invoke it separately after any page table updates. The series is Acked-by: Felix Kuehling <Felix.Kuehling at amd.com> Regards,  Felix On 2018-01-02 09:47 AM, Christian König wrote: > Update the PDEs after resetting the huge flag. > > Signed-off-by: Christian König <christian.koenig at amd.com> > --- > drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c | 60 ++++++++++------------------------ > 1 file changed, 18 insertions(+), 42 deletions(-) > > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c > index c1c5ccdee783..81505870eebc 100644 > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c > @@ -946,54 +946,38 @@ static void amdgpu_vm_handle_huge_pages(struct amdgpu_pte_update_params *p, > unsigned nptes, uint64_t dst, > uint64_t flags) > { > - bool use_cpu_update = (p->func == amdgpu_vm_cpu_set_ptes); > uint64_t pd_addr, pde; > > /* In the case of a mixed PT the PDE must point to it*/ > - if (p->adev->asic_type < CHIP_VEGA10 || p->src || > - nptes != AMDGPU_VM_PTE_COUNT(p->adev)) { > - dst = amdgpu_bo_gpu_offset(entry->base.bo); > - flags = AMDGPU_PTE_VALID; > - } else { > + if (p->adev->asic_type >= CHIP_VEGA10 && !p->src && > + nptes == AMDGPU_VM_PTE_COUNT(p->adev)) { > /* Set the huge page flag to stop scanning at this PDE */ > flags |= AMDGPU_PDE_PTE; > } > > - if (!entry->huge && !(flags & AMDGPU_PDE_PTE)) > + if (!(flags & AMDGPU_PDE_PTE)) { > + if (entry->huge) { > + /* Add the entry to the relocated list to update it. */ > + entry->huge = false; > + spin_lock(&p->vm->status_lock); > + list_move(&entry->base.vm_status, &p->vm->relocated); > + spin_unlock(&p->vm->status_lock); > + } > return; > - entry->huge = !!(flags & AMDGPU_PDE_PTE); > + } > > + entry->huge = true; > amdgpu_gart_get_vm_pde(p->adev, AMDGPU_VM_PDB0, > &dst, &flags); > > - if (use_cpu_update) { > - /* In case a huge page is replaced with a system > - * memory mapping, p->pages_addr != NULL and > - * amdgpu_vm_cpu_set_ptes would try to translate dst > - * through amdgpu_vm_map_gart. But dst is already a > - * GPU address (of the page table). Disable > - * amdgpu_vm_map_gart temporarily. > - */ > - dma_addr_t *tmp; > - > - tmp = p->pages_addr; > - p->pages_addr = NULL; > - > - pd_addr = (unsigned long)amdgpu_bo_kptr(parent->base.bo); > - pde = pd_addr + (entry - parent->entries) * 8; > - amdgpu_vm_cpu_set_ptes(p, pde, dst, 1, 0, flags); > - > - p->pages_addr = tmp; > - } else { > - if (parent->base.bo->shadow) { > - pd_addr = amdgpu_bo_gpu_offset(parent->base.bo->shadow); > - pde = pd_addr + (entry - parent->entries) * 8; > - amdgpu_vm_do_set_ptes(p, pde, dst, 1, 0, flags); > - } > - pd_addr = amdgpu_bo_gpu_offset(parent->base.bo); > + if (parent->base.bo->shadow) { > + pd_addr = amdgpu_bo_gpu_offset(parent->base.bo->shadow); > pde = pd_addr + (entry - parent->entries) * 8; > - amdgpu_vm_do_set_ptes(p, pde, dst, 1, 0, flags); > + p->func(p, pde, dst, 1, 0, flags); > } > + pd_addr = amdgpu_bo_gpu_offset(parent->base.bo); > + pde = pd_addr + (entry - parent->entries) * 8; > + p->func(p, pde, dst, 1, 0, flags); > } > > /** > @@ -1205,12 +1189,6 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, > /* padding, etc. */ > ndw = 64; > > - /* one PDE write for each huge page */ > - if (vm->root.base.bo->shadow) > - ndw += ((nptes >> adev->vm_manager.block_size) + 1) * 6 * 2; > - else > - ndw += ((nptes >> adev->vm_manager.block_size) + 1) * 6; > - > if (pages_addr) { > /* copy commands needed */ > ndw += ncmds * adev->vm_manager.vm_pte_funcs->copy_pte_num_dw; > @@ -1285,8 +1263,6 @@ static int amdgpu_vm_bo_update_mapping(struct amdgpu_device *adev, > > error_free: > amdgpu_job_free(job); > - amdgpu_vm_invalidate_level(adev, vm, &vm->root, > - adev->vm_manager.root_level); > return r; > } >