On Wed, Jun 7, 2017 at 3:17 PM, Tom Lendacky <thomas.lendacky@xxxxxxx> wrote:
> The IOMMU is programmed with physical addresses for the various tables
> and buffers that are used to communicate between the device and the
> driver. When the driver allocates this memory it is encrypted. In order
> for the IOMMU to access the memory as encrypted the encryption mask needs
> to be included in these physical addresses during configuration.
>
> The PTE entries created by the IOMMU should also include the encryption
> mask so that when the device behind the IOMMU performs a DMA, the DMA
> will be performed to encrypted memory.
>
> Signed-off-by: Tom Lendacky <thomas.lendacky@xxxxxxx>
> ---
>  arch/x86/include/asm/mem_encrypt.h |  7 +++++++
>  arch/x86/mm/mem_encrypt.c          | 30 ++++++++++++++++++++++++++++++
>  drivers/iommu/amd_iommu.c          | 36 +++++++++++++++++++-----------------
>  drivers/iommu/amd_iommu_init.c     | 18 ++++++++++++------
>  drivers/iommu/amd_iommu_proto.h    | 10 ++++++++++
>  drivers/iommu/amd_iommu_types.h    |  2 +-
>  include/asm-generic/mem_encrypt.h  |  5 +++++
>  7 files changed, 84 insertions(+), 24 deletions(-)
>
> diff --git a/arch/x86/include/asm/mem_encrypt.h b/arch/x86/include/asm/mem_encrypt.h
> index c7a2525..d86e544 100644
> --- a/arch/x86/include/asm/mem_encrypt.h
> +++ b/arch/x86/include/asm/mem_encrypt.h
> @@ -31,6 +31,8 @@ void __init sme_early_decrypt(resource_size_t paddr,
>
>  void __init sme_early_init(void);
>
> +bool sme_iommu_supported(void);
> +
>  /* Architecture __weak replacement functions */
>  void __init mem_encrypt_init(void);
>
> @@ -62,6 +64,11 @@ static inline void __init sme_early_init(void)
>  {
>  }
>
> +static inline bool sme_iommu_supported(void)
> +{
> +        return true;
> +}
> +
>  #endif /* CONFIG_AMD_MEM_ENCRYPT */
>
>  static inline bool sme_active(void)
> diff --git a/arch/x86/mm/mem_encrypt.c b/arch/x86/mm/mem_encrypt.c
> index 5d7c51d..018b58a 100644
> --- a/arch/x86/mm/mem_encrypt.c
> +++ b/arch/x86/mm/mem_encrypt.c
> @@ -197,6 +197,36 @@ void __init sme_early_init(void)
>                  protection_map[i] = pgprot_encrypted(protection_map[i]);
>  }
>
> +bool sme_iommu_supported(void)
> +{
> +        struct cpuinfo_x86 *c = &boot_cpu_data;
> +
> +        if (!sme_me_mask || (c->x86 != 0x17))
> +                return true;
> +
> +        /* For Fam17h, a specific level of support is required */
> +        switch (c->microcode & 0xf000) {
> +        case 0x0000:
> +                return false;
> +        case 0x1000:
> +                switch (c->microcode & 0x0f00) {
> +                case 0x0000:
> +                        return false;
> +                case 0x0100:
> +                        if ((c->microcode & 0xff) < 0x26)
> +                                return false;
> +                        break;
> +                case 0x0200:
> +                        if ((c->microcode & 0xff) < 0x05)
> +                                return false;
> +                        break;
> +                }
> +                break;
> +        }
> +
> +        return true;
> +}
> +
>  /* Architecture __weak replacement functions */
>  void __init mem_encrypt_init(void)
>  {
> diff --git a/drivers/iommu/amd_iommu.c b/drivers/iommu/amd_iommu.c
> index 63cacf5..94eb130 100644
> --- a/drivers/iommu/amd_iommu.c
> +++ b/drivers/iommu/amd_iommu.c
> @@ -544,7 +544,7 @@ static void dump_dte_entry(u16 devid)
>
>  static void dump_command(unsigned long phys_addr)
>  {
> -        struct iommu_cmd *cmd = phys_to_virt(phys_addr);
> +        struct iommu_cmd *cmd = iommu_phys_to_virt(phys_addr);
>          int i;
>
>          for (i = 0; i < 4; ++i)
> @@ -863,13 +863,15 @@ static void copy_cmd_to_buffer(struct amd_iommu *iommu,
>          writel(tail, iommu->mmio_base + MMIO_CMD_TAIL_OFFSET);
>  }
>
> -static void build_completion_wait(struct iommu_cmd *cmd, u64 address)
> +static void build_completion_wait(struct iommu_cmd *cmd, volatile u64 *sem)
>  {
> +        u64 address = iommu_virt_to_phys((void *)sem);
> +
>          WARN_ON(address & 0x7ULL);
>
>          memset(cmd, 0, sizeof(*cmd));
> -        cmd->data[0] = lower_32_bits(__pa(address)) | CMD_COMPL_WAIT_STORE_MASK;
> -        cmd->data[1] = upper_32_bits(__pa(address));
> +        cmd->data[0] = lower_32_bits(address) | CMD_COMPL_WAIT_STORE_MASK;
> +        cmd->data[1] = upper_32_bits(address);
>          cmd->data[2] = 1;
>          CMD_SET_TYPE(cmd, CMD_COMPL_WAIT);
>  }
> @@ -1033,7 +1035,7 @@ static int __iommu_queue_command_sync(struct amd_iommu *iommu,
>
>                  iommu->cmd_sem = 0;
>
> -                build_completion_wait(&sync_cmd, (u64)&iommu->cmd_sem);
> +                build_completion_wait(&sync_cmd, &iommu->cmd_sem);
>                  copy_cmd_to_buffer(iommu, &sync_cmd, tail);
>
>                  if ((ret = wait_on_sem(&iommu->cmd_sem)) != 0)
> @@ -1083,7 +1085,7 @@ static int iommu_completion_wait(struct amd_iommu *iommu)
>                  return 0;
>
>
> -        build_completion_wait(&cmd, (u64)&iommu->cmd_sem);
> +        build_completion_wait(&cmd, &iommu->cmd_sem);
>
>          spin_lock_irqsave(&iommu->lock, flags);
>
> @@ -1328,7 +1330,7 @@ static bool increase_address_space(struct protection_domain *domain,
>                  return false;
>
>          *pte             = PM_LEVEL_PDE(domain->mode,
> -                                        virt_to_phys(domain->pt_root));
> +                                        iommu_virt_to_phys(domain->pt_root));
>          domain->pt_root  = pte;
>          domain->mode    += 1;
>          domain->updated  = true;
> @@ -1365,7 +1367,7 @@ static u64 *alloc_pte(struct protection_domain *domain,
>                          if (!page)
>                                  return NULL;
>
> -                        __npte = PM_LEVEL_PDE(level, virt_to_phys(page));
> +                        __npte = PM_LEVEL_PDE(level, iommu_virt_to_phys(page));
>
>                          /* pte could have been changed somewhere. */
>                          if (cmpxchg64(pte, __pte, __npte) != __pte) {
> @@ -1481,10 +1483,10 @@ static int iommu_map_page(struct protection_domain *dom,
>                          return -EBUSY;
>
>          if (count > 1) {
> -                __pte = PAGE_SIZE_PTE(phys_addr, page_size);
> +                __pte = PAGE_SIZE_PTE(__sme_set(phys_addr), page_size);
>                  __pte |= PM_LEVEL_ENC(7) | IOMMU_PTE_P | IOMMU_PTE_FC;
>          } else
> -                __pte = phys_addr | IOMMU_PTE_P | IOMMU_PTE_FC;
> +                __pte = __sme_set(phys_addr) | IOMMU_PTE_P | IOMMU_PTE_FC;
>
>          if (prot & IOMMU_PROT_IR)
>                  __pte |= IOMMU_PTE_IR;
> @@ -1700,7 +1702,7 @@ static void free_gcr3_tbl_level1(u64 *tbl)
>                  if (!(tbl[i] & GCR3_VALID))
>                          continue;
>
> -                ptr = __va(tbl[i] & PAGE_MASK);
> +                ptr = iommu_phys_to_virt(tbl[i] & PAGE_MASK);
>
>                  free_page((unsigned long)ptr);
>          }
> @@ -1715,7 +1717,7 @@ static void free_gcr3_tbl_level2(u64 *tbl)
>                  if (!(tbl[i] & GCR3_VALID))
>                          continue;
>
> -                ptr = __va(tbl[i] & PAGE_MASK);
> +                ptr = iommu_phys_to_virt(tbl[i] & PAGE_MASK);
>
>                  free_gcr3_tbl_level1(ptr);
>          }
> @@ -1807,7 +1809,7 @@ static void set_dte_entry(u16 devid, struct protection_domain *domain, bool ats)
>          u64 flags = 0;
>
>          if (domain->mode != PAGE_MODE_NONE)
> -                pte_root = virt_to_phys(domain->pt_root);
> +                pte_root = iommu_virt_to_phys(domain->pt_root);
>
>          pte_root |= (domain->mode & DEV_ENTRY_MODE_MASK)
>                      << DEV_ENTRY_MODE_SHIFT;
> @@ -1819,7 +1821,7 @@ static void set_dte_entry(u16 devid, struct protection_domain *domain, bool ats)
>                  flags |= DTE_FLAG_IOTLB;
>
>          if (domain->flags & PD_IOMMUV2_MASK) {
> -                u64 gcr3 = __pa(domain->gcr3_tbl);
> +                u64 gcr3 = iommu_virt_to_phys(domain->gcr3_tbl);
>                  u64 glx  = domain->glx;
>                  u64 tmp;
>
> @@ -3470,10 +3472,10 @@ static u64 *__get_gcr3_pte(u64 *root, int level, int pasid, bool alloc)
>                          if (root == NULL)
>                                  return NULL;
>
> -                        *pte = __pa(root) | GCR3_VALID;
> +                        *pte = iommu_virt_to_phys(root) | GCR3_VALID;
>                  }
>
> -                root = __va(*pte & PAGE_MASK);
> +                root = iommu_phys_to_virt(*pte & PAGE_MASK);
>
>                  level -= 1;
>          }
> @@ -3652,7 +3654,7 @@ static void set_dte_irq_entry(u16 devid, struct irq_remap_table *table)
>
>          dte     = amd_iommu_dev_table[devid].data[2];
>          dte     &= ~DTE_IRQ_PHYS_ADDR_MASK;
> -        dte     |= virt_to_phys(table->table);
> +        dte     |= iommu_virt_to_phys(table->table);
>          dte     |= DTE_IRQ_REMAP_INTCTL;
>          dte     |= DTE_IRQ_TABLE_LEN;
>          dte     |= DTE_IRQ_REMAP_ENABLE;
> diff --git a/drivers/iommu/amd_iommu_init.c b/drivers/iommu/amd_iommu_init.c
> index 5a11328..2870a6b 100644
> --- a/drivers/iommu/amd_iommu_init.c
> +++ b/drivers/iommu/amd_iommu_init.c
> @@ -29,6 +29,7 @@
>  #include <linux/export.h>
>  #include <linux/iommu.h>
>  #include <linux/kmemleak.h>
> +#include <linux/mem_encrypt.h>
>  #include <asm/pci-direct.h>
>  #include <asm/iommu.h>
>  #include <asm/gart.h>
> @@ -346,7 +347,7 @@ static void iommu_set_device_table(struct amd_iommu *iommu)
>
>          BUG_ON(iommu->mmio_base == NULL);
>
> -        entry = virt_to_phys(amd_iommu_dev_table);
> +        entry = iommu_virt_to_phys(amd_iommu_dev_table);
>          entry |= (dev_table_size >> 12) - 1;
>          memcpy_toio(iommu->mmio_base + MMIO_DEV_TABLE_OFFSET,
>                      &entry, sizeof(entry));
> @@ -602,7 +603,7 @@ static void iommu_enable_command_buffer(struct amd_iommu *iommu)
>
>          BUG_ON(iommu->cmd_buf == NULL);
>
> -        entry = (u64)virt_to_phys(iommu->cmd_buf);
> +        entry = iommu_virt_to_phys(iommu->cmd_buf);
>          entry |= MMIO_CMD_SIZE_512;
>
>          memcpy_toio(iommu->mmio_base + MMIO_CMD_BUF_OFFSET,
> @@ -631,7 +632,7 @@ static void iommu_enable_event_buffer(struct amd_iommu *iommu)
>
>          BUG_ON(iommu->evt_buf == NULL);
>
> -        entry = (u64)virt_to_phys(iommu->evt_buf) | EVT_LEN_MASK;
> +        entry = iommu_virt_to_phys(iommu->evt_buf) | EVT_LEN_MASK;
>
>          memcpy_toio(iommu->mmio_base + MMIO_EVT_BUF_OFFSET,
>                      &entry, sizeof(entry));
> @@ -664,7 +665,7 @@ static void iommu_enable_ppr_log(struct amd_iommu *iommu)
>          if (iommu->ppr_log == NULL)
>                  return;
>
> -        entry = (u64)virt_to_phys(iommu->ppr_log) | PPR_LOG_SIZE_512;
> +        entry = iommu_virt_to_phys(iommu->ppr_log) | PPR_LOG_SIZE_512;
>
>          memcpy_toio(iommu->mmio_base + MMIO_PPR_LOG_OFFSET,
>                      &entry, sizeof(entry));
> @@ -744,10 +745,10 @@ static int iommu_init_ga_log(struct amd_iommu *iommu)
>          if (!iommu->ga_log_tail)
>                  goto err_out;
>
> -        entry = (u64)virt_to_phys(iommu->ga_log) | GA_LOG_SIZE_512;
> +        entry = iommu_virt_to_phys(iommu->ga_log) | GA_LOG_SIZE_512;
>          memcpy_toio(iommu->mmio_base + MMIO_GA_LOG_BASE_OFFSET,
>                      &entry, sizeof(entry));
> -        entry = ((u64)virt_to_phys(iommu->ga_log) & 0xFFFFFFFFFFFFFULL) & ~7ULL;
> +        entry = (iommu_virt_to_phys(iommu->ga_log) & 0xFFFFFFFFFFFFFULL) & ~7ULL;
>          memcpy_toio(iommu->mmio_base + MMIO_GA_LOG_TAIL_OFFSET,
>                      &entry, sizeof(entry));
>          writel(0x00, iommu->mmio_base + MMIO_GA_HEAD_OFFSET);
> @@ -2552,6 +2553,11 @@ int __init amd_iommu_detect(void)
>          if (amd_iommu_disabled)
>                  return -ENODEV;
>
> +        if (!sme_iommu_supported()) {
> +                pr_notice("AMD-Vi: IOMMU not supported when SME is active\n");
> +                return -ENODEV;
> +        }
> +
>          ret = iommu_go_to_state(IOMMU_IVRS_DETECTED);
>          if (ret)
>                  return ret;
> diff --git a/drivers/iommu/amd_iommu_proto.h b/drivers/iommu/amd_iommu_proto.h
> index 466260f..3f12fb2 100644
> --- a/drivers/iommu/amd_iommu_proto.h
> +++ b/drivers/iommu/amd_iommu_proto.h
> @@ -87,4 +87,14 @@ static inline bool iommu_feature(struct amd_iommu *iommu, u64 f)
>          return !!(iommu->features & f);
>  }
>
> +static inline u64 iommu_virt_to_phys(void *vaddr)
> +{
> +        return (u64)__sme_set(virt_to_phys(vaddr));
> +}
> +
> +static inline void *iommu_phys_to_virt(unsigned long paddr)
> +{
> +        return phys_to_virt(__sme_clr(paddr));
> +}
> +
>  #endif /* _ASM_X86_AMD_IOMMU_PROTO_H */
> diff --git a/drivers/iommu/amd_iommu_types.h b/drivers/iommu/amd_iommu_types.h
> index 4de8f41..3ce587d 100644
> --- a/drivers/iommu/amd_iommu_types.h
> +++ b/drivers/iommu/amd_iommu_types.h
> @@ -343,7 +343,7 @@
>
>  #define IOMMU_PAGE_MASK (((1ULL << 52) - 1) & ~0xfffULL)
>  #define IOMMU_PTE_PRESENT(pte) ((pte) & IOMMU_PTE_P)
> -#define IOMMU_PTE_PAGE(pte) (phys_to_virt((pte) & IOMMU_PAGE_MASK))
> +#define IOMMU_PTE_PAGE(pte) (iommu_phys_to_virt((pte) & IOMMU_PAGE_MASK))
>  #define IOMMU_PTE_MODE(pte) (((pte) >> 9) & 0x07)
>
>  #define IOMMU_PROT_MASK 0x03
> diff --git a/include/asm-generic/mem_encrypt.h b/include/asm-generic/mem_encrypt.h
> index fb02ff0..bbc49e1 100644
> --- a/include/asm-generic/mem_encrypt.h
> +++ b/include/asm-generic/mem_encrypt.h
> @@ -27,6 +27,11 @@ static inline u64 sme_dma_mask(void)
>          return 0ULL;
>  }
>
> +static inline bool sme_iommu_supported(void)
> +{
> +        return true;
> +}
> +
>  /*
>   * The __sme_set() and __sme_clr() macros are useful for adding or removing
>   * the encryption mask from a value (e.g. when dealing with pagetable

Hi Tom,

This sounds like a cool feature. I'm trying to test it on my Ryzen
system, but c->microcode & 0xf000 is evaluating to 0, so the IOMMU is
not being enabled. I'm using the latest microcode for AGESA 1.0.0.6,
revision 0x08001126. Does this work rely on a future microcode update,
or is there some other issue?

Thanks,
Sarnex
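
P.S. To rule out the version test itself, I pulled the switch logic out
of sme_iommu_supported() into a small userspace program (this is just my
own extraction for testing, not kernel code) and fed it my revision:

#include <stdbool.h>
#include <stdio.h>

/* Same microcode revision checks as the patch's sme_iommu_supported() */
static bool microcode_ok(unsigned int ucode)
{
        switch (ucode & 0xf000) {
        case 0x0000:
                return false;
        case 0x1000:
                switch (ucode & 0x0f00) {
                case 0x0000:
                        return false;
                case 0x0100:
                        if ((ucode & 0xff) < 0x26)
                                return false;
                        break;
                case 0x0200:
                        if ((ucode & 0xff) < 0x05)
                                return false;
                        break;
                }
                break;
        }

        return true;
}

int main(void)
{
        unsigned int ucode = 0x08001126;        /* my Ryzen revision */

        /* Prints "ucode & 0xf000 = 0x1000" -- non-zero */
        printf("ucode & 0xf000 = %#x\n", ucode & 0xf000);
        /* Prints "supported = 1" -- the checks pass for this revision */
        printf("supported = %d\n", microcode_ok(ucode));

        return 0;
}

So if c->microcode really held 0x08001126, the first mask would give
0x1000 and the function would return true. Seeing 0 instead makes me
wonder whether boot_cpu_data.microcode is even populated by the time
amd_iommu_detect() runs, since a zero value there would hit the
"case 0x0000: return false" path.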