We have tlb_remove_tlb_entry() to indicate that a pte tlb entry should be flushed, but no corresponding API for a pmd entry. This isn't a problem so far because THP is only supported on x86 currently, and tlb_flush() on x86 flushes the entire TLB. But this is confusing and could be missed if THP is ported to other architectures. Signed-off-by: Shaohua Li <shaohua.li@xxxxxxxxx> --- arch/x86/include/asm/tlb.h | 1 + include/asm-generic/tlb.h | 10 ++++++++++ include/linux/huge_mm.h | 2 +- mm/huge_memory.c | 3 ++- mm/memory.c | 2 +- 5 files changed, 15 insertions(+), 3 deletions(-) Index: linux/arch/x86/include/asm/tlb.h =================================================================== --- linux.orig/arch/x86/include/asm/tlb.h 2011-10-25 09:00:39.000000000 +0800 +++ linux/arch/x86/include/asm/tlb.h 2011-10-25 09:02:52.000000000 +0800 @@ -4,6 +4,7 @@ #define tlb_start_vma(tlb, vma) do { } while (0) #define tlb_end_vma(tlb, vma) do { } while (0) #define __tlb_remove_tlb_entry(tlb, ptep, address) do { } while (0) +#define __tlb_remove_pmd_tlb_entry(tlb, pmdp, address) do { } while (0) #define tlb_flush(tlb) flush_tlb_mm((tlb)->mm) #include <asm-generic/tlb.h> Index: linux/include/asm-generic/tlb.h =================================================================== --- linux.orig/include/asm-generic/tlb.h 2011-10-25 09:00:23.000000000 +0800 +++ linux/include/asm-generic/tlb.h 2011-10-25 09:18:01.000000000 +0800 @@ -139,6 +139,16 @@ static inline void tlb_remove_page(struc __tlb_remove_tlb_entry(tlb, ptep, address); \ } while (0) +#ifndef __tlb_remove_pmd_tlb_entry +#define __tlb_remove_pmd_tlb_entry(tlb, pmdp, address) do {} while(0) +#endif + +#define tlb_remove_pmd_tlb_entry(tlb, pmdp, address) \ + do { \ + tlb->need_flush = 1; \ + __tlb_remove_pmd_tlb_entry(tlb, pmdp, address); \ + } while (0) + #define pte_free_tlb(tlb, ptep, address) \ do { \ tlb->need_flush = 1; \ Index: linux/include/linux/huge_mm.h =================================================================== --- 
linux.orig/include/linux/huge_mm.h 2011-10-25 09:07:12.000000000 +0800 +++ linux/include/linux/huge_mm.h 2011-10-25 09:07:44.000000000 +0800 @@ -18,7 +18,7 @@ extern struct page *follow_trans_huge_pm unsigned int flags); extern int zap_huge_pmd(struct mmu_gather *tlb, struct vm_area_struct *vma, - pmd_t *pmd); + pmd_t *pmd, unsigned long addr); extern int mincore_huge_pmd(struct vm_area_struct *vma, pmd_t *pmd, unsigned long addr, unsigned long end, unsigned char *vec); Index: linux/mm/huge_memory.c =================================================================== --- linux.orig/mm/huge_memory.c 2011-10-25 09:00:07.000000000 +0800 +++ linux/mm/huge_memory.c 2011-10-25 09:06:55.000000000 +0800 @@ -1005,7 +1005,7 @@ out: } int zap_huge_pmd(struct mmu_gather *tlb, struct vm_area_struct *vma, - pmd_t *pmd) + pmd_t *pmd, unsigned long addr) { int ret = 0; @@ -1021,6 +1021,7 @@ int zap_huge_pmd(struct mmu_gather *tlb, pgtable = get_pmd_huge_pte(tlb->mm); page = pmd_page(*pmd); pmd_clear(pmd); + tlb_remove_pmd_tlb_entry(tlb, pmd, addr); page_remove_rmap(page); VM_BUG_ON(page_mapcount(page) < 0); add_mm_counter(tlb->mm, MM_ANONPAGES, -HPAGE_PMD_NR); Index: linux/mm/memory.c =================================================================== --- linux.orig/mm/memory.c 2011-10-25 09:07:49.000000000 +0800 +++ linux/mm/memory.c 2011-10-25 09:08:29.000000000 +0800 @@ -1231,7 +1231,7 @@ static inline unsigned long zap_pmd_rang if (next-addr != HPAGE_PMD_SIZE) { VM_BUG_ON(!rwsem_is_locked(&tlb->mm->mmap_sem)); split_huge_page_pmd(vma->vm_mm, pmd); - } else if (zap_huge_pmd(tlb, vma, pmd)) + } else if (zap_huge_pmd(tlb, vma, pmd, addr)) continue; /* fall through */ } -- To unsubscribe, send a message with 'unsubscribe linux-mm' in the body to majordomo@xxxxxxxxx. For more info on Linux MM, see: http://www.linux-mm.org/ . Fight unfair telecom internet charges in Canada: sign http://stopthemeter.ca/ Don't email: <a href=mailto:"dont@xxxxxxxxx"> email@xxxxxxxxx </a>