On 05/25/2017 07:35 PM, Zi Yan wrote:
> On 25 May 2017, at 18:43, Andrew Morton wrote:
> 
>> On Thu, 25 May 2017 13:19:54 -0400 "Zi Yan" <[email protected]> wrote:
>>
>>> On 25 May 2017, at 13:06, kbuild test robot wrote:
>>>
>>>> Hi Zi,
>>>>
>>>> [auto build test WARNING on mmotm/master]
>>>> [also build test WARNING on v4.12-rc2 next-20170525]
>>>> [if your patch is applied to the wrong git tree, please drop us a note to 
>>>> help improve the system]
>>>>
>>>> url:    
>>>> https://github.com/0day-ci/linux/commits/Zi-Yan/mm-page-migration-enhancement-for-thp/20170526-003749
>>>> base:   git://git.cmpxchg.org/linux-mmotm.git master
>>>> config: i386-randconfig-x016-201721 (attached as .config)
>>>> compiler: gcc-6 (Debian 6.2.0-3) 6.2.0 20160901
>>>> reproduce:
>>>>         # save the attached .config to linux build tree
>>>>         make ARCH=i386
>>>>
>>>> All warnings (new ones prefixed by >>):
>>>>
>>>>    In file included from fs/proc/task_mmu.c:15:0:
>>>>    include/linux/swapops.h: In function 'swp_entry_to_pmd':
>>>>>> include/linux/swapops.h:222:16: warning: missing braces around 
>>>>>> initializer [-Wmissing-braces]
>>>>      return (pmd_t){{ 0 }};
>>>>                    ^
>>>
>>> The braces are added to eliminate the warning from "m68k-linux-gcc (GCC) 
>>> 4.9.0",
>>> which has the bug: https://gcc.gnu.org/bugzilla/show_bug.cgi?id=53119.
>>
>> I think we'd prefer to have a warning on m68k than on i386!  Is there
>> something smarter we can do here?
> 
> I will remove the braces in the next version.
> 
> The bug is present in gcc 4.8 and 4.9 and m68k has newer gcc to use,
> so kbuild test robot needs to upgrade its m68k gcc (maybe it has done it).
>

Removed the braces.

---
 arch/x86/include/asm/pgtable_64.h |  2 +
 include/linux/swapops.h           | 69 +++++++++++++++++++++++++++++++-
 mm/huge_memory.c                  | 84 ++++++++++++++++++++++++++++++++++++---
 mm/migrate.c                      | 30 +++++++++++++-
 mm/page_vma_mapped.c              | 13 ++++--
 mm/pgtable-generic.c              |  3 +-
 mm/rmap.c                         | 11 +++++
 7 files changed, 200 insertions(+), 12 deletions(-)

diff --git a/arch/x86/include/asm/pgtable_64.h 
b/arch/x86/include/asm/pgtable_64.h
index 45b7a4094de0..eac7f8cf4ae0 100644
--- a/arch/x86/include/asm/pgtable_64.h
+++ b/arch/x86/include/asm/pgtable_64.h
@@ -208,7 +208,9 @@ static inline int pgd_large(pgd_t pgd) { return 0; }
                                         ((type) << (SWP_TYPE_FIRST_BIT)) \
                                         | ((offset) << SWP_OFFSET_FIRST_BIT) })
 #define __pte_to_swp_entry(pte)                ((swp_entry_t) { pte_val((pte)) 
})
+#define __pmd_to_swp_entry(pmd)                ((swp_entry_t) { pmd_val((pmd)) 
})
 #define __swp_entry_to_pte(x)          ((pte_t) { .pte = (x).val })
+#define __swp_entry_to_pmd(x)          ((pmd_t) { .pmd = (x).val })
 
 extern int kern_addr_valid(unsigned long addr);
 extern void cleanup_highmap(void);
diff --git a/include/linux/swapops.h b/include/linux/swapops.h
index 5c3a5f3e7eec..c543c6f25e8f 100644
--- a/include/linux/swapops.h
+++ b/include/linux/swapops.h
@@ -103,7 +103,8 @@ static inline void *swp_to_radix_entry(swp_entry_t entry)
 #ifdef CONFIG_MIGRATION
 static inline swp_entry_t make_migration_entry(struct page *page, int write)
 {
-       BUG_ON(!PageLocked(page));
+       BUG_ON(!PageLocked(compound_head(page)));
+
        return swp_entry(write ? SWP_MIGRATION_WRITE : SWP_MIGRATION_READ,
                        page_to_pfn(page));
 }
@@ -126,7 +127,7 @@ static inline struct page 
*migration_entry_to_page(swp_entry_t entry)
         * Any use of migration entries may only occur while the
         * corresponding page is locked
         */
-       BUG_ON(!PageLocked(p));
+       BUG_ON(!PageLocked(compound_head(p)));
        return p;
 }
 
@@ -163,6 +164,70 @@ static inline int is_write_migration_entry(swp_entry_t 
entry)
 
 #endif
 
+struct page_vma_mapped_walk;
+
+#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
+extern void set_pmd_migration_entry(struct page_vma_mapped_walk *pvmw,
+               struct page *page);
+
+extern void remove_migration_pmd(struct page_vma_mapped_walk *pvmw,
+               struct page *new);
+
+extern void pmd_migration_entry_wait(struct mm_struct *mm, pmd_t *pmd);
+
+static inline swp_entry_t pmd_to_swp_entry(pmd_t pmd)
+{
+       swp_entry_t arch_entry;
+
+       arch_entry = __pmd_to_swp_entry(pmd);
+       return swp_entry(__swp_type(arch_entry), __swp_offset(arch_entry));
+}
+
+static inline pmd_t swp_entry_to_pmd(swp_entry_t entry)
+{
+       swp_entry_t arch_entry;
+
+       arch_entry = __swp_entry(swp_type(entry), swp_offset(entry));
+       return __swp_entry_to_pmd(arch_entry);
+}
+
+static inline int is_pmd_migration_entry(pmd_t pmd)
+{
+       return !pmd_present(pmd) && is_migration_entry(pmd_to_swp_entry(pmd));
+}
+#else
+static inline void set_pmd_migration_entry(struct page_vma_mapped_walk *pvmw,
+               struct page *page)
+{
+       BUILD_BUG();
+}
+
+static inline void remove_migration_pmd(struct page_vma_mapped_walk *pvmw,
+               struct page *new)
+{
+       BUILD_BUG();
+}
+
+static inline void pmd_migration_entry_wait(struct mm_struct *m, pmd_t *p) { }
+
+static inline swp_entry_t pmd_to_swp_entry(pmd_t pmd)
+{
+       BUILD_BUG();
+       return swp_entry(0, 0);
+}
+
+static inline pmd_t swp_entry_to_pmd(swp_entry_t entry)
+{
+       BUILD_BUG();
+       return (pmd_t){ 0 };
+}
+
+static inline int is_pmd_migration_entry(pmd_t pmd)
+{
+       return 0;
+}
+#endif
+
 #ifdef CONFIG_MEMORY_FAILURE
 
 extern atomic_long_t num_poisoned_pages __read_mostly;
diff --git a/mm/huge_memory.c b/mm/huge_memory.c
index b137f60bd983..05d8288c3eea 100644
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -1635,10 +1635,23 @@ int zap_huge_pmd(struct mmu_gather *tlb, struct 
vm_area_struct *vma,
                spin_unlock(ptl);
                tlb_remove_page_size(tlb, pmd_page(orig_pmd), HPAGE_PMD_SIZE);
        } else {
-               struct page *page = pmd_page(orig_pmd);
-               page_remove_rmap(page, true);
-               VM_BUG_ON_PAGE(page_mapcount(page) < 0, page);
-               VM_BUG_ON_PAGE(!PageHead(page), page);
+               struct page *page = NULL;
+               int migration = 0;
+
+               if (pmd_present(orig_pmd)) {
+                       page = pmd_page(orig_pmd);
+                       page_remove_rmap(page, true);
+                       VM_BUG_ON_PAGE(page_mapcount(page) < 0, page);
+                       VM_BUG_ON_PAGE(!PageHead(page), page);
+               } else {
+                       swp_entry_t entry;
+
+                       VM_BUG_ON(!is_pmd_migration_entry(orig_pmd));
+                       entry = pmd_to_swp_entry(orig_pmd);
+                       page = pfn_to_page(swp_offset(entry));
+                       migration = 1;
+               }
+
                if (PageAnon(page)) {
                        zap_deposited_table(tlb->mm, pmd);
                        add_mm_counter(tlb->mm, MM_ANONPAGES, -HPAGE_PMD_NR);
@@ -1647,8 +1660,10 @@ int zap_huge_pmd(struct mmu_gather *tlb, struct 
vm_area_struct *vma,
                                zap_deposited_table(tlb->mm, pmd);
                        add_mm_counter(tlb->mm, MM_FILEPAGES, -HPAGE_PMD_NR);
                }
+
                spin_unlock(ptl);
-               tlb_remove_page_size(tlb, page, HPAGE_PMD_SIZE);
+               if (!migration)
+                       tlb_remove_page_size(tlb, page, HPAGE_PMD_SIZE);
        }
        return 1;
 }
@@ -2688,3 +2703,62 @@ static int __init split_huge_pages_debugfs(void)
 }
 late_initcall(split_huge_pages_debugfs);
 #endif
+
+#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
+void set_pmd_migration_entry(struct page_vma_mapped_walk *pvmw,
+               struct page *page)
+{
+       struct vm_area_struct *vma = pvmw->vma;
+       struct mm_struct *mm = vma->vm_mm;
+       unsigned long address = pvmw->address;
+       pmd_t pmdval;
+       swp_entry_t entry;
+
+       if (!(pvmw->pmd && !pvmw->pte))
+               return;
+
+       mmu_notifier_invalidate_range_start(mm, address,
+                       address + HPAGE_PMD_SIZE);
+
+       flush_cache_range(vma, address, address + HPAGE_PMD_SIZE);
+       pmdval = pmdp_huge_clear_flush(vma, address, pvmw->pmd);
+       if (pmd_dirty(pmdval))
+               set_page_dirty(page);
+       entry = make_migration_entry(page, pmd_write(pmdval));
+       pmdval = swp_entry_to_pmd(entry);
+       set_pmd_at(mm, address, pvmw->pmd, pmdval);
+       page_remove_rmap(page, true);
+       put_page(page);
+
+       mmu_notifier_invalidate_range_end(mm, address,
+                       address + HPAGE_PMD_SIZE);
+}
+
+void remove_migration_pmd(struct page_vma_mapped_walk *pvmw, struct page *new)
+{
+       struct vm_area_struct *vma = pvmw->vma;
+       struct mm_struct *mm = vma->vm_mm;
+       unsigned long address = pvmw->address;
+       unsigned long mmun_start = address & HPAGE_PMD_MASK;
+       unsigned long mmun_end = mmun_start + HPAGE_PMD_SIZE;
+       pmd_t pmde;
+       swp_entry_t entry;
+
+       if (!(pvmw->pmd && !pvmw->pte))
+               return;
+
+       entry = pmd_to_swp_entry(*pvmw->pmd);
+       get_page(new);
+       pmde = pmd_mkold(mk_huge_pmd(new, vma->vm_page_prot));
+       if (is_write_migration_entry(entry))
+               pmde = maybe_pmd_mkwrite(pmde, vma);
+
+       flush_cache_range(vma, mmun_start, mmun_end);
+       page_add_anon_rmap(new, vma, mmun_start, true);
+       set_pmd_at(mm, mmun_start, pvmw->pmd, pmde);
+       flush_tlb_range(vma, mmun_start, mmun_end);
+       if (vma->vm_flags & VM_LOCKED)
+               mlock_vma_page(new);
+       update_mmu_cache_pmd(vma, address, pvmw->pmd);
+}
+#endif
diff --git a/mm/migrate.c b/mm/migrate.c
index 051cc1555d36..37c3eb14cbaa 100644
--- a/mm/migrate.c
+++ b/mm/migrate.c
@@ -215,6 +215,13 @@ static bool remove_migration_pte(struct page *page, struct 
vm_area_struct *vma,
                        new = page - pvmw.page->index +
                                linear_page_index(vma, pvmw.address);
 
+               /* PMD-mapped THP migration entry */
+               if (!pvmw.pte && pvmw.page) {
+                       VM_BUG_ON_PAGE(PageHuge(page) || 
!PageTransCompound(page), page);
+                       remove_migration_pmd(&pvmw, new);
+                       continue;
+               }
+
                get_page(new);
                pte = pte_mkold(mk_pte(new, READ_ONCE(vma->vm_page_prot)));
                if (pte_swp_soft_dirty(*pvmw.pte))
@@ -329,6 +336,27 @@ void migration_entry_wait_huge(struct vm_area_struct *vma,
        __migration_entry_wait(mm, pte, ptl);
 }
 
+#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
+void pmd_migration_entry_wait(struct mm_struct *mm, pmd_t *pmd)
+{
+       spinlock_t *ptl;
+       struct page *page;
+
+       ptl = pmd_lock(mm, pmd);
+       if (!is_pmd_migration_entry(*pmd))
+               goto unlock;
+       page = migration_entry_to_page(pmd_to_swp_entry(*pmd));
+       if (!get_page_unless_zero(page))
+               goto unlock;
+       spin_unlock(ptl);
+       wait_on_page_locked(page);
+       put_page(page);
+       return;
+unlock:
+       spin_unlock(ptl);
+}
+#endif
+
 #ifdef CONFIG_BLOCK
 /* Returns true if all buffers are successfully locked */
 static bool buffer_migrate_lock_buffers(struct buffer_head *head,
@@ -1087,7 +1115,7 @@ static ICE_noinline int unmap_and_move(new_page_t 
get_new_page,
                goto out;
        }
 
-       if (unlikely(PageTransHuge(page))) {
+       if (unlikely(PageTransHuge(page) && !PageTransHuge(newpage))) {
                lock_page(page);
                rc = split_huge_page(page);
                unlock_page(page);
diff --git a/mm/page_vma_mapped.c b/mm/page_vma_mapped.c
index de9c40d7304a..e209a12d8722 100644
--- a/mm/page_vma_mapped.c
+++ b/mm/page_vma_mapped.c
@@ -137,16 +137,23 @@ bool page_vma_mapped_walk(struct page_vma_mapped_walk 
*pvmw)
        if (!pud_present(*pud))
                return false;
        pvmw->pmd = pmd_offset(pud, pvmw->address);
-       if (pmd_trans_huge(*pvmw->pmd)) {
+       if (pmd_trans_huge(*pvmw->pmd) || is_pmd_migration_entry(*pvmw->pmd)) {
                pvmw->ptl = pmd_lock(mm, pvmw->pmd);
-               if (!pmd_present(*pvmw->pmd))
-                       return not_found(pvmw);
                if (likely(pmd_trans_huge(*pvmw->pmd))) {
                        if (pvmw->flags & PVMW_MIGRATION)
                                return not_found(pvmw);
                        if (pmd_page(*pvmw->pmd) != page)
                                return not_found(pvmw);
                        return true;
+               } else if (!pmd_present(*pvmw->pmd)) {
+                       if 
(unlikely(is_migration_entry(pmd_to_swp_entry(*pvmw->pmd)))) {
+                               swp_entry_t entry = 
pmd_to_swp_entry(*pvmw->pmd);
+
+                               if (migration_entry_to_page(entry) != page)
+                                       return not_found(pvmw);
+                               return true;
+                       }
+                       return not_found(pvmw);
                } else {
                        /* THP pmd was split under us: handle on pte level */
                        spin_unlock(pvmw->ptl);
diff --git a/mm/pgtable-generic.c b/mm/pgtable-generic.c
index c99d9512a45b..1175f6a24fdb 100644
--- a/mm/pgtable-generic.c
+++ b/mm/pgtable-generic.c
@@ -124,7 +124,8 @@ pmd_t pmdp_huge_clear_flush(struct vm_area_struct *vma, 
unsigned long address,
 {
        pmd_t pmd;
        VM_BUG_ON(address & ~HPAGE_PMD_MASK);
-       VM_BUG_ON(!pmd_trans_huge(*pmdp) && !pmd_devmap(*pmdp));
+       VM_BUG_ON((pmd_present(*pmdp) && !pmd_trans_huge(*pmdp) &&
+                          !pmd_devmap(*pmdp)) || !pmd_present(*pmdp));
        pmd = pmdp_huge_get_and_clear(vma->vm_mm, address, pmdp);
        flush_pmd_tlb_range(vma, address, address + HPAGE_PMD_SIZE);
        return pmd;
diff --git a/mm/rmap.c b/mm/rmap.c
index d6056310513f..6e1146a97021 100644
--- a/mm/rmap.c
+++ b/mm/rmap.c
@@ -1304,6 +1304,7 @@ static bool try_to_unmap_one(struct page *page, struct 
vm_area_struct *vma,
        bool ret = true;
        enum ttu_flags flags = (enum ttu_flags)arg;
 
+
        /* munlock has nothing to gain from examining un-locked vmas */
        if ((flags & TTU_MUNLOCK) && !(vma->vm_flags & VM_LOCKED))
                return true;
@@ -1314,6 +1315,16 @@ static bool try_to_unmap_one(struct page *page, struct 
vm_area_struct *vma,
        }
 
        while (page_vma_mapped_walk(&pvmw)) {
+               /* PMD-mapped THP migration entry */
+               if (flags & TTU_MIGRATION) {
+                       if (!pvmw.pte && page) {
+                               VM_BUG_ON_PAGE(PageHuge(page) || 
!PageTransCompound(page),
+                                               page);
+                               set_pmd_migration_entry(&pvmw, page);
+                               continue;
+                       }
+               }
+
                /*
                 * If the page is mlock()d, we cannot swap it out.
                 * If it's recently referenced (perhaps page_referenced
-- 
2.11.0



-- 
Best Regards,
Yan Zi

Attachment: signature.asc
Description: OpenPGP digital signature

Reply via email to