[RFC] [PATCH 2.6.37-rc5-tip 1/20] 1: mm: Move replace_page() / write_protect_page() to mm/memory.c

Previous message: [thread] [date] [author]
Next message: [thread] [date] [author]
From: Srikar Dronamraju
Date: Thursday, December 16, 2010 - 2:57 am

User bkpt will use background page replacement approach to insert/delete
breakpoints. Background page replacement approach will be based on
replace_page and write_protect_page.  Now replace_page() and
write_protect_page loses their static attribute.

Signed-off-by: Srikar Dronamraju <srikar@linux.vnet.ibm.com>
Signed-off-by: Ananth N Mavinakayanahalli <ananth@in.ibm.com>
---
 include/linux/mm.h |    4 ++
 mm/ksm.c           |  114 -------------------------------------------------
 mm/memory.c        |  122 ++++++++++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 126 insertions(+), 114 deletions(-)

diff --git a/include/linux/mm.h b/include/linux/mm.h
index 721f451..24f8bb0 100644
--- a/include/linux/mm.h
+++ b/include/linux/mm.h
@@ -874,6 +874,10 @@ void account_page_writeback(struct page *page);
 int set_page_dirty(struct page *page);
 int set_page_dirty_lock(struct page *page);
 int clear_page_dirty_for_io(struct page *page);
+int replace_page(struct vm_area_struct *vma, struct page *page,
+					struct page *kpage, pte_t orig_pte);
+int write_protect_page(struct vm_area_struct *vma, struct page *page,
+						      pte_t *orig_pte);
 
 /* Is the vma a continuation of the stack vma above it? */
 static inline int vma_stack_continue(struct vm_area_struct *vma, unsigned long addr)
diff --git a/mm/ksm.c b/mm/ksm.c
index 43bc893..0169c6b 100644
--- a/mm/ksm.c
+++ b/mm/ksm.c
@@ -694,120 +694,6 @@ static inline int pages_identical(struct page *page1, struct page *page2)
 	return !memcmp_pages(page1, page2);
 }
 
-static int write_protect_page(struct vm_area_struct *vma, struct page *page,
-			      pte_t *orig_pte)
-{
-	struct mm_struct *mm = vma->vm_mm;
-	unsigned long addr;
-	pte_t *ptep;
-	spinlock_t *ptl;
-	int swapped;
-	int err = -EFAULT;
-
-	addr = page_address_in_vma(page, vma);
-	if (addr == -EFAULT)
-		goto out;
-
-	ptep = page_check_address(page, mm, addr, &ptl, 0);
-	if (!ptep)
-		goto out;
-
-	if (pte_write(*ptep) || pte_dirty(*ptep)) {
-		pte_t entry;
-
-		swapped = PageSwapCache(page);
-		flush_cache_page(vma, addr, page_to_pfn(page));
-		/*
-		 * Ok this is tricky, when get_user_pages_fast() run it doesnt
-		 * take any lock, therefore the check that we are going to make
-		 * with the pagecount against the mapcount is racey and
-		 * O_DIRECT can happen right after the check.
-		 * So we clear the pte and flush the tlb before the check
-		 * this assure us that no O_DIRECT can happen after the check
-		 * or in the middle of the check.
-		 */
-		entry = ptep_clear_flush(vma, addr, ptep);
-		/*
-		 * Check that no O_DIRECT or similar I/O is in progress on the
-		 * page
-		 */
-		if (page_mapcount(page) + 1 + swapped != page_count(page)) {
-			set_pte_at(mm, addr, ptep, entry);
-			goto out_unlock;
-		}
-		if (pte_dirty(entry))
-			set_page_dirty(page);
-		entry = pte_mkclean(pte_wrprotect(entry));
-		set_pte_at_notify(mm, addr, ptep, entry);
-	}
-	*orig_pte = *ptep;
-	err = 0;
-
-out_unlock:
-	pte_unmap_unlock(ptep, ptl);
-out:
-	return err;
-}
-
-/**
- * replace_page - replace page in vma by new ksm page
- * @vma:      vma that holds the pte pointing to page
- * @page:     the page we are replacing by kpage
- * @kpage:    the ksm page we replace page by
- * @orig_pte: the original value of the pte
- *
- * Returns 0 on success, -EFAULT on failure.
- */
-static int replace_page(struct vm_area_struct *vma, struct page *page,
-			struct page *kpage, pte_t orig_pte)
-{
-	struct mm_struct *mm = vma->vm_mm;
-	pgd_t *pgd;
-	pud_t *pud;
-	pmd_t *pmd;
-	pte_t *ptep;
-	spinlock_t *ptl;
-	unsigned long addr;
-	int err = -EFAULT;
-
-	addr = page_address_in_vma(page, vma);
-	if (addr == -EFAULT)
-		goto out;
-
-	pgd = pgd_offset(mm, addr);
-	if (!pgd_present(*pgd))
-		goto out;
-
-	pud = pud_offset(pgd, addr);
-	if (!pud_present(*pud))
-		goto out;
-
-	pmd = pmd_offset(pud, addr);
-	if (!pmd_present(*pmd))
-		goto out;
-
-	ptep = pte_offset_map_lock(mm, pmd, addr, &ptl);
-	if (!pte_same(*ptep, orig_pte)) {
-		pte_unmap_unlock(ptep, ptl);
-		goto out;
-	}
-
-	get_page(kpage);
-	page_add_anon_rmap(kpage, vma, addr);
-
-	flush_cache_page(vma, addr, pte_pfn(*ptep));
-	ptep_clear_flush(vma, addr, ptep);
-	set_pte_at_notify(mm, addr, ptep, mk_pte(kpage, vma->vm_page_prot));
-
-	page_remove_rmap(page);
-	put_page(page);
-
-	pte_unmap_unlock(ptep, ptl);
-	err = 0;
-out:
-	return err;
-}
-
 /*
  * try_to_merge_one_page - take two pages and merge them into one
  * @vma: the vma that holds the pte pointing to page
diff --git a/mm/memory.c b/mm/memory.c
index 02e48aa..28f79bb 100644
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -2591,6 +2591,128 @@ void unmap_mapping_range(struct address_space *mapping,
 }
 EXPORT_SYMBOL(unmap_mapping_range);
 
+/**
+ * replace_page - replace page in vma by new ksm page
+ * @vma:      vma that holds the pte pointing to page
+ * @page:     the page we are replacing by kpage
+ * @kpage:    the ksm page we replace page by
+ * @orig_pte: the original value of the pte
+ *
+ * Returns 0 on success, -EFAULT on failure.
+ */
+int replace_page(struct vm_area_struct *vma, struct page *page,
+			struct page *kpage, pte_t orig_pte)
+{
+	struct mm_struct *mm = vma->vm_mm;
+	pgd_t *pgd;
+	pud_t *pud;
+	pmd_t *pmd;
+	pte_t *ptep;
+	spinlock_t *ptl;
+	unsigned long addr;
+	int err = -EFAULT;
+
+	addr = page_address_in_vma(page, vma);
+	if (addr == -EFAULT)
+		goto out;
+
+	pgd = pgd_offset(mm, addr);
+	if (!pgd_present(*pgd))
+		goto out;
+
+	pud = pud_offset(pgd, addr);
+	if (!pud_present(*pud))
+		goto out;
+
+	pmd = pmd_offset(pud, addr);
+	if (!pmd_present(*pmd))
+		goto out;
+
+	ptep = pte_offset_map_lock(mm, pmd, addr, &ptl);
+	if (!pte_same(*ptep, orig_pte)) {
+		pte_unmap_unlock(ptep, ptl);
+		goto out;
+	}
+
+	get_page(kpage);
+	page_add_anon_rmap(kpage, vma, addr);
+
+	flush_cache_page(vma, addr, pte_pfn(*ptep));
+	ptep_clear_flush(vma, addr, ptep);
+	set_pte_at_notify(mm, addr, ptep, mk_pte(kpage, vma->vm_page_prot));
+
+	page_remove_rmap(page);
+	put_page(page);
+
+	pte_unmap_unlock(ptep, ptl);
+	err = 0;
+out:
+	return err;
+}
+
+/**
+ * write_protect_page - mark the page readonly
+ * @vma:      vma that holds the page we want to mark
+ * @page:     page that needs to be marked readonly
+ * @orig_pte: pte for the protected page.
+ *
+ * Returns 0 on success, -EFAULT on failure.
+ */
+int write_protect_page(struct vm_area_struct *vma, struct page *page,
+						      pte_t *orig_pte)
+{
+	struct mm_struct *mm = vma->vm_mm;
+	unsigned long addr;
+	pte_t *ptep;
+	spinlock_t *ptl;
+	int swapped;
+	int err = -EFAULT;
+
+	addr = page_address_in_vma(page, vma);
+	if (addr == -EFAULT)
+		goto out;
+
+	ptep = page_check_address(page, mm, addr, &ptl, 0);
+	if (!ptep)
+		goto out;
+
+	if (pte_write(*ptep) || pte_dirty(*ptep)) {
+		pte_t entry;
+
+		swapped = PageSwapCache(page);
+		flush_cache_page(vma, addr, page_to_pfn(page));
+		/*
+		 * Ok this is tricky, when get_user_pages_fast() run it doesnt
+		 * take any lock, therefore the check that we are going to make
+		 * with the pagecount against the mapcount is racey and
+		 * O_DIRECT can happen right after the check.
+		 * So we clear the pte and flush the tlb before the check
+		 * this assure us that no O_DIRECT can happen after the check
+		 * or in the middle of the check.
+		 */
+		entry = ptep_clear_flush(vma, addr, ptep);
+		/*
+		 * Check that no O_DIRECT or similar I/O is in progress on the
+		 * page
+		 */
+		if (page_mapcount(page) + 1 + swapped != page_count(page)) {
+			set_pte_at(mm, addr, ptep, entry);
+			goto out_unlock;
+		}
+		if (pte_dirty(entry))
+			set_page_dirty(page);
+		entry = pte_mkclean(pte_wrprotect(entry));
+		set_pte_at_notify(mm, addr, ptep, entry);
+	}
+	*orig_pte = *ptep;
+	err = 0;
+
+out_unlock:
+	pte_unmap_unlock(ptep, ptl);
+out:
+	return err;
+}
+
 int vmtruncate_range(struct inode *inode, loff_t offset, loff_t end)
 {
 	struct address_space *mapping = inode->i_mapping;
--
Previous message: [thread] [date] [author]
Next message: [thread] [date] [author]

Messages in current thread:
[RFC] [PATCH 2.6.37-rc5-tip 0/20] 0: Inode based uprobes, Srikar Dronamraju, (Thu Dec 16, 2:57 am)
[RFC] [PATCH 2.6.37-rc5-tip 1/20] 1: mm: Move replace_pag ..., Srikar Dronamraju, (Thu Dec 16, 2:57 am)
[RFC] [PATCH 2.6.37-rc5-tip 2/20] 2: X86 specific breakpo ..., Srikar Dronamraju, (Thu Dec 16, 2:57 am)
[RFC] [PATCH 2.6.37-rc5-tip 3/20] 3: uprobes: Breakground ..., Srikar Dronamraju, (Thu Dec 16, 2:57 am)
[RFC] [PATCH 2.6.37-rc5-tip 4/20] 4: uprobes: Adding and ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 5/20] 5: Uprobes: register/un ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 6/20] 6: x86: analyze instruc ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 7/20] 7: uprobes: store/resto ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 8/20] 8: uprobes: mmap and fo ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 9/20] 9: x86: architecture sp ..., Srikar Dronamraju, (Thu Dec 16, 2:58 am)
[RFC] [PATCH 2.6.37-rc5-tip 10/20] 10: uprobes: task speci ..., Srikar Dronamraju, (Thu Dec 16, 2:59 am)
[RFC] [PATCH 2.6.37-rc5-tip 11/20] 11: uprobes: slot alloc ..., Srikar Dronamraju, (Thu Dec 16, 2:59 am)
[RFC] [PATCH 2.6.37-rc5-tip 12/20] 12: uprobes: get the br ..., Srikar Dronamraju, (Thu Dec 16, 2:59 am)
[RFC] [PATCH 2.6.37-rc5-tip 13/20] 13: x86: x86 specific p ..., Srikar Dronamraju, (Thu Dec 16, 2:59 am)
[RFC] [PATCH 2.6.37-rc5-tip 14/20] 14: uprobes: Handing in ..., Srikar Dronamraju, (Thu Dec 16, 2:59 am)
[RFC] [PATCH 2.6.37-rc5-tip 15/20] 15: x86: uprobes except ..., Srikar Dronamraju, (Thu Dec 16, 3:00 am)
[RFC] [PATCH 2.6.37-rc5-tip 16/20] 16: uprobes: register a ..., Srikar Dronamraju, (Thu Dec 16, 3:00 am)
[RFC] [PATCH 2.6.37-rc5-tip 17/20] 17: uprobes: filter chain, Srikar Dronamraju, (Thu Dec 16, 3:00 am)
[RFC] [PATCH 2.6.37-rc5-tip 18/20] 18: uprobes: commonly u ..., Srikar Dronamraju, (Thu Dec 16, 3:00 am)
[RFC] [PATCH 2.6.37-rc5-tip 19/20] 19: tracing: Extract ou ..., Srikar Dronamraju, (Thu Dec 16, 3:00 am)
[RFC] [PATCH 2.6.37-rc5-tip 20/20] 20: tracing: uprobes tr ..., Srikar Dronamraju, (Thu Dec 16, 3:01 am)
Re: [RFC] [PATCH 2.6.37-rc5-tip 0/20] 0: Inode based uprobes, Srikar Dronamraju, (Thu Dec 16, 3:07 am)
Re: [RFC] [PATCH 2.6.37-rc5-tip 18/20] 18: uprobes: common ..., Valdis.Kletnieks, (Fri Dec 17, 12:32 pm)
Re: [RFC] [PATCH 2.6.37-rc5-tip 18/20] 18: uprobes: common ..., Srikar Dronamraju, (Fri Dec 17, 8:04 pm)