
Commit 508034a3 authored by Hugh Dickins, committed by Linus Torvalds

[PATCH] mm: unmap_vmas with inner ptlock



Remove the page_table_lock from around the calls to unmap_vmas, and replace
the pte_offset_map in zap_pte_range by pte_offset_map_lock: all callers are
now safe to descend without page_table_lock.
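
A sketch of what that pattern looks like in zap_pte_range (an abridged
illustration of the mm/memory.c hunk below, not the complete function):

	spinlock_t *ptl;
	pte_t *pte;

	/* was: pte = pte_offset_map(pmd, addr), relying on the
	 * caller's mm->page_table_lock; now take the pte lock here */
	pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
	do {
		/* ... zap one pte, adjust file_rss/anon_rss ... */
	} while (pte++, addr += PAGE_SIZE, addr != end);
	pte_unmap_unlock(pte - 1, ptl);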

Don't attempt fancy locking for hugepages; just take page_table_lock in
unmap_hugepage_range.  That makes zap_hugepage_range, and the hugetlb test in
zap_page_range, redundant: unmap_vmas calls unmap_hugepage_range anyway.  Nor
does unmap_vmas have much use for its mm arg now.
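
In outline, unmap_hugepage_range now does its own locking (abridged
from the mm/hugetlb.c hunk below):

	void unmap_hugepage_range(struct vm_area_struct *vma,
				  unsigned long start, unsigned long end)
	{
		struct mm_struct *mm = vma->vm_mm;

		spin_lock(&mm->page_table_lock);
		/* ... clear huge ptes, drop pages, lower file_rss ... */
		spin_unlock(&mm->page_table_lock);
		flush_tlb_range(vma, start, end);
	}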

The tlb_start_vma and tlb_end_vma in unmap_page_range are now called without
page_table_lock: if they're implemented at all, they typically come down to
flush_cache_range (usually done outside page_table_lock) and flush_tlb_range
(which we already audited for the mprotect case).
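
For illustration, an architecture that does implement them typically
has something like this (a generic sketch, not any one arch's exact
tlb.h):

	#define tlb_start_vma(tlb, vma)					\
		do {							\
			if (!(tlb)->fullmm)				\
				flush_cache_range(vma, (vma)->vm_start,	\
						(vma)->vm_end);		\
		} while (0)

	#define tlb_end_vma(tlb, vma)					\
		do {							\
			if (!(tlb)->fullmm)				\
				flush_tlb_range(vma, (vma)->vm_start,	\
						(vma)->vm_end);		\
		} while (0)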

Signed-off-by: Hugh Dickins <hugh@veritas.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
parent 8f4f8c16
fs/hugetlbfs/inode.c +3 −7
@@ -92,7 +92,7 @@ out:
 }
 
 /*
- * Called under down_write(mmap_sem), page_table_lock is not held
+ * Called under down_write(mmap_sem).
  */
 
 #ifdef HAVE_ARCH_HUGETLB_UNMAPPED_AREA
@@ -308,7 +308,6 @@ hugetlb_vmtruncate_list(struct prio_tree_root *root, unsigned long h_pgoff)
 
 	vma_prio_tree_foreach(vma, &iter, root, h_pgoff, ULONG_MAX) {
 		unsigned long h_vm_pgoff;
-		unsigned long v_length;
 		unsigned long v_offset;
 
 		h_vm_pgoff = vma->vm_pgoff >> (HPAGE_SHIFT - PAGE_SHIFT);
@@ -319,11 +318,8 @@ hugetlb_vmtruncate_list(struct prio_tree_root *root, unsigned long h_pgoff)
 		if (h_vm_pgoff >= h_pgoff)
 			v_offset = 0;
 
-		v_length = vma->vm_end - vma->vm_start;
-
-		zap_hugepage_range(vma,
-				vma->vm_start + v_offset,
-				v_length - v_offset);
+		unmap_hugepage_range(vma,
+				vma->vm_start + v_offset, vma->vm_end);
 	}
 }

include/linux/hugetlb.h +0 −2
@@ -16,7 +16,6 @@ static inline int is_vm_hugetlb_page(struct vm_area_struct *vma)
 int hugetlb_sysctl_handler(struct ctl_table *, int, struct file *, void __user *, size_t *, loff_t *);
 int copy_hugetlb_page_range(struct mm_struct *, struct mm_struct *, struct vm_area_struct *);
 int follow_hugetlb_page(struct mm_struct *, struct vm_area_struct *, struct page **, struct vm_area_struct **, unsigned long *, int *, int);
-void zap_hugepage_range(struct vm_area_struct *, unsigned long, unsigned long);
 void unmap_hugepage_range(struct vm_area_struct *, unsigned long, unsigned long);
 int hugetlb_prefault(struct address_space *, struct vm_area_struct *);
 int hugetlb_report_meminfo(char *);
@@ -87,7 +86,6 @@ static inline unsigned long hugetlb_total_pages(void)
 #define follow_huge_addr(mm, addr, write)	ERR_PTR(-EINVAL)
 #define copy_hugetlb_page_range(src, dst, vma)	({ BUG(); 0; })
 #define hugetlb_prefault(mapping, vma)		({ BUG(); 0; })
-#define zap_hugepage_range(vma, start, len)	BUG()
 #define unmap_hugepage_range(vma, start, end)	BUG()
 #define is_hugepage_mem_enough(size)		0
 #define hugetlb_report_meminfo(buf)		0
include/linux/mm.h +1 −1
@@ -682,7 +682,7 @@ struct zap_details {
 
 unsigned long zap_page_range(struct vm_area_struct *vma, unsigned long address,
 		unsigned long size, struct zap_details *);
-unsigned long unmap_vmas(struct mmu_gather **tlb, struct mm_struct *mm,
+unsigned long unmap_vmas(struct mmu_gather **tlb,
 		struct vm_area_struct *start_vma, unsigned long start_addr,
 		unsigned long end_addr, unsigned long *nr_accounted,
 		struct zap_details *);
mm/hugetlb.c +3 −9
@@ -314,6 +314,8 @@ void unmap_hugepage_range(struct vm_area_struct *vma, unsigned long start,
 	BUG_ON(start & ~HPAGE_MASK);
 	BUG_ON(end & ~HPAGE_MASK);
 
+	spin_lock(&mm->page_table_lock);
+
 	/* Update high watermark before we lower rss */
 	update_hiwater_rss(mm);
 
@@ -333,17 +335,9 @@ void unmap_hugepage_range(struct vm_area_struct *vma, unsigned long start,
 		put_page(page);
 		add_mm_counter(mm, file_rss, (int) -(HPAGE_SIZE / PAGE_SIZE));
 	}
-	flush_tlb_range(vma, start, end);
-}
-
-void zap_hugepage_range(struct vm_area_struct *vma,
-			unsigned long start, unsigned long length)
-{
-	struct mm_struct *mm = vma->vm_mm;
 
-	spin_lock(&mm->page_table_lock);
-	unmap_hugepage_range(vma, start, start + length);
 	spin_unlock(&mm->page_table_lock);
+	flush_tlb_range(vma, start, end);
 }
 
 int hugetlb_prefault(struct address_space *mapping, struct vm_area_struct *vma)
mm/memory.c +12 −29
@@ -551,10 +551,11 @@ static void zap_pte_range(struct mmu_gather *tlb,
 {
 	struct mm_struct *mm = tlb->mm;
 	pte_t *pte;
+	spinlock_t *ptl;
 	int file_rss = 0;
 	int anon_rss = 0;
 
-	pte = pte_offset_map(pmd, addr);
+	pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
 	do {
 		pte_t ptent = *pte;
 		if (pte_none(ptent))
@@ -621,7 +622,7 @@ static void zap_pte_range(struct mmu_gather *tlb,
 	} while (pte++, addr += PAGE_SIZE, addr != end);
 
 	add_mm_rss(mm, file_rss, anon_rss);
-	pte_unmap(pte - 1);
+	pte_unmap_unlock(pte - 1, ptl);
 }
 
 static inline void zap_pmd_range(struct mmu_gather *tlb,
static inline void zap_pmd_range(struct mmu_gather *tlb,
@@ -690,7 +691,6 @@ static void unmap_page_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
/**
 * unmap_vmas - unmap a range of memory covered by a list of vma's
 * @tlbp: address of the caller's struct mmu_gather
 * @mm: the controlling mm_struct
 * @vma: the starting vma
 * @start_addr: virtual address at which to start unmapping
 * @end_addr: virtual address at which to end unmapping
@@ -699,10 +699,10 @@ static void unmap_page_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
  *
  * Returns the end address of the unmapping (restart addr if interrupted).
  *
- * Unmap all pages in the vma list.  Called under page_table_lock.
+ * Unmap all pages in the vma list.
  *
- * We aim to not hold page_table_lock for too long (for scheduling latency
- * reasons).  So zap pages in ZAP_BLOCK_SIZE bytecounts.  This means we need to
+ * We aim to not hold locks for too long (for scheduling latency reasons).
+ * So zap pages in ZAP_BLOCK_SIZE bytecounts.  This means we need to
  * return the ending mmu_gather to the caller.
  *
  * Only addresses between `start' and `end' will be unmapped.
@@ -714,7 +714,7 @@ static void unmap_page_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
  * ensure that any thus-far unmapped pages are flushed before unmap_vmas()
  * drops the lock and schedules.
  */
-unsigned long unmap_vmas(struct mmu_gather **tlbp, struct mm_struct *mm,
+unsigned long unmap_vmas(struct mmu_gather **tlbp,
 		struct vm_area_struct *vma, unsigned long start_addr,
 		unsigned long end_addr, unsigned long *nr_accounted,
 		struct zap_details *details)
@@ -764,19 +764,15 @@ unsigned long unmap_vmas(struct mmu_gather **tlbp, struct mm_struct *mm,
 			tlb_finish_mmu(*tlbp, tlb_start, start);
 
 			if (need_resched() ||
-				need_lockbreak(&mm->page_table_lock) ||
 				(i_mmap_lock && need_lockbreak(i_mmap_lock))) {
 				if (i_mmap_lock) {
-					/* must reset count of rss freed */
-					*tlbp = tlb_gather_mmu(mm, fullmm);
+					*tlbp = NULL;
 					goto out;
 				}
-				spin_unlock(&mm->page_table_lock);
 				cond_resched();
-				spin_lock(&mm->page_table_lock);
 			}
 
-			*tlbp = tlb_gather_mmu(mm, fullmm);
+			*tlbp = tlb_gather_mmu(vma->vm_mm, fullmm);
 			tlb_start_valid = 0;
 			zap_bytes = ZAP_BLOCK_SIZE;
 		}
@@ -800,17 +796,11 @@ unsigned long zap_page_range(struct vm_area_struct *vma, unsigned long address,
 	unsigned long end = address + size;
 	unsigned long nr_accounted = 0;
 
-	if (is_vm_hugetlb_page(vma)) {
-		zap_hugepage_range(vma, address, size);
-		return end;
-	}
-
 	lru_add_drain();
 	tlb = tlb_gather_mmu(mm, 0);
 	update_hiwater_rss(mm);
-	spin_lock(&mm->page_table_lock);
-	end = unmap_vmas(&tlb, mm, vma, address, end, &nr_accounted, details);
-	spin_unlock(&mm->page_table_lock);
-	tlb_finish_mmu(tlb, address, end);
+	end = unmap_vmas(&tlb, vma, address, end, &nr_accounted, details);
+	if (tlb)
+		tlb_finish_mmu(tlb, address, end);
 	return end;
 }
@@ -1434,13 +1424,6 @@ again:
 
 	restart_addr = zap_page_range(vma, start_addr,
 					end_addr - start_addr, details);
-
-	/*
-	 * We cannot rely on the break test in unmap_vmas:
-	 * on the one hand, we don't want to restart our loop
-	 * just because that broke out for the page_table_lock;
-	 * on the other hand, it does no test when vma is small.
-	 */
 	need_break = need_resched() ||
 			need_lockbreak(details->i_mmap_lock);
