mm: make compound_head() robust (1d798ca3) · Commits · e / devices / android_kernel_oneplus_sm7250

Documentation/vm/split_page_table_lock

+2 −2

Original line number	Diff line number	Diff line
		@@ -54,8 +54,8 @@ everything required is done by pgtable_page_ctor() and pgtable_page_dtor(),
		which must be called on PTE table allocation / freeing.

		Make sure the architecture doesn't use slab allocator for page table
		allocation: slab uses page->slab_cache and page->first_page for its pages.
		These fields share storage with page->ptl.
		allocation: slab uses page->slab_cache for its pages.
		This field shares storage with page->ptl.

		PMD split lock only makes sense if you have more than two page table
		levels.

arch/xtensa/configs/iss_defconfig

+0 −1

Original line number	Diff line number	Diff line
		@@ -169,7 +169,6 @@ CONFIG_FLATMEM_MANUAL=y
		# CONFIG_SPARSEMEM_MANUAL is not set
		CONFIG_FLATMEM=y
		CONFIG_FLAT_NODE_MEM_MAP=y
		CONFIG_PAGEFLAGS_EXTENDED=y
		CONFIG_SPLIT_PTLOCK_CPUS=4
		# CONFIG_PHYS_ADDR_T_64BIT is not set
		CONFIG_ZONE_DMA_FLAG=1

include/linux/hugetlb_cgroup.h

+2 −2

Original line number	Diff line number	Diff line
		@@ -32,7 +32,7 @@ static inline struct hugetlb_cgroup *hugetlb_cgroup_from_page(struct page *page)

		if (compound_order(page) < HUGETLB_CGROUP_MIN_ORDER)
		return NULL;
		return (struct hugetlb_cgroup *)page[2].lru.next;
		return (struct hugetlb_cgroup *)page[2].private;
		}

		static inline
		@@ -42,7 +42,7 @@ int set_hugetlb_cgroup(struct page *page, struct hugetlb_cgroup *h_cg)

		if (compound_order(page) < HUGETLB_CGROUP_MIN_ORDER)
		return -1;
		page[2].lru.next = (void *)h_cg;
		page[2].private = (unsigned long)h_cg;
		return 0;
		}

include/linux/mm.h

+3 −50

Original line number	Diff line number	Diff line
		@@ -430,46 +430,6 @@ static inline void compound_unlock_irqrestore(struct page *page,
		#endif
		}

		static inline struct page *compound_head_by_tail(struct page *tail)
		{
		struct page *head = tail->first_page;

		/*
		* page->first_page may be a dangling pointer to an old
		* compound page, so recheck that it is still a tail
		* page before returning.
		*/
		smp_rmb();
		if (likely(PageTail(tail)))
		return head;
		return tail;
		}

		/*
		* Since either compound page could be dismantled asynchronously in THP
		* or we access asynchronously arbitrary positioned struct page, there
		* would be tail flag race. To handle this race, we should call
		* smp_rmb() before checking tail flag. compound_head_by_tail() did it.
		*/
		static inline struct page *compound_head(struct page *page)
		{
		if (unlikely(PageTail(page)))
		return compound_head_by_tail(page);
		return page;
		}

		/*
		* If we access compound page synchronously such as access to
		* allocated page, there is no need to handle tail flag race, so we can
		* check tail flag directly without any synchronization primitive.
		*/
		static inline struct page *compound_head_fast(struct page *page)
		{
		if (unlikely(PageTail(page)))
		return page->first_page;
		return page;
		}

		/*
		* The atomic page->_mapcount, starts from -1: so that transitions
		* both from it and to it can be tracked, using atomic_inc_and_test
		@@ -518,7 +478,7 @@ static inline void get_huge_page_tail(struct page *page)
		VM_BUG_ON_PAGE(!PageTail(page), page);
		VM_BUG_ON_PAGE(page_mapcount(page) < 0, page);
		VM_BUG_ON_PAGE(atomic_read(&page->_count) != 0, page);
		if (compound_tail_refcounted(page->first_page))
		if (compound_tail_refcounted(compound_head(page)))
		atomic_inc(&page->_mapcount);
		}

		@@ -541,13 +501,7 @@ static inline struct page *virt_to_head_page(const void *x)
		{
		struct page *page = virt_to_page(x);

		/*
		* We don't need to worry about synchronization of tail flag
		* when we call virt_to_head_page() since it is only called for
		* already allocated page and this page won't be freed until
		* this virt_to_head_page() is finished. So use _fast variant.
		*/
		return compound_head_fast(page);
		return compound_head(page);
		}

		/*
		@@ -1586,8 +1540,7 @@ static inline bool ptlock_init(struct page *page)
		* with 0. Make sure nobody took it in use in between.
		*
		* It can happen if arch try to use slab for page table allocation:
		* slab code uses page->slab_cache and page->first_page (for tail
		* pages), which share storage with page->ptl.
		* slab code uses page->slab_cache, which share storage with page->ptl.
		*/
		VM_BUG_ON_PAGE(*(unsigned long *)&page->ptl, page);
		if (!ptlock_alloc(page))

include/linux/mm_types.h

+18 −4

Original line number	Diff line number	Diff line
		@@ -111,7 +111,13 @@ struct page {
		};
		};

		/* Third double word block */
		/*
		* Third double word block
		*
		* WARNING: bit 0 of the first word encode PageTail(). That means
		* the rest users of the storage space MUST NOT use the bit to
		* avoid collision and false-positive PageTail().
		*/
		union {
		struct list_head lru; /* Pageout list, eg. active_list
		* protected by zone->lru_lock !
		@@ -132,14 +138,23 @@ struct page {
		struct rcu_head rcu_head; /* Used by SLAB
		* when destroying via RCU
		*/
		/* First tail page of compound page */
		/* Tail pages of compound page */
		struct {
		unsigned long compound_head; /* If bit zero is set */

		/* First tail page only */
		unsigned short int compound_dtor;
		unsigned short int compound_order;
		};

		#if defined(CONFIG_TRANSPARENT_HUGEPAGE) && USE_SPLIT_PMD_PTLOCKS
		struct {
		unsigned long __pad; /* do not overlay pmd_huge_pte
		* with compound_head to avoid
		* possible bit 0 collision.
		*/
		pgtable_t pmd_huge_pte; /* protected by page->ptl */
		};
		#endif
		};

		@@ -160,7 +175,6 @@ struct page {
		#endif
		#endif
		struct kmem_cache *slab_cache; /* SL[AU]B: Pointer to slab */
		struct page *first_page; /* Compound tail pages */
		};

		#ifdef CONFIG_MEMCG