
Commit 15fecf89 authored by Paul E. McKenney

srcu: Abstract multi-tail callback list handling



RCU has only one multi-tail callback list, which is implemented via
the nxtlist, nxttail, nxtcompleted, qlen_lazy, and qlen fields in the
rcu_data structure, and whose operations are open-coded throughout the
Tree RCU implementation.  This has been more or less OK in the past,
but upcoming callback-list optimizations in SRCU could really use
a multi-tail callback list there as well.

This commit therefore abstracts the multi-tail callback list handling
into a new kernel/rcu/rcu_segcblist.h file, and uses this new API.
The simple head-and-tail pointer callback list is also abstracted and
applied everywhere except for the NOCB callback-offload lists.  (Yes,
the plan is to apply them there as well, but this commit is already
bigger than would be good.)

Signed-off-by: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
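To make "multi-tail callback list" concrete: each tail is a pointer to the ->next field of the newest callback in its segment, so enqueuing stores through the tail and then advances it. A minimal single-tail sketch follows (illustrative only, not code from this commit; example_enqueue and the file-scope variables are invented):

	static struct rcu_head *head;		/* Oldest callback, or NULL if none. */
	static struct rcu_head **tail = &head;	/* ->next field of newest callback. */

	static void example_enqueue(struct rcu_head *rhp)
	{
		rhp->next = NULL;
		*tail = rhp;		/* Append after the current newest callback. */
		tail = &rhp->next;	/* The new callback is now the newest. */
	}

The segmented list introduced below simply keeps an array of such tail pointers, one per grace-period segment, together with per-segment ->gp_seq[] numbers.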
parent b8c78d3a
kernel/rcu/rcu_segcblist.h (new file)  +625 −0
/*
 * RCU segmented callback lists
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, you can access it online at
 * http://www.gnu.org/licenses/gpl-2.0.html.
 *
 * Copyright IBM Corporation, 2017
 *
 * Authors: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
 */

#ifndef __KERNEL_RCU_SEGCBLIST_H
#define __KERNEL_RCU_SEGCBLIST_H

/* Simple unsegmented callback lists. */
struct rcu_cblist {
	struct rcu_head *head;
	struct rcu_head **tail;
	long len;
	long len_lazy;
};

#define RCU_CBLIST_INITIALIZER(n) { .head = NULL, .tail = &n.head }

/* Initialize simple callback list. */
static inline void rcu_cblist_init(struct rcu_cblist *rclp)
{
	rclp->head = NULL;
	rclp->tail = &rclp->head;
	rclp->len = 0;
	rclp->len_lazy = 0;
}

/* Is simple callback list empty? */
static inline bool rcu_cblist_empty(struct rcu_cblist *rclp)
{
	return !rclp->head;
}

/* Return number of callbacks in simple callback list. */
static inline long rcu_cblist_n_cbs(struct rcu_cblist *rclp)
{
	return rclp->len;
}

/* Return number of lazy callbacks in simple callback list. */
static inline long rcu_cblist_n_lazy_cbs(struct rcu_cblist *rclp)
{
	return rclp->len_lazy;
}

/*
 * Debug function to actually count the number of callbacks.
 * If the number exceeds the limit specified, return -1.
 */
static inline long rcu_cblist_count_cbs(struct rcu_cblist *rclp, long lim)
{
	int cnt = 0;
	struct rcu_head **rhpp = &rclp->head;

	for (;;) {
		if (!*rhpp)
			return cnt;
		if (++cnt > lim)
			return -1;
		rhpp = &(*rhpp)->next;
	}
}

/*
 * Dequeue the oldest rcu_head structure from the specified callback
 * list.  This function assumes that the callback is non-lazy, but
 * the caller can later invoke rcu_cblist_dequeued_lazy() if it
 * finds otherwise (and if it cares about laziness).  This allows
 * different users to have different ways of determining laziness.
 */
static inline struct rcu_head *rcu_cblist_dequeue(struct rcu_cblist *rclp)
{
	struct rcu_head *rhp;

	rhp = rclp->head;
	if (!rhp)
		return NULL;
	prefetch(rhp);
	rclp->len--;
	rclp->head = rhp->next;
	if (!rclp->head)
		rclp->tail = &rclp->head;
	return rhp;
}

/*
 * Account for the fact that a previously dequeued callback turned out
 * to be marked as lazy.
 */
static inline void rcu_cblist_dequeued_lazy(struct rcu_cblist *rclp)
{
	rclp->len_lazy--;
}
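
/*
 * Typical consumption pattern (a sketch only; "callback_is_lazy" stands in
 * for whatever laziness test the caller uses, and real callers invoke
 * callbacks via their reclaim helpers rather than calling ->func directly):
 *
 *	while ((rhp = rcu_cblist_dequeue(rclp)) != NULL) {
 *		if (callback_is_lazy(rhp))
 *			rcu_cblist_dequeued_lazy(rclp);
 *		rhp->func(rhp);
 *	}
 */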

/*
 * Interim function to return rcu_cblist head pointer.  Longer term, the
 * rcu_cblist will be used more pervasively, removing the need for this
 * function.
 */
static inline struct rcu_head *rcu_cblist_head(struct rcu_cblist *rclp)
{
	return rclp->head;
}

/*
 * Interim function to return rcu_cblist tail pointer.  Longer term, the
 * rcu_cblist will be used more pervasively, removing the need for this
 * function.
 */
static inline struct rcu_head **rcu_cblist_tail(struct rcu_cblist *rclp)
{
	WARN_ON_ONCE(rcu_cblist_empty(rclp));
	return rclp->tail;
}

/* Complicated segmented callback lists.  ;-) */

/*
 * Index values for segments in rcu_segcblist structure.
 *
 * The segments are as follows:
 *
 * [head, *tails[RCU_DONE_TAIL]):
 *	Callbacks whose grace period has elapsed, and thus can be invoked.
 * [*tails[RCU_DONE_TAIL], *tails[RCU_WAIT_TAIL]):
 *	Callbacks waiting for the current GP from the current CPU's viewpoint.
 * [*tails[RCU_WAIT_TAIL], *tails[RCU_NEXT_READY_TAIL]):
 *	Callbacks that arrived before the next GP started, again from
 *	the current CPU's viewpoint.  These can be handled by the next GP.
 * [*tails[RCU_NEXT_READY_TAIL], *tails[RCU_NEXT_TAIL]):
 *	Callbacks that might have arrived after the next GP started.
 *	There is some uncertainty as to when a given GP starts and
 *	ends, but a CPU knows the exact times if it is the one starting
 *	or ending the GP.  Other CPUs know that the previous GP ends
 *	before the next one starts.
 *
 * Note that RCU_WAIT_TAIL cannot be empty unless RCU_NEXT_READY_TAIL is also
 * empty.
 *
 * The ->gp_seq[] array contains the grace-period number at which the
 * corresponding segment of callbacks will be ready to invoke.  A given
 * element of this array is meaningful only when the corresponding segment
 * is non-empty, and it is never valid for RCU_DONE_TAIL (whose callbacks
 * are already ready to invoke) or for RCU_NEXT_TAIL (whose callbacks have
 * not yet been assigned a grace-period number).
 */
#define RCU_DONE_TAIL		0	/* Also RCU_WAIT head. */
#define RCU_WAIT_TAIL		1	/* Also RCU_NEXT_READY head. */
#define RCU_NEXT_READY_TAIL	2	/* Also RCU_NEXT head. */
#define RCU_NEXT_TAIL		3
#define RCU_CBLIST_NSEGS	4
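
/*
 * For example, a list holding six callbacks (CB1 is the oldest; the names
 * are purely illustrative) might be segmented as follows:
 *
 *	head -> CB1 -> CB2 -> CB3 -> CB4 -> CB5 -> CB6 -> NULL
 *	tails[RCU_DONE_TAIL]       == &CB2->next  (CB1, CB2 ready to invoke)
 *	tails[RCU_WAIT_TAIL]       == &CB4->next  (CB3, CB4 wait on current GP)
 *	tails[RCU_NEXT_READY_TAIL] == &CB5->next  (CB5 can be handled by next GP)
 *	tails[RCU_NEXT_TAIL]       == &CB6->next  (CB6 not yet assigned a GP)
 */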

struct rcu_segcblist {
	struct rcu_head *head;
	struct rcu_head **tails[RCU_CBLIST_NSEGS];
	unsigned long gp_seq[RCU_CBLIST_NSEGS];
	long len;
	long len_lazy;
};

/*
 * Initialize an rcu_segcblist structure.
 */
static inline void rcu_segcblist_init(struct rcu_segcblist *rsclp)
{
	int i;

	BUILD_BUG_ON(RCU_NEXT_TAIL + 1 != ARRAY_SIZE(rsclp->gp_seq));
	BUILD_BUG_ON(ARRAY_SIZE(rsclp->tails) != ARRAY_SIZE(rsclp->gp_seq));
	rsclp->head = NULL;
	for (i = 0; i < RCU_CBLIST_NSEGS; i++)
		rsclp->tails[i] = &rsclp->head;
	rsclp->len = 0;
	rsclp->len_lazy = 0;
}

/*
 * Is the specified rcu_segcblist structure empty?
 *
 * But careful!  The fact that the ->head field is NULL does not
 * necessarily imply that there are no callbacks associated with
 * this structure.  When callbacks are being invoked, they are
 * removed as a group.  If callback invocation must be preempted,
 * the remaining callbacks will be added back to the list.  Either
 * way, the counts are updated later.
 *
 * So it is often the case that rcu_segcblist_n_cbs() should be used
 * instead.
 */
static inline bool rcu_segcblist_empty(struct rcu_segcblist *rsclp)
{
	return !rsclp->head;
}

/* Return number of callbacks in segmented callback list. */
static inline long rcu_segcblist_n_cbs(struct rcu_segcblist *rsclp)
{
	return READ_ONCE(rsclp->len);
}

/* Return number of lazy callbacks in segmented callback list. */
static inline long rcu_segcblist_n_lazy_cbs(struct rcu_segcblist *rsclp)
{
	return rsclp->len_lazy;
}

/* Return number of non-lazy callbacks in segmented callback list. */
static inline long rcu_segcblist_n_nonlazy_cbs(struct rcu_segcblist *rsclp)
{
	return rsclp->len - rsclp->len_lazy;
}

/*
 * Is the specified rcu_segcblist enabled, for example, not corresponding
 * to an offline or callback-offloaded CPU?
 */
static inline bool rcu_segcblist_is_enabled(struct rcu_segcblist *rsclp)
{
	return !!rsclp->tails[RCU_NEXT_TAIL];
}

/*
 * Disable the specified rcu_segcblist structure, so that callbacks can
 * no longer be posted to it.  This structure must be empty.
 */
static inline void rcu_segcblist_disable(struct rcu_segcblist *rsclp)
{
	WARN_ON_ONCE(!rcu_segcblist_empty(rsclp));
	WARN_ON_ONCE(rcu_segcblist_n_cbs(rsclp));
	WARN_ON_ONCE(rcu_segcblist_n_lazy_cbs(rsclp));
	rsclp->tails[RCU_NEXT_TAIL] = NULL;
}

/*
 * Is the specified segment of the specified rcu_segcblist structure
 * empty of callbacks?
 */
static inline bool rcu_segcblist_segempty(struct rcu_segcblist *rsclp, int seg)
{
	if (seg == RCU_DONE_TAIL)
		return &rsclp->head == rsclp->tails[RCU_DONE_TAIL];
	return rsclp->tails[seg - 1] == rsclp->tails[seg];
}

/*
 * Are all segments following the specified segment of the specified
 * rcu_segcblist structure empty of callbacks?  (The specified
 * segment might well contain callbacks.)
 */
static inline bool rcu_segcblist_restempty(struct rcu_segcblist *rsclp, int seg)
{
	return !*rsclp->tails[seg];
}

/*
 * Does the specified rcu_segcblist structure contain callbacks that
 * are ready to be invoked?
 */
static inline bool rcu_segcblist_ready_cbs(struct rcu_segcblist *rsclp)
{
	return rcu_segcblist_is_enabled(rsclp) &&
	       &rsclp->head != rsclp->tails[RCU_DONE_TAIL];
}

/*
 * Does the specified rcu_segcblist structure contain callbacks that
 * are still pending, that is, not yet ready to be invoked?
 */
static inline bool rcu_segcblist_pend_cbs(struct rcu_segcblist *rsclp)
{
	return rcu_segcblist_is_enabled(rsclp) &&
	       !rcu_segcblist_restempty(rsclp, RCU_DONE_TAIL);
}

/*
 * Return a pointer to the first callback in the specified rcu_segcblist
 * structure.  This is useful for diagnostics.
 */
static inline struct rcu_head *
rcu_segcblist_first_cb(struct rcu_segcblist *rsclp)
{
	if (rcu_segcblist_is_enabled(rsclp))
		return rsclp->head;
	return NULL;
}

/*
 * Return a pointer to the first pending callback in the specified
 * rcu_segcblist structure.  This is useful just after posting a given
 * callback -- if that callback is the first pending callback, then
 * you cannot rely on someone else having already started up the required
 * grace period.
 */
static inline struct rcu_head *
rcu_segcblist_first_pend_cb(struct rcu_segcblist *rsclp)
{
	if (rcu_segcblist_is_enabled(rsclp))
		return *rsclp->tails[RCU_DONE_TAIL];
	return NULL;
}

/*
 * Does the specified rcu_segcblist structure contain callbacks that
 * have not yet been processed beyond having been posted, that is,
 * does it contain callbacks in its last segment?
 */
static inline bool rcu_segcblist_new_cbs(struct rcu_segcblist *rsclp)
{
	return rcu_segcblist_is_enabled(rsclp) &&
	       !rcu_segcblist_restempty(rsclp, RCU_NEXT_READY_TAIL);
}

/*
 * Enqueue the specified callback onto the specified rcu_segcblist
 * structure, updating accounting as needed.  Note that the ->len
 * field may be accessed locklessly, hence the WRITE_ONCE().
 * The ->len field is used by rcu_barrier() and friends to determine
 * if it must post a callback on this structure, and it is OK
 * for rcu_barrier() to sometimes post callbacks needlessly, but
 * absolutely not OK for it to ever miss posting a callback.
 */
static inline void rcu_segcblist_enqueue(struct rcu_segcblist *rsclp,
					 struct rcu_head *rhp, bool lazy)
{
	WRITE_ONCE(rsclp->len, rsclp->len + 1); /* ->len sampled locklessly. */
	if (lazy)
		rsclp->len_lazy++;
	smp_mb(); /* Ensure counts are updated before callback is enqueued. */
	rhp->next = NULL;
	*rsclp->tails[RCU_NEXT_TAIL] = rhp;
	rsclp->tails[RCU_NEXT_TAIL] = &rhp->next;
}

/*
 * Extract only the counts from the specified rcu_segcblist structure,
 * and place them in the specified rcu_cblist structure.  This function
 * supports both callback orphaning and invocation, hence the separation
 * of counts and callbacks.  (Callbacks ready for invocation must be
 * orphaned and adopted separately from pending callbacks, but counts
 * apply to all callbacks.  Locking must be used to make sure that
 * both orphaned-callbacks lists are consistent.)
 */
static inline void rcu_segcblist_extract_count(struct rcu_segcblist *rsclp,
					       struct rcu_cblist *rclp)
{
	rclp->len_lazy += rsclp->len_lazy;
	rclp->len += rsclp->len;
	rsclp->len_lazy = 0;
	WRITE_ONCE(rsclp->len, 0); /* ->len sampled locklessly. */
}

/*
 * Extract only those callbacks ready to be invoked from the specified
 * rcu_segcblist structure and place them in the specified rcu_cblist
 * structure.
 */
static inline void rcu_segcblist_extract_done_cbs(struct rcu_segcblist *rsclp,
						  struct rcu_cblist *rclp)
{
	int i;

	if (!rcu_segcblist_ready_cbs(rsclp))
		return; /* Nothing to do. */
	*rclp->tail = rsclp->head;
	rsclp->head = *rsclp->tails[RCU_DONE_TAIL];
	*rsclp->tails[RCU_DONE_TAIL] = NULL;
	rclp->tail = rsclp->tails[RCU_DONE_TAIL];
	for (i = RCU_CBLIST_NSEGS - 1; i >= RCU_DONE_TAIL; i--)
		if (rsclp->tails[i] == rsclp->tails[RCU_DONE_TAIL])
			rsclp->tails[i] = &rsclp->head;
}

/*
 * Extract only those callbacks still pending (not yet ready to be
 * invoked) from the specified rcu_segcblist structure and place them in
 * the specified rcu_cblist structure.  Note that this loses information
 * about any callbacks that might have been partway done waiting for
 * their grace period.  Too bad!  They will have to start over.
 */
static inline void
rcu_segcblist_extract_pend_cbs(struct rcu_segcblist *rsclp,
			       struct rcu_cblist *rclp)
{
	int i;

	if (!rcu_segcblist_pend_cbs(rsclp))
		return; /* Nothing to do. */
	*rclp->tail = *rsclp->tails[RCU_DONE_TAIL];
	rclp->tail = rsclp->tails[RCU_NEXT_TAIL];
	*rsclp->tails[RCU_DONE_TAIL] = NULL;
	for (i = RCU_DONE_TAIL + 1; i < RCU_CBLIST_NSEGS; i++)
		rsclp->tails[i] = rsclp->tails[RCU_DONE_TAIL];
}

/*
 * Move the entire contents of the specified rcu_segcblist structure,
 * counts, callbacks, and all, to the specified rcu_cblist structure.
 * @@@ Why do we need this???  Moving early-boot CBs to NOCB lists?
 * @@@ Memory barrier needed?  (Not if only used at boot time...)
 */
static inline void rcu_segcblist_extract_all(struct rcu_segcblist *rsclp,
					     struct rcu_cblist *rclp)
{
	rcu_segcblist_extract_done_cbs(rsclp, rclp);
	rcu_segcblist_extract_pend_cbs(rsclp, rclp);
	rcu_segcblist_extract_count(rsclp, rclp);
}

/*
 * Insert counts from the specified rcu_cblist structure in the
 * specified rcu_segcblist structure.
 */
static inline void rcu_segcblist_insert_count(struct rcu_segcblist *rsclp,
					      struct rcu_cblist *rclp)
{
	rsclp->len_lazy += rclp->len_lazy;
	/* ->len sampled locklessly. */
	WRITE_ONCE(rsclp->len, rsclp->len + rclp->len);
	rclp->len_lazy = 0;
	rclp->len = 0;
}

/*
 * Move callbacks from the specified rcu_cblist to the beginning of the
 * done-callbacks segment of the specified rcu_segcblist.
 */
static inline void rcu_segcblist_insert_done_cbs(struct rcu_segcblist *rsclp,
						 struct rcu_cblist *rclp)
{
	int i;

	if (!rclp->head)
		return; /* No callbacks to move. */
	*rclp->tail = rsclp->head;
	rsclp->head = rclp->head;
	for (i = RCU_DONE_TAIL; i < RCU_CBLIST_NSEGS; i++)
		if (&rsclp->head == rsclp->tails[i])
			rsclp->tails[i] = rclp->tail;
		else
			break;
	rclp->head = NULL;
	rclp->tail = &rclp->head;
}

/*
 * Move callbacks from the specified rcu_cblist to the end of the
 * new-callbacks segment of the specified rcu_segcblist.
 */
static inline void rcu_segcblist_insert_pend_cbs(struct rcu_segcblist *rsclp,
						 struct rcu_cblist *rclp)
{
	if (!rclp->head)
		return; /* Nothing to do. */
	*rsclp->tails[RCU_NEXT_TAIL] = rclp->head;
	rsclp->tails[RCU_NEXT_TAIL] = rclp->tail;
	rclp->head = NULL;
	rclp->tail = &rclp->head;
}

/*
 * Advance the callbacks in the specified rcu_segcblist structure based
 * on the current value passed in for the grace-period counter.
 */
static inline void rcu_segcblist_advance(struct rcu_segcblist *rsclp,
					 unsigned long seq)
{
	int i, j;

	WARN_ON_ONCE(!rcu_segcblist_is_enabled(rsclp));
	WARN_ON_ONCE(rcu_segcblist_restempty(rsclp, RCU_DONE_TAIL));

	/*
	 * Find all callbacks whose ->gp_seq numbers indicate that they
	 * are ready to invoke, and put them into the RCU_DONE_TAIL segment.
	 */
	for (i = RCU_WAIT_TAIL; i < RCU_NEXT_TAIL; i++) {
		if (ULONG_CMP_LT(seq, rsclp->gp_seq[i]))
			break;
		rsclp->tails[RCU_DONE_TAIL] = rsclp->tails[i];
	}

	/* If no callbacks moved, nothing more need be done. */
	if (i == RCU_WAIT_TAIL)
		return;

	/* Clean up tail pointers that might have been misordered above. */
	for (j = RCU_WAIT_TAIL; j < i; j++)
		rsclp->tails[j] = rsclp->tails[RCU_DONE_TAIL];

	/*
	 * Callbacks moved, so clean up the misordered ->tails[] pointers
	 * that now point into the middle of the list of ready-to-invoke
	 * callbacks.  The overall effect is to copy down the later pointers
	 * into the gap that was created by the now-ready segments.
	 */
	for (j = RCU_WAIT_TAIL; i < RCU_NEXT_TAIL; i++, j++) {
		if (rsclp->tails[j] == rsclp->tails[RCU_NEXT_TAIL])
			break;  /* No more callbacks. */
		rsclp->tails[j] = rsclp->tails[i];
		rsclp->gp_seq[j] = rsclp->gp_seq[i];
	}
}

/*
 * "Accelerate" callbacks based on more-accurate grace-period information.
 * The reason for this is that RCU does not synchronize the beginnings and
 * ends of grace periods, and that callbacks are posted locally.  This in
 * turn means that the callbacks must be labelled conservatively early
 * on, as getting exact information would degrade both performance and
 * scalability.  When more accurate grace-period information becomes
 * available, previously posted callbacks can be "accelerated", marking
 * them to complete at the end of the earlier grace period.
 *
 * This function operates on an rcu_segcblist structure, and also the
 * grace-period sequence number at which new callbacks would become
 * ready to invoke.
 */
static inline bool rcu_segcblist_accelerate(struct rcu_segcblist *rsclp,
					    unsigned long seq)
{
	int i;

	WARN_ON_ONCE(!rcu_segcblist_is_enabled(rsclp));
	WARN_ON_ONCE(rcu_segcblist_restempty(rsclp, RCU_DONE_TAIL));

	/*
	 * Find the segment preceding the oldest segment of callbacks
	 * whose ->gp_seq[] completion is at or after that passed in via
	 * "seq", skipping any empty segments.  This oldest segment, along
	 * with any later segments, can be merged in with any newly arrived
	 * callbacks in the RCU_NEXT_TAIL segment, and assigned "seq"
	 * as their ->gp_seq[] grace-period completion sequence number.
	 */
	for (i = RCU_NEXT_READY_TAIL; i > RCU_DONE_TAIL; i--)
		if (rsclp->tails[i] != rsclp->tails[i - 1] &&
		    ULONG_CMP_LT(rsclp->gp_seq[i], seq))
			break;

	/*
	 * If all the segments contain callbacks that correspond to
	 * earlier grace-period sequence numbers than "seq", leave.
	 * Assuming that the rcu_segcblist structure has enough
	 * segments in its arrays, this can only happen if some of
	 * the non-done segments contain callbacks that really are
	 * ready to invoke.  This situation will get straightened
	 * out by the next call to rcu_segcblist_advance().
	 *
	 * Also advance to the oldest segment of callbacks whose
	 * ->gp_seq[] completion is at or after that passed in via "seq",
	 * skipping any empty segments.
	 */
	if (++i >= RCU_NEXT_TAIL)
		return false;

	/*
	 * Merge all later callbacks, including newly arrived callbacks,
	 * into the segment located by the for-loop above.  Assign "seq"
	 * as the ->gp_seq[] value in order to correctly handle the case
	 * where there were no pending callbacks in the rcu_segcblist
	 * structure other than in the RCU_NEXT_TAIL segment.
	 */
	for (; i < RCU_NEXT_TAIL; i++) {
		rsclp->tails[i] = rsclp->tails[RCU_NEXT_TAIL];
		rsclp->gp_seq[i] = seq;
	}
	return true;
}

/*
 * Scan the specified rcu_segcblist structure for callbacks that need
 * a grace period later than the one specified by "seq".  We don't look
 * at the RCU_DONE_TAIL or RCU_NEXT_TAIL segments because they don't
 * have a grace-period sequence number.
 */
static inline bool rcu_segcblist_future_gp_needed(struct rcu_segcblist *rsclp,
						  unsigned long seq)
{
	int i;

	for (i = RCU_WAIT_TAIL; i < RCU_NEXT_TAIL; i++)
		if (rsclp->tails[i - 1] != rsclp->tails[i] &&
		    ULONG_CMP_LT(seq, rsclp->gp_seq[i]))
			return true;
	return false;
}

/*
 * Interim function to return rcu_segcblist head pointer.  Longer term, the
 * rcu_segcblist will be used more pervasively, removing the need for this
 * function.
 */
static inline struct rcu_head *rcu_segcblist_head(struct rcu_segcblist *rsclp)
{
	return rsclp->head;
}

/*
 * Interim function to return rcu_segcblist tail pointer.  Longer term, the
 * rcu_segcblist will be used more pervasively, removing the need for this
 * function.
 */
static inline struct rcu_head **rcu_segcblist_tail(struct rcu_segcblist *rsclp)
{
	WARN_ON_ONCE(rcu_segcblist_empty(rsclp));
	return rsclp->tails[RCU_NEXT_TAIL];
}

#endif /* __KERNEL_RCU_SEGCBLIST_H */
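
The Tree RCU call sites that drive this API live in the main tree file, whose diff is collapsed below for size. For orientation, a hypothetical per-CPU processing routine might use it as follows (example_do_callbacks and gp_seq_done are invented names; locking, tracing, and lazy-callback accounting are omitted):

	static void example_do_callbacks(struct rcu_segcblist *rsclp,
					 unsigned long gp_seq_done)
	{
		struct rcu_cblist ready;
		struct rcu_head *rhp;

		rcu_cblist_init(&ready);

		/* Move callbacks whose grace period has ended into RCU_DONE_TAIL. */
		if (rcu_segcblist_pend_cbs(rsclp))
			rcu_segcblist_advance(rsclp, gp_seq_done);

		/* Detach the list's counts and its ready-to-invoke callbacks. */
		rcu_segcblist_extract_count(rsclp, &ready);
		rcu_segcblist_extract_done_cbs(rsclp, &ready);

		/* Invoke them; each dequeue decrements the detached count. */
		while ((rhp = rcu_cblist_dequeue(&ready)) != NULL)
			rhp->func(rhp);

		/* Credit the count of callbacks still queued back to the list. */
		rcu_segcblist_insert_count(rsclp, &ready);
	}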
+112 −236  (file changed; preview collapsed because it exceeds the size limit)

+7 −34

@@ -30,6 +30,7 @@
 #include <linux/seqlock.h>
 #include <linux/swait.h>
 #include <linux/stop_machine.h>
+#include "rcu_segcblist.h"
 
 /*
  * Define shape of hierarchy based on NR_CPUS, CONFIG_RCU_FANOUT, and
@@ -335,34 +336,9 @@ struct rcu_data {
 					/* period it is aware of. */
 
 	/* 2) batch handling */
-	/*
-	 * If nxtlist is not NULL, it is partitioned as follows.
-	 * Any of the partitions might be empty, in which case the
-	 * pointer to that partition will be equal to the pointer for
-	 * the following partition.  When the list is empty, all of
-	 * the nxttail elements point to the ->nxtlist pointer itself,
-	 * which in that case is NULL.
-	 *
-	 * [nxtlist, *nxttail[RCU_DONE_TAIL]):
-	 *	Entries that batch # <= ->completed
-	 *	The grace period for these entries has completed, and
-	 *	the other grace-period-completed entries may be moved
-	 *	here temporarily in rcu_process_callbacks().
-	 * [*nxttail[RCU_DONE_TAIL], *nxttail[RCU_WAIT_TAIL]):
-	 *	Entries that batch # <= ->completed - 1: waiting for current GP
-	 * [*nxttail[RCU_WAIT_TAIL], *nxttail[RCU_NEXT_READY_TAIL]):
-	 *	Entries known to have arrived before current GP ended
-	 * [*nxttail[RCU_NEXT_READY_TAIL], *nxttail[RCU_NEXT_TAIL]):
-	 *	Entries that might have arrived after current GP ended
-	 *	Note that the value of *nxttail[RCU_NEXT_TAIL] will
-	 *	always be NULL, as this is the end of the list.
-	 */
-	struct rcu_head *nxtlist;
-	struct rcu_head **nxttail[RCU_NEXT_SIZE];
-	unsigned long	nxtcompleted[RCU_NEXT_SIZE];
-					/* grace periods for sublists. */
-	long		qlen_lazy;	/* # of lazy queued callbacks */
-	long		qlen;		/* # of queued callbacks, incl lazy */
+	struct rcu_segcblist cblist;	/* Segmented callback list, with */
+					/* different callbacks waiting for */
+					/* different grace periods. */
 	long		qlen_last_fqs_check;
 					/* qlen at last check for QS forcing */
 	unsigned long	n_cbs_invoked;	/* count of RCU cbs invoked. */
@@ -500,14 +476,11 @@ struct rcu_state {
 
 	raw_spinlock_t orphan_lock ____cacheline_internodealigned_in_smp;
 						/* Protect following fields. */
-	struct rcu_head *orphan_nxtlist;	/* Orphaned callbacks that */
+	struct rcu_cblist orphan_pend;		/* Orphaned callbacks that */
 						/*  need a grace period. */
-	struct rcu_head **orphan_nxttail;	/* Tail of above. */
-	struct rcu_head *orphan_donelist;	/* Orphaned callbacks that */
+	struct rcu_cblist orphan_done;		/* Orphaned callbacks that */
 						/*  are ready to invoke. */
-	struct rcu_head **orphan_donetail;	/* Tail of above. */
-	long qlen_lazy;				/* Number of lazy callbacks. */
-	long qlen;				/* Total number of callbacks. */
+						/* (Contains counts.) */
 	/* End of fields guarded by orphan_lock. */
 
 	struct mutex barrier_mutex;		/* Guards barrier fields. */
+25 −29

@@ -1350,10 +1350,10 @@ static bool __maybe_unused rcu_try_advance_all_cbs(void)
 		 */
 		if ((rdp->completed != rnp->completed ||
 		     unlikely(READ_ONCE(rdp->gpwrap))) &&
-		    rdp->nxttail[RCU_DONE_TAIL] != rdp->nxttail[RCU_NEXT_TAIL])
+		    rcu_segcblist_pend_cbs(&rdp->cblist))
 			note_gp_changes(rsp, rdp);
 
-		if (cpu_has_callbacks_ready_to_invoke(rdp))
+		if (rcu_segcblist_ready_cbs(&rdp->cblist))
 			cbs_ready = true;
 	}
 	return cbs_ready;
@@ -1461,7 +1461,7 @@ static void rcu_prepare_for_idle(void)
 	rdtp->last_accelerate = jiffies;
 	for_each_rcu_flavor(rsp) {
 		rdp = this_cpu_ptr(rsp->rda);
-		if (!*rdp->nxttail[RCU_DONE_TAIL])
+		if (rcu_segcblist_pend_cbs(&rdp->cblist))
 			continue;
 		rnp = rdp->mynode;
 		raw_spin_lock_rcu_node(rnp); /* irqs already disabled. */
@@ -1529,7 +1529,7 @@ static void rcu_oom_notify_cpu(void *unused)
 
 	for_each_rcu_flavor(rsp) {
 		rdp = raw_cpu_ptr(rsp->rda);
-		if (rdp->qlen_lazy != 0) {
+		if (rcu_segcblist_n_lazy_cbs(&rdp->cblist)) {
 			atomic_inc(&oom_callback_count);
 			rsp->call(&rdp->oom_head, rcu_oom_callback);
 		}
@@ -1934,30 +1934,26 @@ static bool __maybe_unused rcu_nocb_adopt_orphan_cbs(struct rcu_state *rsp,
 						     struct rcu_data *rdp,
 						     unsigned long flags)
 {
-	long ql = rsp->qlen;
-	long qll = rsp->qlen_lazy;
+	long ql = rcu_cblist_n_cbs(&rsp->orphan_done);
+	long qll = rcu_cblist_n_lazy_cbs(&rsp->orphan_done);
 
 	/* If this is not a no-CBs CPU, tell the caller to do it the old way. */
 	if (!rcu_is_nocb_cpu(smp_processor_id()))
 		return false;
-	rsp->qlen = 0;
-	rsp->qlen_lazy = 0;
 
 	/* First, enqueue the donelist, if any.  This preserves CB ordering. */
-	if (rsp->orphan_donelist != NULL) {
-		__call_rcu_nocb_enqueue(rdp, rsp->orphan_donelist,
-					rsp->orphan_donetail, ql, qll, flags);
-		ql = qll = 0;
-		rsp->orphan_donelist = NULL;
-		rsp->orphan_donetail = &rsp->orphan_donelist;
-	}
-	if (rsp->orphan_nxtlist != NULL) {
-		__call_rcu_nocb_enqueue(rdp, rsp->orphan_nxtlist,
-					rsp->orphan_nxttail, ql, qll, flags);
-		ql = qll = 0;
-		rsp->orphan_nxtlist = NULL;
-		rsp->orphan_nxttail = &rsp->orphan_nxtlist;
-	}
+	if (!rcu_cblist_empty(&rsp->orphan_done)) {
+		__call_rcu_nocb_enqueue(rdp, rcu_cblist_head(&rsp->orphan_done),
+					rcu_cblist_tail(&rsp->orphan_done),
+					ql, qll, flags);
+	}
+	if (!rcu_cblist_empty(&rsp->orphan_pend)) {
+		__call_rcu_nocb_enqueue(rdp, rcu_cblist_head(&rsp->orphan_pend),
+					rcu_cblist_tail(&rsp->orphan_pend),
+					ql, qll, flags);
+	}
+	rcu_cblist_init(&rsp->orphan_done);
+	rcu_cblist_init(&rsp->orphan_pend);
 	return true;
 }
 
@@ -2399,16 +2395,16 @@ static bool init_nocb_callback_list(struct rcu_data *rdp)
 		return false;
 
 	/* If there are early-boot callbacks, move them to nocb lists. */
-	if (rdp->nxtlist) {
-		rdp->nocb_head = rdp->nxtlist;
-		rdp->nocb_tail = rdp->nxttail[RCU_NEXT_TAIL];
-		atomic_long_set(&rdp->nocb_q_count, rdp->qlen);
-		atomic_long_set(&rdp->nocb_q_count_lazy, rdp->qlen_lazy);
-		rdp->nxtlist = NULL;
-		rdp->qlen = 0;
-		rdp->qlen_lazy = 0;
+	if (!rcu_segcblist_empty(&rdp->cblist)) {
+		rdp->nocb_head = rcu_segcblist_head(&rdp->cblist);
+		rdp->nocb_tail = rcu_segcblist_tail(&rdp->cblist);
+		atomic_long_set(&rdp->nocb_q_count,
+				rcu_segcblist_n_cbs(&rdp->cblist));
+		atomic_long_set(&rdp->nocb_q_count_lazy,
+				rcu_segcblist_n_lazy_cbs(&rdp->cblist));
+		rcu_segcblist_init(&rdp->cblist);
 	}
-	rdp->nxttail[RCU_NEXT_TAIL] = NULL;
+	rcu_segcblist_disable(&rdp->cblist);
 	return true;
 }
 
+11 −10  (file changed; preview collapsed because it exceeds the size limit)