Skip to content

Commit acddb87

Browse files
committed
Revert "rcu-tasks: Fix access non-existent percpu rtpcp variable in rcu_tasks_need_gpcb()"
This reverts commit 224fd63 which is commit fd70e9f1d85f5323096ad313ba73f5fe3d15ea41 upstream. It is reported to cause problems in testing, so revert it for now.

Link: https://lore.kernel.org/r/20241216-comic-handling-3bcf108cc465@wendy
Reported-by: Conor Dooley <[email protected]>
Cc: Zhixu Liu <[email protected]>
Cc: Zqiang <[email protected]>
Cc: Neeraj Upadhyay <[email protected]>
Cc: Sasha Levin <[email protected]>
Cc: Xiangyu Chen <[email protected]>
Signed-off-by: Greg Kroah-Hartman <[email protected]>
1 parent 36775f4 commit acddb87

File tree

1 file changed

+28
-54
lines changed

1 file changed

+28
-54
lines changed

kernel/rcu/tasks.h

Lines changed: 28 additions & 54 deletions
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,6 @@ typedef void (*postgp_func_t)(struct rcu_tasks *rtp);
3131
* @barrier_q_head: RCU callback for barrier operation.
3232
* @rtp_blkd_tasks: List of tasks blocked as readers.
3333
* @cpu: CPU number corresponding to this entry.
34-
* @index: Index of this CPU in rtpcp_array of the rcu_tasks structure.
3534
* @rtpp: Pointer to the rcu_tasks structure.
3635
*/
3736
struct rcu_tasks_percpu {
@@ -44,7 +43,6 @@ struct rcu_tasks_percpu {
4443
struct rcu_head barrier_q_head;
4544
struct list_head rtp_blkd_tasks;
4645
int cpu;
47-
int index;
4846
struct rcu_tasks *rtpp;
4947
};
5048

@@ -70,7 +68,6 @@ struct rcu_tasks_percpu {
7068
* @postgp_func: This flavor's post-grace-period function (optional).
7169
* @call_func: This flavor's call_rcu()-equivalent function.
7270
* @rtpcpu: This flavor's rcu_tasks_percpu structure.
73-
* @rtpcp_array: Array of pointers to rcu_tasks_percpu structure of CPUs in cpu_possible_mask.
7471
* @percpu_enqueue_shift: Shift down CPU ID this much when enqueuing callbacks.
7572
* @percpu_enqueue_lim: Number of per-CPU callback queues in use for enqueuing.
7673
* @percpu_dequeue_lim: Number of per-CPU callback queues in use for dequeuing.
@@ -103,7 +100,6 @@ struct rcu_tasks {
103100
postgp_func_t postgp_func;
104101
call_rcu_func_t call_func;
105102
struct rcu_tasks_percpu __percpu *rtpcpu;
106-
struct rcu_tasks_percpu **rtpcp_array;
107103
int percpu_enqueue_shift;
108104
int percpu_enqueue_lim;
109105
int percpu_dequeue_lim;
@@ -168,8 +164,6 @@ module_param(rcu_task_contend_lim, int, 0444);
168164
static int rcu_task_collapse_lim __read_mostly = 10;
169165
module_param(rcu_task_collapse_lim, int, 0444);
170166

171-
static int rcu_task_cpu_ids;
172-
173167
/* RCU tasks grace-period state for debugging. */
174168
#define RTGS_INIT 0
175169
#define RTGS_WAIT_WAIT_CBS 1
@@ -234,8 +228,6 @@ static void cblist_init_generic(struct rcu_tasks *rtp)
234228
unsigned long flags;
235229
int lim;
236230
int shift;
237-
int maxcpu;
238-
int index = 0;
239231

240232
raw_spin_lock_irqsave(&rtp->cbs_gbl_lock, flags);
241233
if (rcu_task_enqueue_lim < 0) {
@@ -246,9 +238,14 @@ static void cblist_init_generic(struct rcu_tasks *rtp)
246238
}
247239
lim = rcu_task_enqueue_lim;
248240

249-
rtp->rtpcp_array = kcalloc(num_possible_cpus(), sizeof(struct rcu_tasks_percpu *), GFP_KERNEL);
250-
BUG_ON(!rtp->rtpcp_array);
251-
241+
if (lim > nr_cpu_ids)
242+
lim = nr_cpu_ids;
243+
shift = ilog2(nr_cpu_ids / lim);
244+
if (((nr_cpu_ids - 1) >> shift) >= lim)
245+
shift++;
246+
WRITE_ONCE(rtp->percpu_enqueue_shift, shift);
247+
WRITE_ONCE(rtp->percpu_dequeue_lim, lim);
248+
smp_store_release(&rtp->percpu_enqueue_lim, lim);
252249
for_each_possible_cpu(cpu) {
253250
struct rcu_tasks_percpu *rtpcp = per_cpu_ptr(rtp->rtpcpu, cpu);
254251

@@ -261,33 +258,16 @@ static void cblist_init_generic(struct rcu_tasks *rtp)
261258
INIT_WORK(&rtpcp->rtp_work, rcu_tasks_invoke_cbs_wq);
262259
rtpcp->cpu = cpu;
263260
rtpcp->rtpp = rtp;
264-
rtpcp->index = index;
265-
rtp->rtpcp_array[index] = rtpcp;
266-
index++;
267261
if (!rtpcp->rtp_blkd_tasks.next)
268262
INIT_LIST_HEAD(&rtpcp->rtp_blkd_tasks);
269263
raw_spin_unlock_rcu_node(rtpcp); // irqs remain disabled.
270-
maxcpu = cpu;
271264
}
272265
raw_spin_unlock_irqrestore(&rtp->cbs_gbl_lock, flags);
273266

274267
if (rcu_task_cb_adjust)
275268
pr_info("%s: Setting adjustable number of callback queues.\n", __func__);
276269

277-
rcu_task_cpu_ids = maxcpu + 1;
278-
if (lim > rcu_task_cpu_ids)
279-
lim = rcu_task_cpu_ids;
280-
shift = ilog2(rcu_task_cpu_ids / lim);
281-
if (((rcu_task_cpu_ids - 1) >> shift) >= lim)
282-
shift++;
283-
WRITE_ONCE(rtp->percpu_enqueue_shift, shift);
284-
WRITE_ONCE(rtp->percpu_dequeue_lim, lim);
285-
smp_store_release(&rtp->percpu_enqueue_lim, lim);
286-
287-
pr_info("%s: Setting shift to %d and lim to %d rcu_task_cb_adjust=%d rcu_task_cpu_ids=%d.\n",
288-
rtp->name, data_race(rtp->percpu_enqueue_shift), data_race(rtp->percpu_enqueue_lim),
289-
rcu_task_cb_adjust, rcu_task_cpu_ids);
290-
270+
pr_info("%s: Setting shift to %d and lim to %d.\n", __func__, data_race(rtp->percpu_enqueue_shift), data_race(rtp->percpu_enqueue_lim));
291271
}
292272

293273
// IRQ-work handler that does deferred wakeup for call_rcu_tasks_generic().
@@ -327,7 +307,7 @@ static void call_rcu_tasks_generic(struct rcu_head *rhp, rcu_callback_t func,
327307
rtpcp->rtp_n_lock_retries = 0;
328308
}
329309
if (rcu_task_cb_adjust && ++rtpcp->rtp_n_lock_retries > rcu_task_contend_lim &&
330-
READ_ONCE(rtp->percpu_enqueue_lim) != rcu_task_cpu_ids)
310+
READ_ONCE(rtp->percpu_enqueue_lim) != nr_cpu_ids)
331311
needadjust = true; // Defer adjustment to avoid deadlock.
332312
}
333313
if (!rcu_segcblist_is_enabled(&rtpcp->cblist)) {
@@ -340,10 +320,10 @@ static void call_rcu_tasks_generic(struct rcu_head *rhp, rcu_callback_t func,
340320
raw_spin_unlock_irqrestore_rcu_node(rtpcp, flags);
341321
if (unlikely(needadjust)) {
342322
raw_spin_lock_irqsave(&rtp->cbs_gbl_lock, flags);
343-
if (rtp->percpu_enqueue_lim != rcu_task_cpu_ids) {
323+
if (rtp->percpu_enqueue_lim != nr_cpu_ids) {
344324
WRITE_ONCE(rtp->percpu_enqueue_shift, 0);
345-
WRITE_ONCE(rtp->percpu_dequeue_lim, rcu_task_cpu_ids);
346-
smp_store_release(&rtp->percpu_enqueue_lim, rcu_task_cpu_ids);
325+
WRITE_ONCE(rtp->percpu_dequeue_lim, nr_cpu_ids);
326+
smp_store_release(&rtp->percpu_enqueue_lim, nr_cpu_ids);
347327
pr_info("Switching %s to per-CPU callback queuing.\n", rtp->name);
348328
}
349329
raw_spin_unlock_irqrestore(&rtp->cbs_gbl_lock, flags);
@@ -414,8 +394,6 @@ static int rcu_tasks_need_gpcb(struct rcu_tasks *rtp)
414394
int needgpcb = 0;
415395

416396
for (cpu = 0; cpu < smp_load_acquire(&rtp->percpu_dequeue_lim); cpu++) {
417-
if (!cpu_possible(cpu))
418-
continue;
419397
struct rcu_tasks_percpu *rtpcp = per_cpu_ptr(rtp->rtpcpu, cpu);
420398

421399
/* Advance and accelerate any new callbacks. */
@@ -448,7 +426,7 @@ static int rcu_tasks_need_gpcb(struct rcu_tasks *rtp)
448426
if (rcu_task_cb_adjust && ncbs <= rcu_task_collapse_lim) {
449427
raw_spin_lock_irqsave(&rtp->cbs_gbl_lock, flags);
450428
if (rtp->percpu_enqueue_lim > 1) {
451-
WRITE_ONCE(rtp->percpu_enqueue_shift, order_base_2(rcu_task_cpu_ids));
429+
WRITE_ONCE(rtp->percpu_enqueue_shift, order_base_2(nr_cpu_ids));
452430
smp_store_release(&rtp->percpu_enqueue_lim, 1);
453431
rtp->percpu_dequeue_gpseq = get_state_synchronize_rcu();
454432
gpdone = false;
@@ -463,9 +441,7 @@ static int rcu_tasks_need_gpcb(struct rcu_tasks *rtp)
463441
pr_info("Completing switch %s to CPU-0 callback queuing.\n", rtp->name);
464442
}
465443
if (rtp->percpu_dequeue_lim == 1) {
466-
for (cpu = rtp->percpu_dequeue_lim; cpu < rcu_task_cpu_ids; cpu++) {
467-
if (!cpu_possible(cpu))
468-
continue;
444+
for (cpu = rtp->percpu_dequeue_lim; cpu < nr_cpu_ids; cpu++) {
469445
struct rcu_tasks_percpu *rtpcp = per_cpu_ptr(rtp->rtpcpu, cpu);
470446

471447
WARN_ON_ONCE(rcu_segcblist_n_cbs(&rtpcp->cblist));
@@ -480,32 +456,30 @@ static int rcu_tasks_need_gpcb(struct rcu_tasks *rtp)
480456
// Advance callbacks and invoke any that are ready.
481457
static void rcu_tasks_invoke_cbs(struct rcu_tasks *rtp, struct rcu_tasks_percpu *rtpcp)
482458
{
459+
int cpu;
460+
int cpunext;
483461
int cpuwq;
484462
unsigned long flags;
485463
int len;
486-
int index;
487464
struct rcu_head *rhp;
488465
struct rcu_cblist rcl = RCU_CBLIST_INITIALIZER(rcl);
489466
struct rcu_tasks_percpu *rtpcp_next;
490467

491-
index = rtpcp->index * 2 + 1;
492-
if (index < num_possible_cpus()) {
493-
rtpcp_next = rtp->rtpcp_array[index];
494-
if (rtpcp_next->cpu < smp_load_acquire(&rtp->percpu_dequeue_lim)) {
495-
cpuwq = rcu_cpu_beenfullyonline(rtpcp_next->cpu) ? rtpcp_next->cpu : WORK_CPU_UNBOUND;
468+
cpu = rtpcp->cpu;
469+
cpunext = cpu * 2 + 1;
470+
if (cpunext < smp_load_acquire(&rtp->percpu_dequeue_lim)) {
471+
rtpcp_next = per_cpu_ptr(rtp->rtpcpu, cpunext);
472+
cpuwq = rcu_cpu_beenfullyonline(cpunext) ? cpunext : WORK_CPU_UNBOUND;
473+
queue_work_on(cpuwq, system_wq, &rtpcp_next->rtp_work);
474+
cpunext++;
475+
if (cpunext < smp_load_acquire(&rtp->percpu_dequeue_lim)) {
476+
rtpcp_next = per_cpu_ptr(rtp->rtpcpu, cpunext);
477+
cpuwq = rcu_cpu_beenfullyonline(cpunext) ? cpunext : WORK_CPU_UNBOUND;
496478
queue_work_on(cpuwq, system_wq, &rtpcp_next->rtp_work);
497-
index++;
498-
if (index < num_possible_cpus()) {
499-
rtpcp_next = rtp->rtpcp_array[index];
500-
if (rtpcp_next->cpu < smp_load_acquire(&rtp->percpu_dequeue_lim)) {
501-
cpuwq = rcu_cpu_beenfullyonline(rtpcp_next->cpu) ? rtpcp_next->cpu : WORK_CPU_UNBOUND;
502-
queue_work_on(cpuwq, system_wq, &rtpcp_next->rtp_work);
503-
}
504-
}
505479
}
506480
}
507481

508-
if (rcu_segcblist_empty(&rtpcp->cblist))
482+
if (rcu_segcblist_empty(&rtpcp->cblist) || !cpu_possible(cpu))
509483
return;
510484
raw_spin_lock_irqsave_rcu_node(rtpcp, flags);
511485
rcu_segcblist_advance(&rtpcp->cblist, rcu_seq_current(&rtp->tasks_gp_seq));

0 commit comments

Comments
 (0)