Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux

percpu: Resolve ambiguities in __get_cpu_var/cpumask_var_t

__get_cpu_var can paper over differences in the definitions of
cpumask_var_t and either use the address of the cpumask variable
directly or perform a fetch of the address of the struct cpumask
allocated elsewhere. This is important particularly when using per cpu
cpumask_var_t declarations because in one case we have an offset into
a per cpu area to handle and in the other case we need to fetch a
pointer from the offset.

This patch introduces a new macro

this_cpu_cpumask_var_ptr()

that is defined where cpumask_var_t is defined and performs the proper
actions. All use cases where __get_cpu_var is used with cpumask_var_t
are converted to the use of this_cpu_cpumask_var_ptr().

Signed-off-by: Christoph Lameter <cl@linux.com>
Signed-off-by: Tejun Heo <tj@kernel.org>

authored by

Christoph Lameter and committed by
Tejun Heo
4ba29684 23f66e2d

+17 -7
+1 -1
arch/x86/include/asm/perf_event_p4.h
··· 189 189 { 190 190 #ifdef CONFIG_SMP 191 191 if (smp_num_siblings == 2) 192 - return cpu != cpumask_first(__get_cpu_var(cpu_sibling_map)); 192 + return cpu != cpumask_first(this_cpu_cpumask_var_ptr(cpu_sibling_map)); 193 193 #endif 194 194 return 0; 195 195 }
+1 -2
arch/x86/kernel/apic/x2apic_cluster.c
··· 42 42 * We are to modify mask, so we need an own copy 43 43 * and be sure it's manipulated with irq off. 44 44 */ 45 - ipi_mask_ptr = __raw_get_cpu_var(ipi_mask); 46 - cpumask_copy(ipi_mask_ptr, mask); 45 + ipi_mask_ptr = this_cpu_cpumask_var_ptr(ipi_mask); 47 46 48 47 /* 49 48 * The idea is to send one IPI per cluster.
+1 -1
arch/x86/oprofile/op_model_p4.c
··· 372 372 { 373 373 #ifdef CONFIG_SMP 374 374 int cpu = smp_processor_id(); 375 - return cpu != cpumask_first(__get_cpu_var(cpu_sibling_map)); 375 + return cpu != cpumask_first(this_cpu_cpumask_var_ptr(cpu_sibling_map)); 376 376 #endif 377 377 return 0; 378 378 }
+11
include/linux/cpumask.h
··· 666 666 * 667 667 * This code makes NR_CPUS length memcopy and brings to a memory corruption. 668 668 * cpumask_copy() provide safe copy functionality. 669 + * 670 + * Note that there is another evil here: If you define a cpumask_var_t 671 + * as a percpu variable then the way to obtain the address of the cpumask 672 + * structure differently influences what this_cpu_* operation needs to be 673 + * used. Please use this_cpu_cpumask_var_t in those cases. The direct use 674 + * of this_cpu_ptr() or this_cpu_read() will lead to failures when the 675 + * other type of cpumask_var_t implementation is configured. 669 676 */ 670 677 #ifdef CONFIG_CPUMASK_OFFSTACK 671 678 typedef struct cpumask *cpumask_var_t; 679 + 680 + #define this_cpu_cpumask_var_ptr(x) this_cpu_read(x) 672 681 673 682 bool alloc_cpumask_var_node(cpumask_var_t *mask, gfp_t flags, int node); 674 683 bool alloc_cpumask_var(cpumask_var_t *mask, gfp_t flags); ··· 689 680 690 681 #else 691 682 typedef struct cpumask cpumask_var_t[1]; 683 + 684 + #define this_cpu_cpumask_var_ptr(x) this_cpu_ptr(x) 692 685 693 686 static inline bool alloc_cpumask_var(cpumask_var_t *mask, gfp_t flags) 694 687 {
+1 -1
kernel/sched/deadline.c
··· 1158 1158 static int find_later_rq(struct task_struct *task) 1159 1159 { 1160 1160 struct sched_domain *sd; 1161 - struct cpumask *later_mask = __get_cpu_var(local_cpu_mask_dl); 1161 + struct cpumask *later_mask = this_cpu_cpumask_var_ptr(local_cpu_mask_dl); 1162 1162 int this_cpu = smp_processor_id(); 1163 1163 int best_cpu, cpu = task_cpu(task); 1164 1164
+1 -1
kernel/sched/fair.c
··· 6539 6539 struct sched_group *group; 6540 6540 struct rq *busiest; 6541 6541 unsigned long flags; 6542 - struct cpumask *cpus = __get_cpu_var(load_balance_mask); 6542 + struct cpumask *cpus = this_cpu_cpumask_var_ptr(load_balance_mask); 6543 6543 6544 6544 struct lb_env env = { 6545 6545 .sd = sd,
+1 -1
kernel/sched/rt.c
··· 1526 1526 static int find_lowest_rq(struct task_struct *task) 1527 1527 { 1528 1528 struct sched_domain *sd; 1529 - struct cpumask *lowest_mask = __get_cpu_var(local_cpu_mask); 1529 + struct cpumask *lowest_mask = this_cpu_cpumask_var_ptr(local_cpu_mask); 1530 1530 int this_cpu = smp_processor_id(); 1531 1531 int cpu = task_cpu(task); 1532 1532