x86: merge 64 and 32 SMP percpu handling
Now that pda is allocated as part of percpu, percpu doesn't need to be accessed through pda. Unify x86_64 SMP percpu access with x86_32 SMP one. Other than the segment register, operand size and the base of percpu symbols, they behave identical now. This patch replaces now unnecessary pda->data_offset with a dummy field which is necessary to keep stack_canary at its place. This patch also moves per_cpu_offset initialization out of init_gdt() into setup_per_cpu_areas(). Note that this change also necessitates explicit per_cpu_offset initializations in voyager_smp.c. With this change, x86_OP_percpu()'s are as efficient on x86_64 as on x86_32 and also x86_64 can use assembly PER_CPU macros. Signed-off-by: Tejun Heo <tj@kernel.org> Signed-off-by: Ingo Molnar <mingo@elte.hu>
This commit is contained in:
@@ -11,8 +11,7 @@
|
|||||||
/* Per processor datastructure. %gs points to it while the kernel runs */
|
/* Per processor datastructure. %gs points to it while the kernel runs */
|
||||||
struct x8664_pda {
|
struct x8664_pda {
|
||||||
struct task_struct *pcurrent; /* 0 Current process */
|
struct task_struct *pcurrent; /* 0 Current process */
|
||||||
unsigned long data_offset; /* 8 Per cpu data offset from linker
|
unsigned long dummy;
|
||||||
address */
|
|
||||||
unsigned long kernelstack; /* 16 top of kernel stack for current */
|
unsigned long kernelstack; /* 16 top of kernel stack for current */
|
||||||
unsigned long oldrsp; /* 24 user rsp for system call */
|
unsigned long oldrsp; /* 24 user rsp for system call */
|
||||||
int irqcount; /* 32 Irq nesting counter. Starts -1 */
|
int irqcount; /* 32 Irq nesting counter. Starts -1 */
|
||||||
|
@@ -1,62 +1,13 @@
|
|||||||
#ifndef _ASM_X86_PERCPU_H
|
#ifndef _ASM_X86_PERCPU_H
|
||||||
#define _ASM_X86_PERCPU_H
|
#define _ASM_X86_PERCPU_H
|
||||||
|
|
||||||
#ifndef __ASSEMBLY__
|
|
||||||
#ifdef CONFIG_X86_64
|
#ifdef CONFIG_X86_64
|
||||||
extern void load_pda_offset(int cpu);
|
#define __percpu_seg gs
|
||||||
|
#define __percpu_mov_op movq
|
||||||
#else
|
#else
|
||||||
static inline void load_pda_offset(int cpu) { }
|
#define __percpu_seg fs
|
||||||
|
#define __percpu_mov_op movl
|
||||||
#endif
|
#endif
|
||||||
#endif
|
|
||||||
|
|
||||||
#ifdef CONFIG_X86_64
|
|
||||||
#include <linux/compiler.h>
|
|
||||||
|
|
||||||
/* Same as asm-generic/percpu.h, except that we store the per cpu offset
|
|
||||||
in the PDA. Longer term the PDA and every per cpu variable
|
|
||||||
should be just put into a single section and referenced directly
|
|
||||||
from %gs */
|
|
||||||
|
|
||||||
#ifdef CONFIG_SMP
|
|
||||||
#include <asm/pda.h>
|
|
||||||
|
|
||||||
#define __per_cpu_offset(cpu) (cpu_pda(cpu)->data_offset)
|
|
||||||
#define __my_cpu_offset read_pda(data_offset)
|
|
||||||
|
|
||||||
#define per_cpu_offset(x) (__per_cpu_offset(x))
|
|
||||||
|
|
||||||
#endif
|
|
||||||
#include <asm-generic/percpu.h>
|
|
||||||
|
|
||||||
DECLARE_PER_CPU(struct x8664_pda, pda);
|
|
||||||
|
|
||||||
/*
|
|
||||||
* These are supposed to be implemented as a single instruction which
|
|
||||||
* operates on the per-cpu data base segment. x86-64 doesn't have
|
|
||||||
* that yet, so this is a fairly inefficient workaround for the
|
|
||||||
* meantime. The single instruction is atomic with respect to
|
|
||||||
* preemption and interrupts, so we need to explicitly disable
|
|
||||||
* interrupts here to achieve the same effect. However, because it
|
|
||||||
* can be used from within interrupt-disable/enable, we can't actually
|
|
||||||
* disable interrupts; disabling preemption is enough.
|
|
||||||
*/
|
|
||||||
#define x86_read_percpu(var) \
|
|
||||||
({ \
|
|
||||||
typeof(per_cpu_var(var)) __tmp; \
|
|
||||||
preempt_disable(); \
|
|
||||||
__tmp = __get_cpu_var(var); \
|
|
||||||
preempt_enable(); \
|
|
||||||
__tmp; \
|
|
||||||
})
|
|
||||||
|
|
||||||
#define x86_write_percpu(var, val) \
|
|
||||||
do { \
|
|
||||||
preempt_disable(); \
|
|
||||||
__get_cpu_var(var) = (val); \
|
|
||||||
preempt_enable(); \
|
|
||||||
} while(0)
|
|
||||||
|
|
||||||
#else /* CONFIG_X86_64 */
|
|
||||||
|
|
||||||
#ifdef __ASSEMBLY__
|
#ifdef __ASSEMBLY__
|
||||||
|
|
||||||
@@ -73,42 +24,26 @@ DECLARE_PER_CPU(struct x8664_pda, pda);
|
|||||||
* PER_CPU(cpu_gdt_descr, %ebx)
|
* PER_CPU(cpu_gdt_descr, %ebx)
|
||||||
*/
|
*/
|
||||||
#ifdef CONFIG_SMP
|
#ifdef CONFIG_SMP
|
||||||
#define PER_CPU(var, reg) \
|
#define PER_CPU(var, reg) \
|
||||||
movl %fs:per_cpu__##this_cpu_off, reg; \
|
__percpu_mov_op %__percpu_seg:per_cpu__this_cpu_off, reg; \
|
||||||
lea per_cpu__##var(reg), reg
|
lea per_cpu__##var(reg), reg
|
||||||
#define PER_CPU_VAR(var) %fs:per_cpu__##var
|
#define PER_CPU_VAR(var) %__percpu_seg:per_cpu__##var
|
||||||
#else /* ! SMP */
|
#else /* ! SMP */
|
||||||
#define PER_CPU(var, reg) \
|
#define PER_CPU(var, reg) \
|
||||||
movl $per_cpu__##var, reg
|
__percpu_mov_op $per_cpu__##var, reg
|
||||||
#define PER_CPU_VAR(var) per_cpu__##var
|
#define PER_CPU_VAR(var) per_cpu__##var
|
||||||
#endif /* SMP */
|
#endif /* SMP */
|
||||||
|
|
||||||
#else /* ...!ASSEMBLY */
|
#else /* ...!ASSEMBLY */
|
||||||
|
|
||||||
/*
|
#include <linux/stringify.h>
|
||||||
* PER_CPU finds an address of a per-cpu variable.
|
|
||||||
*
|
|
||||||
* Args:
|
|
||||||
* var - variable name
|
|
||||||
* cpu - 32bit register containing the current CPU number
|
|
||||||
*
|
|
||||||
* The resulting address is stored in the "cpu" argument.
|
|
||||||
*
|
|
||||||
* Example:
|
|
||||||
* PER_CPU(cpu_gdt_descr, %ebx)
|
|
||||||
*/
|
|
||||||
#ifdef CONFIG_SMP
|
#ifdef CONFIG_SMP
|
||||||
|
#define __percpu_seg_str "%%"__stringify(__percpu_seg)":"
|
||||||
#define __my_cpu_offset x86_read_percpu(this_cpu_off)
|
#define __my_cpu_offset x86_read_percpu(this_cpu_off)
|
||||||
|
#else
|
||||||
/* fs segment starts at (positive) offset == __per_cpu_offset[cpu] */
|
#define __percpu_seg_str
|
||||||
#define __percpu_seg "%%fs:"
|
#endif
|
||||||
|
|
||||||
#else /* !SMP */
|
|
||||||
|
|
||||||
#define __percpu_seg ""
|
|
||||||
|
|
||||||
#endif /* SMP */
|
|
||||||
|
|
||||||
#include <asm-generic/percpu.h>
|
#include <asm-generic/percpu.h>
|
||||||
|
|
||||||
@@ -128,20 +63,25 @@ do { \
|
|||||||
} \
|
} \
|
||||||
switch (sizeof(var)) { \
|
switch (sizeof(var)) { \
|
||||||
case 1: \
|
case 1: \
|
||||||
asm(op "b %1,"__percpu_seg"%0" \
|
asm(op "b %1,"__percpu_seg_str"%0" \
|
||||||
: "+m" (var) \
|
: "+m" (var) \
|
||||||
: "ri" ((T__)val)); \
|
: "ri" ((T__)val)); \
|
||||||
break; \
|
break; \
|
||||||
case 2: \
|
case 2: \
|
||||||
asm(op "w %1,"__percpu_seg"%0" \
|
asm(op "w %1,"__percpu_seg_str"%0" \
|
||||||
: "+m" (var) \
|
: "+m" (var) \
|
||||||
: "ri" ((T__)val)); \
|
: "ri" ((T__)val)); \
|
||||||
break; \
|
break; \
|
||||||
case 4: \
|
case 4: \
|
||||||
asm(op "l %1,"__percpu_seg"%0" \
|
asm(op "l %1,"__percpu_seg_str"%0" \
|
||||||
: "+m" (var) \
|
: "+m" (var) \
|
||||||
: "ri" ((T__)val)); \
|
: "ri" ((T__)val)); \
|
||||||
break; \
|
break; \
|
||||||
|
case 8: \
|
||||||
|
asm(op "q %1,"__percpu_seg_str"%0" \
|
||||||
|
: "+m" (var) \
|
||||||
|
: "r" ((T__)val)); \
|
||||||
|
break; \
|
||||||
default: __bad_percpu_size(); \
|
default: __bad_percpu_size(); \
|
||||||
} \
|
} \
|
||||||
} while (0)
|
} while (0)
|
||||||
@@ -151,17 +91,22 @@ do { \
|
|||||||
typeof(var) ret__; \
|
typeof(var) ret__; \
|
||||||
switch (sizeof(var)) { \
|
switch (sizeof(var)) { \
|
||||||
case 1: \
|
case 1: \
|
||||||
asm(op "b "__percpu_seg"%1,%0" \
|
asm(op "b "__percpu_seg_str"%1,%0" \
|
||||||
: "=r" (ret__) \
|
: "=r" (ret__) \
|
||||||
: "m" (var)); \
|
: "m" (var)); \
|
||||||
break; \
|
break; \
|
||||||
case 2: \
|
case 2: \
|
||||||
asm(op "w "__percpu_seg"%1,%0" \
|
asm(op "w "__percpu_seg_str"%1,%0" \
|
||||||
: "=r" (ret__) \
|
: "=r" (ret__) \
|
||||||
: "m" (var)); \
|
: "m" (var)); \
|
||||||
break; \
|
break; \
|
||||||
case 4: \
|
case 4: \
|
||||||
asm(op "l "__percpu_seg"%1,%0" \
|
asm(op "l "__percpu_seg_str"%1,%0" \
|
||||||
|
: "=r" (ret__) \
|
||||||
|
: "m" (var)); \
|
||||||
|
break; \
|
||||||
|
case 8: \
|
||||||
|
asm(op "q "__percpu_seg_str"%1,%0" \
|
||||||
: "=r" (ret__) \
|
: "=r" (ret__) \
|
||||||
: "m" (var)); \
|
: "m" (var)); \
|
||||||
break; \
|
break; \
|
||||||
@@ -175,8 +120,14 @@ do { \
|
|||||||
#define x86_add_percpu(var, val) percpu_to_op("add", per_cpu__##var, val)
|
#define x86_add_percpu(var, val) percpu_to_op("add", per_cpu__##var, val)
|
||||||
#define x86_sub_percpu(var, val) percpu_to_op("sub", per_cpu__##var, val)
|
#define x86_sub_percpu(var, val) percpu_to_op("sub", per_cpu__##var, val)
|
||||||
#define x86_or_percpu(var, val) percpu_to_op("or", per_cpu__##var, val)
|
#define x86_or_percpu(var, val) percpu_to_op("or", per_cpu__##var, val)
|
||||||
|
|
||||||
|
#ifdef CONFIG_X86_64
|
||||||
|
extern void load_pda_offset(int cpu);
|
||||||
|
#else
|
||||||
|
static inline void load_pda_offset(int cpu) { }
|
||||||
|
#endif
|
||||||
|
|
||||||
#endif /* !__ASSEMBLY__ */
|
#endif /* !__ASSEMBLY__ */
|
||||||
#endif /* !CONFIG_X86_64 */
|
|
||||||
|
|
||||||
#ifdef CONFIG_SMP
|
#ifdef CONFIG_SMP
|
||||||
|
|
||||||
|
@@ -55,7 +55,6 @@ int main(void)
|
|||||||
ENTRY(irqcount);
|
ENTRY(irqcount);
|
||||||
ENTRY(cpunumber);
|
ENTRY(cpunumber);
|
||||||
ENTRY(irqstackptr);
|
ENTRY(irqstackptr);
|
||||||
ENTRY(data_offset);
|
|
||||||
DEFINE(pda_size, sizeof(struct x8664_pda));
|
DEFINE(pda_size, sizeof(struct x8664_pda));
|
||||||
BLANK();
|
BLANK();
|
||||||
#undef ENTRY
|
#undef ENTRY
|
||||||
|
@@ -52,6 +52,7 @@
|
|||||||
#include <asm/irqflags.h>
|
#include <asm/irqflags.h>
|
||||||
#include <asm/paravirt.h>
|
#include <asm/paravirt.h>
|
||||||
#include <asm/ftrace.h>
|
#include <asm/ftrace.h>
|
||||||
|
#include <asm/percpu.h>
|
||||||
|
|
||||||
/* Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this. */
|
/* Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this. */
|
||||||
#include <linux/elf-em.h>
|
#include <linux/elf-em.h>
|
||||||
@@ -1072,10 +1073,10 @@ ENTRY(\sym)
|
|||||||
TRACE_IRQS_OFF
|
TRACE_IRQS_OFF
|
||||||
movq %rsp,%rdi /* pt_regs pointer */
|
movq %rsp,%rdi /* pt_regs pointer */
|
||||||
xorl %esi,%esi /* no error code */
|
xorl %esi,%esi /* no error code */
|
||||||
movq %gs:pda_data_offset, %rbp
|
PER_CPU(init_tss, %rbp)
|
||||||
subq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
|
subq $EXCEPTION_STKSZ, TSS_ist + (\ist - 1) * 8(%rbp)
|
||||||
call \do_sym
|
call \do_sym
|
||||||
addq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
|
addq $EXCEPTION_STKSZ, TSS_ist + (\ist - 1) * 8(%rbp)
|
||||||
jmp paranoid_exit /* %ebx: no swapgs flag */
|
jmp paranoid_exit /* %ebx: no swapgs flag */
|
||||||
CFI_ENDPROC
|
CFI_ENDPROC
|
||||||
END(\sym)
|
END(\sym)
|
||||||
|
@@ -38,8 +38,6 @@ void __init x86_64_init_pda(void)
|
|||||||
#else
|
#else
|
||||||
cpu_pda(0) = &_boot_cpu_pda;
|
cpu_pda(0) = &_boot_cpu_pda;
|
||||||
#endif
|
#endif
|
||||||
cpu_pda(0)->data_offset =
|
|
||||||
(unsigned long)(__per_cpu_load - __per_cpu_start);
|
|
||||||
pda_init(0);
|
pda_init(0);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@@ -125,14 +125,14 @@ static void __init setup_per_cpu_maps(void)
|
|||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef CONFIG_X86_32
|
#ifdef CONFIG_X86_64
|
||||||
/*
|
unsigned long __per_cpu_offset[NR_CPUS] __read_mostly = {
|
||||||
* Great future not-so-futuristic plan: make i386 and x86_64 do it
|
[0] = (unsigned long)__per_cpu_load,
|
||||||
* the same way
|
};
|
||||||
*/
|
#else
|
||||||
unsigned long __per_cpu_offset[NR_CPUS] __read_mostly;
|
unsigned long __per_cpu_offset[NR_CPUS] __read_mostly;
|
||||||
EXPORT_SYMBOL(__per_cpu_offset);
|
|
||||||
#endif
|
#endif
|
||||||
|
EXPORT_SYMBOL(__per_cpu_offset);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Great future plan:
|
* Great future plan:
|
||||||
@@ -178,6 +178,7 @@ void __init setup_per_cpu_areas(void)
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
memcpy(ptr, __per_cpu_load, __per_cpu_end - __per_cpu_start);
|
memcpy(ptr, __per_cpu_load, __per_cpu_end - __per_cpu_start);
|
||||||
|
per_cpu_offset(cpu) = ptr - __per_cpu_start;
|
||||||
#ifdef CONFIG_X86_64
|
#ifdef CONFIG_X86_64
|
||||||
cpu_pda(cpu) = (void *)ptr;
|
cpu_pda(cpu) = (void *)ptr;
|
||||||
|
|
||||||
@@ -190,7 +191,7 @@ void __init setup_per_cpu_areas(void)
|
|||||||
else
|
else
|
||||||
memset(cpu_pda(cpu), 0, sizeof(*cpu_pda(cpu)));
|
memset(cpu_pda(cpu), 0, sizeof(*cpu_pda(cpu)));
|
||||||
#endif
|
#endif
|
||||||
per_cpu_offset(cpu) = ptr - __per_cpu_start;
|
per_cpu(this_cpu_off, cpu) = per_cpu_offset(cpu);
|
||||||
|
|
||||||
DBG("PERCPU: cpu %4d %p\n", cpu, ptr);
|
DBG("PERCPU: cpu %4d %p\n", cpu, ptr);
|
||||||
}
|
}
|
||||||
|
@@ -4,10 +4,10 @@
|
|||||||
#include <linux/module.h>
|
#include <linux/module.h>
|
||||||
#include <asm/smp.h>
|
#include <asm/smp.h>
|
||||||
|
|
||||||
#ifdef CONFIG_X86_32
|
|
||||||
DEFINE_PER_CPU(unsigned long, this_cpu_off);
|
DEFINE_PER_CPU(unsigned long, this_cpu_off);
|
||||||
EXPORT_PER_CPU_SYMBOL(this_cpu_off);
|
EXPORT_PER_CPU_SYMBOL(this_cpu_off);
|
||||||
|
|
||||||
|
#ifdef CONFIG_X86_32
|
||||||
/*
|
/*
|
||||||
* Initialize the CPU's GDT. This is either the boot CPU doing itself
|
* Initialize the CPU's GDT. This is either the boot CPU doing itself
|
||||||
* (still using the master per-cpu area), or a CPU doing it for a
|
* (still using the master per-cpu area), or a CPU doing it for a
|
||||||
@@ -24,7 +24,6 @@ __cpuinit void init_gdt(int cpu)
|
|||||||
write_gdt_entry(get_cpu_gdt_table(cpu),
|
write_gdt_entry(get_cpu_gdt_table(cpu),
|
||||||
GDT_ENTRY_PERCPU, &gdt, DESCTYPE_S);
|
GDT_ENTRY_PERCPU, &gdt, DESCTYPE_S);
|
||||||
|
|
||||||
per_cpu(this_cpu_off, cpu) = __per_cpu_offset[cpu];
|
|
||||||
per_cpu(cpu_number, cpu) = cpu;
|
per_cpu(cpu_number, cpu) = cpu;
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
@@ -531,6 +531,7 @@ static void __init do_boot_cpu(__u8 cpu)
|
|||||||
stack_start.sp = (void *)idle->thread.sp;
|
stack_start.sp = (void *)idle->thread.sp;
|
||||||
|
|
||||||
init_gdt(cpu);
|
init_gdt(cpu);
|
||||||
|
per_cpu(this_cpu_off, cpu) = __per_cpu_offset[cpu];
|
||||||
per_cpu(current_task, cpu) = idle;
|
per_cpu(current_task, cpu) = idle;
|
||||||
early_gdt_descr.address = (unsigned long)get_cpu_gdt_table(cpu);
|
early_gdt_descr.address = (unsigned long)get_cpu_gdt_table(cpu);
|
||||||
irq_ctx_init(cpu);
|
irq_ctx_init(cpu);
|
||||||
@@ -1748,6 +1749,7 @@ static void __init voyager_smp_prepare_cpus(unsigned int max_cpus)
|
|||||||
static void __cpuinit voyager_smp_prepare_boot_cpu(void)
|
static void __cpuinit voyager_smp_prepare_boot_cpu(void)
|
||||||
{
|
{
|
||||||
init_gdt(smp_processor_id());
|
init_gdt(smp_processor_id());
|
||||||
|
per_cpu(this_cpu_off, cpu) = __per_cpu_offset[cpu];
|
||||||
switch_to_new_gdt();
|
switch_to_new_gdt();
|
||||||
|
|
||||||
cpu_set(smp_processor_id(), cpu_online_map);
|
cpu_set(smp_processor_id(), cpu_online_map);
|
||||||
|
Reference in New Issue
Block a user