x86/asm: Move 'status' from thread_struct to thread_info
author: Andy Lutomirski <luto@kernel.org>
Sun, 28 Jan 2018 18:38:50 +0000 (10:38 -0800)
committer: Thomas Gleixner <tglx@linutronix.de>
Tue, 30 Jan 2018 14:30:36 +0000 (15:30 +0100)
The TS_COMPAT bit is very hot and is accessed from code paths that mostly
also touch thread_info::flags.  Move it into struct thread_info to improve
cache locality.

The only reason it was in thread_struct is that there was a brief period
during which arch-specific fields were not allowed in struct thread_info.

Linus suggested further changing:

  ti->status &= ~(TS_COMPAT|TS_I386_REGS_POKED);

to:

  if (unlikely(ti->status & (TS_COMPAT|TS_I386_REGS_POKED)))
          ti->status &= ~(TS_COMPAT|TS_I386_REGS_POKED);

on the theory that frequently dirtying the cacheline even in pure 64-bit
code that never needs to modify status hurts performance.  That could be a
reasonable followup patch, but I suspect it matters less on top of this
patch.

Suggested-by: Linus Torvalds <torvalds@linux-foundation.org>
Signed-off-by: Andy Lutomirski <luto@kernel.org>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Reviewed-by: Ingo Molnar <mingo@kernel.org>
Acked-by: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Kernel Hardening <kernel-hardening@lists.openwall.com>
Link: https://lkml.kernel.org/r/03148bcc1b217100e6e8ecf6a5468c45cf4304b6.1517164461.git.luto@kernel.org
arch/x86/entry/common.c
arch/x86/include/asm/processor.h
arch/x86/include/asm/syscall.h
arch/x86/include/asm/thread_info.h
arch/x86/kernel/process_64.c
arch/x86/kernel/ptrace.c
arch/x86/kernel/signal.c

index d7d3cc24baf4e5bf7c8f14e92aca44820eb8c463..99081340d19a83e147b0cb678bde5c0050214870 100644 (file)
@@ -206,7 +206,7 @@ __visible inline void prepare_exit_to_usermode(struct pt_regs *regs)
         * special case only applies after poking regs and before the
         * very next return to user mode.
         */
-       current->thread.status &= ~(TS_COMPAT|TS_I386_REGS_POKED);
+       ti->status &= ~(TS_COMPAT|TS_I386_REGS_POKED);
 #endif
 
        user_enter_irqoff();
@@ -304,7 +304,7 @@ static __always_inline void do_syscall_32_irqs_on(struct pt_regs *regs)
        unsigned int nr = (unsigned int)regs->orig_ax;
 
 #ifdef CONFIG_IA32_EMULATION
-       current->thread.status |= TS_COMPAT;
+       ti->status |= TS_COMPAT;
 #endif
 
        if (READ_ONCE(ti->flags) & _TIF_WORK_SYSCALL_ENTRY) {
index efbde088a71826fe0ae933084b3e831a2e45b10e..513f9604c1929dc8127d9c664f293b61b6d74d4b 100644 (file)
@@ -460,8 +460,6 @@ struct thread_struct {
        unsigned short          gsindex;
 #endif
 
-       u32                     status;         /* thread synchronous flags */
-
 #ifdef CONFIG_X86_64
        unsigned long           fsbase;
        unsigned long           gsbase;
index e3c95e8e61c5fca9808524ba47d539bd0377ece2..03eedc21246d5b65d39ffb45ce27c588151d7488 100644 (file)
@@ -60,7 +60,7 @@ static inline long syscall_get_error(struct task_struct *task,
         * TS_COMPAT is set for 32-bit syscall entries and then
         * remains set until we return to user mode.
         */
-       if (task->thread.status & (TS_COMPAT|TS_I386_REGS_POKED))
+       if (task->thread_info.status & (TS_COMPAT|TS_I386_REGS_POKED))
                /*
                 * Sign-extend the value so (int)-EFOO becomes (long)-EFOO
                 * and will match correctly in comparisons.
@@ -116,7 +116,7 @@ static inline void syscall_get_arguments(struct task_struct *task,
                                         unsigned long *args)
 {
 # ifdef CONFIG_IA32_EMULATION
-       if (task->thread.status & TS_COMPAT)
+       if (task->thread_info.status & TS_COMPAT)
                switch (i) {
                case 0:
                        if (!n--) break;
@@ -177,7 +177,7 @@ static inline void syscall_set_arguments(struct task_struct *task,
                                         const unsigned long *args)
 {
 # ifdef CONFIG_IA32_EMULATION
-       if (task->thread.status & TS_COMPAT)
+       if (task->thread_info.status & TS_COMPAT)
                switch (i) {
                case 0:
                        if (!n--) break;
index 00223333821a96616647a9cbb6fe729c4a18b7b6..eda3b6823ca4323d542f435854c658324ead17bd 100644 (file)
@@ -55,6 +55,7 @@ struct task_struct;
 
 struct thread_info {
        unsigned long           flags;          /* low level flags */
+       u32                     status;         /* thread synchronous flags */
 };
 
 #define INIT_THREAD_INFO(tsk)                  \
@@ -221,7 +222,7 @@ static inline int arch_within_stack_frames(const void * const stack,
 #define in_ia32_syscall() true
 #else
 #define in_ia32_syscall() (IS_ENABLED(CONFIG_IA32_EMULATION) && \
-                          current->thread.status & TS_COMPAT)
+                          current_thread_info()->status & TS_COMPAT)
 #endif
 
 /*
index c754662320163107ca3a254362ce0e404a8d3c11..9eb448c7859d2469ba63e6112f129bb2926c4bb0 100644 (file)
@@ -557,7 +557,7 @@ static void __set_personality_x32(void)
         * Pretend to come from a x32 execve.
         */
        task_pt_regs(current)->orig_ax = __NR_x32_execve | __X32_SYSCALL_BIT;
-       current->thread.status &= ~TS_COMPAT;
+       current_thread_info()->status &= ~TS_COMPAT;
 #endif
 }
 
@@ -571,7 +571,7 @@ static void __set_personality_ia32(void)
        current->personality |= force_personality32;
        /* Prepare the first "return" to user space */
        task_pt_regs(current)->orig_ax = __NR_ia32_execve;
-       current->thread.status |= TS_COMPAT;
+       current_thread_info()->status |= TS_COMPAT;
 #endif
 }
 
index f37d18124648fb9591779e50c878c4ffd51c51b1..ed5c4cdf0a348d6a0de34d1214298f12fd6f1ddb 100644 (file)
@@ -935,7 +935,7 @@ static int putreg32(struct task_struct *child, unsigned regno, u32 value)
                 */
                regs->orig_ax = value;
                if (syscall_get_nr(child, regs) >= 0)
-                       child->thread.status |= TS_I386_REGS_POKED;
+                       child->thread_info.status |= TS_I386_REGS_POKED;
                break;
 
        case offsetof(struct user32, regs.eflags):
index b9e00e8f1c9b63a92fa380fcb4fd12ef4acb9a29..4cdc0b27ec82fda92db3551f1e19bf70d88b25cb 100644 (file)
@@ -787,7 +787,7 @@ static inline unsigned long get_nr_restart_syscall(const struct pt_regs *regs)
         * than the tracee.
         */
 #ifdef CONFIG_IA32_EMULATION
-       if (current->thread.status & (TS_COMPAT|TS_I386_REGS_POKED))
+       if (current_thread_info()->status & (TS_COMPAT|TS_I386_REGS_POKED))
                return __NR_ia32_restart_syscall;
 #endif
 #ifdef CONFIG_X86_X32_ABI