mirror of
https://github.com/edk2-porting/linux-next.git
synced 2025-01-11 15:14:03 +08:00
5f409e20b7
Defer loading of FPU state until return to userspace. This gives the kernel the potential to skip loading FPU state for tasks that stay in kernel mode, or for tasks that end up with repeated invocations of kernel_fpu_begin() & kernel_fpu_end(). The fpregs_lock/unlock() section ensures that the registers remain unchanged. Otherwise a context switch or a bottom half could save the registers to its FPU context and the processor's FPU registers would became random if modified at the same time. KVM swaps the host/guest registers on entry/exit path. This flow has been kept as is. First it ensures that the registers are loaded and then saves the current (host) state before it loads the guest's registers. The swap is done at the very end with disabled interrupts so it should not change anymore before theg guest is entered. The read/save version seems to be cheaper compared to memcpy() in a micro benchmark. Each thread gets TIF_NEED_FPU_LOAD set as part of fork() / fpu__copy(). For kernel threads, this flag gets never cleared which avoids saving / restoring the FPU state for kernel threads and during in-kernel usage of the FPU registers. [ bp: Correct and update commit message and fix checkpatch warnings. s/register/registers/ where it is used in plural. minor comment corrections. remove unused trace_x86_fpu_activate_state() TP. ] Signed-off-by: Rik van Riel <riel@surriel.com> Signed-off-by: Sebastian Andrzej Siewior <bigeasy@linutronix.de> Signed-off-by: Borislav Petkov <bp@suse.de> Reviewed-by: Dave Hansen <dave.hansen@intel.com> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Cc: Andy Lutomirski <luto@kernel.org> Cc: Aubrey Li <aubrey.li@intel.com> Cc: Babu Moger <Babu.Moger@amd.com> Cc: "Chang S. Bae" <chang.seok.bae@intel.com> Cc: Dmitry Safonov <dima@arista.com> Cc: "H. Peter Anvin" <hpa@zytor.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Jann Horn <jannh@google.com> Cc: "Jason A. Donenfeld" <Jason@zx2c4.com> Cc: Joerg Roedel <jroedel@suse.de> Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com> Cc: kvm ML <kvm@vger.kernel.org> Cc: Nicolai Stange <nstange@suse.de> Cc: Paolo Bonzini <pbonzini@redhat.com> Cc: "Radim Krčmář" <rkrcmar@redhat.com> Cc: Tim Chen <tim.c.chen@linux.intel.com> Cc: Waiman Long <longman@redhat.com> Cc: x86-ml <x86@kernel.org> Cc: Yi Wang <wang.yi59@zte.com.cn> Link: https://lkml.kernel.org/r/20190403164156.19645-24-bigeasy@linutronix.de
100 lines
2.0 KiB
C
100 lines
2.0 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#undef TRACE_SYSTEM
|
|
#define TRACE_SYSTEM x86_fpu
|
|
|
|
#if !defined(_TRACE_FPU_H) || defined(TRACE_HEADER_MULTI_READ)
|
|
#define _TRACE_FPU_H
|
|
|
|
#include <linux/tracepoint.h>
|
|
|
|
DECLARE_EVENT_CLASS(x86_fpu,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(struct fpu *, fpu)
|
|
__field(bool, load_fpu)
|
|
__field(u64, xfeatures)
|
|
__field(u64, xcomp_bv)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->fpu = fpu;
|
|
__entry->load_fpu = test_thread_flag(TIF_NEED_FPU_LOAD);
|
|
if (boot_cpu_has(X86_FEATURE_OSXSAVE)) {
|
|
__entry->xfeatures = fpu->state.xsave.header.xfeatures;
|
|
__entry->xcomp_bv = fpu->state.xsave.header.xcomp_bv;
|
|
}
|
|
),
|
|
TP_printk("x86/fpu: %p load: %d xfeatures: %llx xcomp_bv: %llx",
|
|
__entry->fpu,
|
|
__entry->load_fpu,
|
|
__entry->xfeatures,
|
|
__entry->xcomp_bv
|
|
)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_before_save,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_after_save,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_before_restore,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_after_restore,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_regs_activated,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_regs_deactivated,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_init_state,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_dropped,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_copy_src,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_copy_dst,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
DEFINE_EVENT(x86_fpu, x86_fpu_xstate_check_failed,
|
|
TP_PROTO(struct fpu *fpu),
|
|
TP_ARGS(fpu)
|
|
);
|
|
|
|
#undef TRACE_INCLUDE_PATH
|
|
#define TRACE_INCLUDE_PATH asm/trace/
|
|
#undef TRACE_INCLUDE_FILE
|
|
#define TRACE_INCLUDE_FILE fpu
|
|
#endif /* _TRACE_FPU_H */
|
|
|
|
/* This part must be outside protection */
|
|
#include <trace/define_trace.h>
|