linux-arm-kernel.lists.infradead.org archive mirror
 help / color / mirror / Atom feed
From: liuj97@gmail.com (Jiang Liu)
To: linux-arm-kernel@lists.infradead.org
Subject: [RFT PATCH v1 6/7] arm64: avoid saving and restoring FPSIMD registers until threads access them
Date: Fri, 27 Sep 2013 16:04:46 +0800	[thread overview]
Message-ID: <1380269087-8520-7-git-send-email-liuj97@gmail.com> (raw)
In-Reply-To: <1380269087-8520-1-git-send-email-liuj97@gmail.com>

From: Jiang Liu <jiang.liu@huawei.com>

Use the PF_USED_MATH flag to mark whether the thread has accessed any FPSIMD
registers, so we can avoid saving and restoring FPSIMD registers until
threads access them. This may improve performance when lazy FPSIMD restore
is disabled.

Signed-off-by: Jiang Liu <jiang.liu@huawei.com>
Cc: Jiang Liu <liuj97@gmail.com>
---
 arch/arm64/kernel/fpsimd.c | 38 +++++++++++++++++++++++---------------
 1 file changed, 23 insertions(+), 15 deletions(-)

diff --git a/arch/arm64/kernel/fpsimd.c b/arch/arm64/kernel/fpsimd.c
index 267e54a..a81af5f 100644
--- a/arch/arm64/kernel/fpsimd.c
+++ b/arch/arm64/kernel/fpsimd.c
@@ -99,7 +99,8 @@ void fpsimd_disable_lazy_restore(void)
  * If lazy mode is enabled, caller needs to disable preemption
  * when calling fpsimd_load_state_lazy() and fpsimd_save_state_lazy().
  */
-static void fpsimd_load_state_lazy(struct fpsimd_state *state)
+static void fpsimd_load_state_lazy(struct fpsimd_state *state,
+				   struct task_struct *tsk)
 {
 	/* Could we reuse the hardware context? */
 	if (state->last_cpu == smp_processor_id() &&
@@ -109,13 +110,19 @@ static void fpsimd_load_state_lazy(struct fpsimd_state *state)
 	if (static_key_false(&fpsimd_lazy_mode)) {
 		fpsimd_clear_on_hw(state);
 		fpsimd_enable_trap();
-	} else {
+	} else if (tsk_used_math(tsk)) {
+		fpsimd_disable_trap();
 		fpsimd_load_state(state);
+	} else {
+		fpsimd_enable_trap();
 	}
 }
 
 static void fpsimd_save_state_lazy(struct fpsimd_state *state)
 {
+	if (!used_math())
+		return;
+
 	if (static_key_false(&fpsimd_lazy_mode)) {
 		if (!fpsimd_is_on_hw(state))
 			return;
@@ -133,12 +140,14 @@ void do_fpsimd_acc(unsigned int esr, struct pt_regs *regs)
 {
 	struct fpsimd_state *state = &current->thread.fpsimd_state;
 
+	fpsimd_disable_trap();
+	fpsimd_load_state(state);
 	if (static_key_false(&fpsimd_lazy_mode)) {
-		fpsimd_disable_trap();
-		fpsimd_load_state(state);
 		fpsimd_set_on_hw(state);
+		if (!used_math())
+			set_used_math();
 	} else {
-		WARN_ON(1);
+		set_used_math();
 	}
 }
 
@@ -175,7 +184,7 @@ void fpsimd_thread_switch(struct task_struct *next)
 	if (current->mm)
 		fpsimd_save_state_lazy(&current->thread.fpsimd_state);
 	if (next->mm)
-		fpsimd_load_state_lazy(&next->thread.fpsimd_state);
+		fpsimd_load_state_lazy(&next->thread.fpsimd_state, next);
 }
 
 void fpsimd_flush_thread(void)
@@ -187,8 +196,9 @@ void fpsimd_flush_thread(void)
 #if (AARCH64_FPCR_DEFAULT_VAL != 0)
 	state->fpcr = AARCH64_FPCR_DEFAULT_VAL;
 #endif
+	clear_used_math();
 	fpsimd_set_last_cpu(state, -1);
-	fpsimd_load_state_lazy(state);
+	fpsimd_load_state_lazy(state, current);
 	preempt_enable();
 }
 
@@ -205,7 +215,7 @@ void fpsimd_dup_state(struct fpsimd_state *src, struct fpsimd_state *dst)
 			fpsimd_save_state(dst);
 		fpsimd_clear_on_hw(dst);
 		preempt_enable();
-	} else {
+	} else if (used_math()) {
 		fpsimd_save_state(dst);
 	}
 	fpsimd_set_last_cpu(dst, -1);
@@ -226,12 +236,12 @@ void fpsimd_prepare_sigctx(struct fpsimd_state *ctx)
 		preempt_disable();
 		if (fpsimd_is_on_hw(ctx)) {
 			fpsimd_init_hw_state();
-		} else {
+		} else if (used_math()) {
 			ctx->fpsr = 0;
 			ctx->fpcr = AARCH64_FPCR_DEFAULT_VAL;
 		}
 		preempt_enable();
-	} else {
+	} else if (used_math()) {
 		fpsimd_init_hw_state();
 	}
 }
@@ -243,7 +253,7 @@ void fpsimd_restore_sigctx(struct fpsimd_state *ctx)
 	preempt_disable();
 	*state = *ctx;
 	__this_cpu_write(fpsimd_owner, NULL);
-	fpsimd_load_state_lazy(state);
+	fpsimd_load_state_lazy(state, current);
 	preempt_enable();
 }
 
@@ -261,9 +271,7 @@ void kernel_neon_begin(void)
 	if (current->mm)
 		fpsimd_save_state_lazy(&current->thread.fpsimd_state);
 
-	if (static_key_false(&fpsimd_lazy_mode))
-		fpsimd_disable_trap();
-
+	fpsimd_disable_trap();
 	fpsimd_init_hw_state();
 	__this_cpu_write(fpsimd_owner, NULL);
 }
@@ -272,7 +280,7 @@ EXPORT_SYMBOL(kernel_neon_begin);
 void kernel_neon_end(void)
 {
 	if (current->mm)
-		fpsimd_load_state_lazy(&current->thread.fpsimd_state);
+		fpsimd_load_state_lazy(&current->thread.fpsimd_state, current);
 
 	preempt_enable();
 }
-- 
1.8.1.2

  parent reply	other threads:[~2013-09-27  8:04 UTC|newest]

Thread overview: 18+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2013-09-27  8:04 [RFT PATCH v1 0/7] enable FPSIMD lazy save and restore for arm64 Jiang Liu
2013-09-27  8:04 ` [RFT PATCH v1 1/7] arm64: fix possible invalid FPSIMD initialization state Jiang Liu
2013-09-27 10:59   ` Catalin Marinas
2013-09-27  8:04 ` [RFT PATCH v1 2/7] arm64: restore FPSIMD to default state for kernel and signal contexts Jiang Liu
2013-09-27 11:35   ` Catalin Marinas
2013-09-27 13:20     ` Jiang Liu
2013-09-27  8:04 ` [RFT PATCH v1 3/7] arm64: implement basic lazy save and restore for FPSIMD registers Jiang Liu
2013-09-27  8:04 ` [RFT PATCH v1 4/7] arm64: provide boot option "eagerfpu" to control FPSIMD restore policy Jiang Liu
2013-09-27  8:04 ` [RFT PATCH v1 5/7] arm64: reuse FPSIMD hardware context if possible Jiang Liu
2013-09-27  8:04 ` Jiang Liu [this message]
2013-09-27 10:59   ` [RFT PATCH v1 6/7] arm64: avoid saving and restoring FPSIMD registers until threads access them Will Deacon
2013-09-27 14:20     ` Jiang Liu
2013-09-30  9:34       ` Will Deacon
2013-09-27  8:04 ` [RFT PATCH v1 7/7] arm64: disable lazy load if FPSIMD registers are frequently used Jiang Liu
2013-09-27 10:50 ` [RFT PATCH v1 0/7] enable FPSIMD lazy save and restore for arm64 Catalin Marinas
2013-09-27 11:23   ` Will Deacon
2013-09-27 15:20     ` Jiang Liu
2013-09-27 16:16       ` Catalin Marinas

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=1380269087-8520-7-git-send-email-liuj97@gmail.com \
    --to=liuj97@gmail.com \
    --cc=linux-arm-kernel@lists.infradead.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).