From: Richard Henderson <richard.henderson@linaro.org>
To: qemu-devel@nongnu.org
Cc: WANG Xuerui <git@xen0n.name>
Subject: [PULL 15/31] tcg/loongarch64: Implement clz/ctz ops
Date: Tue, 21 Dec 2021 08:47:21 -0800 [thread overview]
Message-ID: <20211221164737.1076007-16-richard.henderson@linaro.org> (raw)
In-Reply-To: <20211221164737.1076007-1-richard.henderson@linaro.org>
From: WANG Xuerui <git@xen0n.name>
Signed-off-by: WANG Xuerui <git@xen0n.name>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20211221054105.178795-16-git@xen0n.name>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/loongarch64/tcg-target-con-set.h | 1 +
tcg/loongarch64/tcg-target.h | 8 +++---
tcg/loongarch64/tcg-target.c.inc | 42 ++++++++++++++++++++++++++++
3 files changed, 47 insertions(+), 4 deletions(-)
diff --git a/tcg/loongarch64/tcg-target-con-set.h b/tcg/loongarch64/tcg-target-con-set.h
index d958183020..2975e03127 100644
--- a/tcg/loongarch64/tcg-target-con-set.h
+++ b/tcg/loongarch64/tcg-target-con-set.h
@@ -18,4 +18,5 @@ C_O0_I1(r)
C_O1_I1(r, r)
C_O1_I2(r, r, rC)
C_O1_I2(r, r, rU)
+C_O1_I2(r, r, rW)
C_O1_I2(r, 0, rZ)
diff --git a/tcg/loongarch64/tcg-target.h b/tcg/loongarch64/tcg-target.h
index 5303001653..2fd2745b63 100644
--- a/tcg/loongarch64/tcg-target.h
+++ b/tcg/loongarch64/tcg-target.h
@@ -120,8 +120,8 @@ typedef enum {
#define TCG_TARGET_HAS_eqv_i32 0
#define TCG_TARGET_HAS_nand_i32 0
#define TCG_TARGET_HAS_nor_i32 1
-#define TCG_TARGET_HAS_clz_i32 0
-#define TCG_TARGET_HAS_ctz_i32 0
+#define TCG_TARGET_HAS_clz_i32 1
+#define TCG_TARGET_HAS_ctz_i32 1
#define TCG_TARGET_HAS_ctpop_i32 0
#define TCG_TARGET_HAS_direct_jump 0
#define TCG_TARGET_HAS_brcond2 0
@@ -156,8 +156,8 @@ typedef enum {
#define TCG_TARGET_HAS_eqv_i64 0
#define TCG_TARGET_HAS_nand_i64 0
#define TCG_TARGET_HAS_nor_i64 1
-#define TCG_TARGET_HAS_clz_i64 0
-#define TCG_TARGET_HAS_ctz_i64 0
+#define TCG_TARGET_HAS_clz_i64 1
+#define TCG_TARGET_HAS_ctz_i64 1
#define TCG_TARGET_HAS_ctpop_i64 0
#define TCG_TARGET_HAS_add2_i64 0
#define TCG_TARGET_HAS_sub2_i64 0
diff --git a/tcg/loongarch64/tcg-target.c.inc b/tcg/loongarch64/tcg-target.c.inc
index 3b056dd358..39df2885b5 100644
--- a/tcg/loongarch64/tcg-target.c.inc
+++ b/tcg/loongarch64/tcg-target.c.inc
@@ -412,6 +412,28 @@ static void tcg_out_ext32s(TCGContext *s, TCGReg ret, TCGReg arg)
tcg_out_opc_addi_w(s, ret, arg, 0);
}
+/*
+ * Emit a count-leading-zeros / count-trailing-zeros operation.
+ *
+ * a0 receives the result of insn @opc applied to a1, except that when a1
+ * is zero a0 receives the fallback value a2 instead.
+ *
+ * @c2 selects the constant-fallback form: a2 is then asserted to equal the
+ * operand width (32 when @is_32bit, otherwise 64).  Otherwise a2 is used
+ * as a register operand.
+ */
+static void tcg_out_clzctz(TCGContext *s, LoongArchInsn opc,
+                           TCGReg a0, TCGReg a1, TCGReg a2,
+                           bool c2, bool is_32bit)
+{
+    if (!c2) {
+        const TCGReg tmp = TCG_REG_TMP0;
+
+        /* General case: count into a scratch register first ... */
+        tcg_out32(s, encode_dj_insn(opc, tmp, a1));
+        /* ... then select on a1:  a0 = a1 ? tmp : a2 */
+        tcg_out_opc_maskeqz(s, tmp, tmp, a1);
+        tcg_out_opc_masknez(s, a0, a2, a1);
+        tcg_out_opc_or(s, a0, tmp, a0);
+        return;
+    }
+
+    /*
+     * Constant fallback: the operand constraint together with the insn's
+     * own behavior already yields the required semantics, so a single
+     * instruction suffices.  Every clz/ctz insn uses the DJ format.
+     */
+    tcg_debug_assert(a2 == (is_32bit ? 32 : 64));
+    tcg_out32(s, encode_dj_insn(opc, a0, a1));
+}
+
/*
* Entry-points
*/
@@ -572,6 +594,20 @@ static void tcg_out_op(TCGContext *s, TCGOpcode opc,
tcg_out_opc_revb_d(s, a0, a1);
break;
+ case INDEX_op_clz_i32:
+ tcg_out_clzctz(s, OPC_CLZ_W, a0, a1, a2, c2, true);
+ break;
+ case INDEX_op_clz_i64:
+ tcg_out_clzctz(s, OPC_CLZ_D, a0, a1, a2, c2, false);
+ break;
+
+ case INDEX_op_ctz_i32:
+ tcg_out_clzctz(s, OPC_CTZ_W, a0, a1, a2, c2, true);
+ break;
+ case INDEX_op_ctz_i64:
+ tcg_out_clzctz(s, OPC_CTZ_D, a0, a1, a2, c2, false);
+ break;
+
case INDEX_op_mov_i32: /* Always emitted via tcg_out_mov. */
case INDEX_op_mov_i64:
default:
@@ -632,6 +668,12 @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
/* LoongArch reg-imm bitops have their imms ZERO-extended */
return C_O1_I2(r, r, rU);
+ case INDEX_op_clz_i32:
+ case INDEX_op_clz_i64:
+ case INDEX_op_ctz_i32:
+ case INDEX_op_ctz_i64:
+ return C_O1_I2(r, r, rW);
+
case INDEX_op_deposit_i32:
case INDEX_op_deposit_i64:
/* Must deposit into the same register as input */
--
2.25.1
next prev parent reply other threads:[~2021-12-21 17:00 UTC|newest]
Thread overview: 32+ messages / expand[flat|nested] mbox.gz Atom feed top
2021-12-21 16:47 [PULL 00/31] tcg/loongarch64: New tcg backend Richard Henderson
2021-12-21 16:47 ` [PULL 01/31] elf: Add machine type value for LoongArch Richard Henderson
2021-12-21 16:47 ` [PULL 02/31] MAINTAINERS: Add tcg/loongarch64 entry with myself as maintainer Richard Henderson
2021-12-21 16:47 ` [PULL 03/31] tcg/loongarch64: Add the tcg-target.h file Richard Henderson
2021-12-21 16:47 ` [PULL 04/31] tcg/loongarch64: Add generated instruction opcodes and encoding helpers Richard Henderson
2021-12-21 16:47 ` [PULL 05/31] tcg/loongarch64: Add register names, allocation order and input/output sets Richard Henderson
2021-12-21 16:47 ` [PULL 06/31] tcg/loongarch64: Define the operand constraints Richard Henderson
2021-12-21 16:47 ` [PULL 07/31] tcg/loongarch64: Implement necessary relocation operations Richard Henderson
2021-12-21 16:47 ` [PULL 08/31] tcg/loongarch64: Implement the memory barrier op Richard Henderson
2021-12-21 16:47 ` [PULL 09/31] tcg/loongarch64: Implement tcg_out_mov and tcg_out_movi Richard Henderson
2021-12-21 16:47 ` [PULL 10/31] tcg/loongarch64: Implement goto_ptr Richard Henderson
2021-12-21 16:47 ` [PULL 11/31] tcg/loongarch64: Implement sign-/zero-extension ops Richard Henderson
2021-12-21 16:47 ` [PULL 12/31] tcg/loongarch64: Implement not/and/or/xor/nor/andc/orc ops Richard Henderson
2021-12-21 16:47 ` [PULL 13/31] tcg/loongarch64: Implement deposit/extract ops Richard Henderson
2021-12-21 16:47 ` [PULL 14/31] tcg/loongarch64: Implement bswap{16,32,64} ops Richard Henderson
2021-12-21 16:47 ` Richard Henderson [this message]
2021-12-21 16:47 ` [PULL 16/31] tcg/loongarch64: Implement shl/shr/sar/rotl/rotr ops Richard Henderson
2021-12-21 16:47 ` [PULL 17/31] tcg/loongarch64: Implement add/sub ops Richard Henderson
2021-12-21 16:47 ` [PULL 18/31] tcg/loongarch64: Implement mul/mulsh/muluh/div/divu/rem/remu ops Richard Henderson
2021-12-21 16:47 ` [PULL 19/31] tcg/loongarch64: Implement br/brcond ops Richard Henderson
2021-12-21 16:47 ` [PULL 20/31] tcg/loongarch64: Implement setcond ops Richard Henderson
2021-12-21 16:47 ` [PULL 21/31] tcg/loongarch64: Implement tcg_out_call Richard Henderson
2021-12-21 16:47 ` [PULL 22/31] tcg/loongarch64: Implement simple load/store ops Richard Henderson
2021-12-21 16:47 ` [PULL 23/31] tcg/loongarch64: Add softmmu load/store helpers, implement qemu_ld/qemu_st ops Richard Henderson
2021-12-21 16:47 ` [PULL 24/31] tcg/loongarch64: Implement tcg_target_qemu_prologue Richard Henderson
2021-12-21 16:47 ` [PULL 25/31] tcg/loongarch64: Implement exit_tb/goto_tb Richard Henderson
2021-12-21 16:47 ` [PULL 26/31] tcg/loongarch64: Implement tcg_target_init Richard Henderson
2021-12-21 16:47 ` [PULL 27/31] tcg/loongarch64: Register the JIT Richard Henderson
2021-12-21 16:47 ` [PULL 28/31] common-user: Add safe syscall handling for loongarch64 hosts Richard Henderson
2021-12-21 16:47 ` [PULL 29/31] linux-user: Implement CPU-specific signal handler " Richard Henderson
2021-12-21 16:47 ` [PULL 30/31] configure, meson.build: Mark support " Richard Henderson
2021-12-21 16:47 ` [PULL 31/31] tests/docker: Add gentoo-loongarch64-cross image and run cross builds in GitLab Richard Henderson
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20211221164737.1076007-16-richard.henderson@linaro.org \
--to=richard.henderson@linaro.org \
--cc=git@xen0n.name \
--cc=qemu-devel@nongnu.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).