[Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG

qemu-devel.nongnu.org archive mirror
 help / color / mirror / Atom feed

* [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
@ 2008-08-30 19:36 Shin-ichiro KAWASAKI
  2008-08-30 20:23 ` Blue Swirl
  0 siblings, 1 reply; 6+ messages in thread
From: Shin-ichiro KAWASAKI @ 2008-08-30 19:36 UTC (permalink / raw)
  To: qemu-devel

This patch converts two SH4 float instructions, 'fmov Rm,Rn' and
'fadd' into TCG.  Before converting other float instructions
into TCG, comments on it will be appreciated.

- TCG variables intorudced for float operation : FT[01], and DT[01].
- I think float registers 'fregs' are not to be mapped for
  TCG variables, because TCG does not support float operations, now.
  Instead of it, float register load/store function introduced.
  For 64 bit operation, they do 32 bit swap with temporary TCG vars.
  I hope that this won't result too much overhead.
- A comment is added to imply that SH-Linux does not run
  'fmov' in 64 bit .

Regards,
Shin-ichiro KAWASAKI


Index: trunk/target-sh4/op.c
===================================================================
--- trunk/target-sh4/op.c	(revision 5116)
+++ trunk/target-sh4/op.c	(working copy)
@@ -230,18 +230,6 @@
     RETURN();
 }
 
-void OPPROTO op_fadd_FT(void)
-{
-    FT0 = float32_add(FT0, FT1, &env->fp_status);
-    RETURN();
-}
-
-void OPPROTO op_fadd_DT(void)
-{
-    DT0 = float64_add(DT0, DT1, &env->fp_status);
-    RETURN();
-}
-
 void OPPROTO op_fsub_FT(void)
 {
     FT0 = float32_sub(FT0, FT1, &env->fp_status);
Index: trunk/target-sh4/helper.h
===================================================================
--- trunk/target-sh4/helper.h	(revision 5116)
+++ trunk/target-sh4/helper.h	(working copy)
@@ -16,3 +16,6 @@
 DEF_HELPER(uint32_t, helper_negc, (uint32_t))
 DEF_HELPER(void, helper_macl, (uint32_t, uint32_t))
 DEF_HELPER(void, helper_macw, (uint32_t, uint32_t))
+
+DEF_HELPER(uint32_t, helper_fadd_FT, (uint32_t, uint32_t, CPUState *))
+DEF_HELPER(uint64_t, helper_fadd_DT, (uint64_t, uint64_t, CPUState *))
Index: trunk/target-sh4/op_helper.c
===================================================================
--- trunk/target-sh4/op_helper.c	(revision 5116)
+++ trunk/target-sh4/op_helper.c	(working copy)
@@ -388,3 +388,15 @@
 	env->sr &= ~SR_T;
     *addr = new;
 }
+
+uint32_t helper_fadd_FT(uint32_t t0, uint32_t t1, CPUState * env)
+{
+    float32 ret = float32_add(*(float32*)&t0, *(float32*)&t1, &env->fp_status);
+    return *(uint32_t*)(&ret);
+}
+
+uint64_t helper_fadd_DT(uint64_t t0, uint64_t t1, CPUState * env)
+{
+    float64 ret = float64_add(*(float64*)&t0, *(float64*)&t1, &env->fp_status);
+    return *(uint64_t*)(&ret);
+}
Index: trunk/target-sh4/translate.c
===================================================================
--- trunk/target-sh4/translate.c	(revision 5116)
+++ trunk/target-sh4/translate.c	(working copy)
@@ -69,6 +69,8 @@
 
 /* dyngen register indexes */
 static TCGv cpu_T[2];
+static TCGv cpu_FT[2];
+static TCGv cpu_DT[2];
 
 #include "gen-icount.h"
 
@@ -90,6 +92,14 @@
     cpu_env = tcg_global_reg_new(TCG_TYPE_PTR, TCG_AREG0, "env");
     cpu_T[0] = tcg_global_reg_new(TCG_TYPE_I32, TCG_AREG1, "T0");
     cpu_T[1] = tcg_global_reg_new(TCG_TYPE_I32, TCG_AREG2, "T1");
+    cpu_FT[0] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
+				   offsetof(CPUState, ft0), "FT0");
+    cpu_FT[1] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
+				   offsetof(CPUState, ft1), "FT1");
+    cpu_DT[0] = tcg_global_mem_new(TCG_TYPE_I64, TCG_AREG0,
+				   offsetof(CPUState, dt0), "DT0");
+    cpu_DT[1] = tcg_global_mem_new(TCG_TYPE_I64, TCG_AREG0,
+				   offsetof(CPUState, dt1), "DT1");
 
     for (i = 0; i < 24; i++)
         cpu_gregs[i] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
@@ -345,6 +355,42 @@
     tcg_gen_ori_i32(cpu_flags, cpu_flags, flags);
 }
 
+static inline void gen_ld_frN(TCGv ft, TCGv cpu_env, uint32_t reg)
+{
+    tcg_gen_ld_i32(ft, cpu_env, offsetof(CPUState, fregs[reg]));
+}
+
+static inline void gen_ld_drN(TCGv dt, TCGv cpu_env, uint32_t reg)
+{
+    TCGv tmp = tcg_temp_new(TCG_TYPE_I64);
+	        
+    tcg_gen_ld_i64(dt, cpu_env, offsetof(CPUState, fregs[reg]));
+    tcg_gen_shli_i64(tmp, dt, 32);
+    tcg_gen_shri_i64(dt, dt, 32);
+    tcg_gen_or_i64(dt, tmp, dt);
+
+    tcg_temp_free(tmp);
+}
+
+static inline void gen_st_frN(TCGv ft, TCGv cpu_env, uint32_t reg)
+{
+    tcg_gen_st_i32(ft, cpu_env, offsetof(CPUState, fregs[reg]));
+}
+
+static inline void gen_st_drN(TCGv dt, TCGv cpu_env, uint32_t reg)
+{
+    TCGv tmp1 = tcg_temp_new(TCG_TYPE_I64);
+    TCGv tmp2 = tcg_temp_new(TCG_TYPE_I64);
+	        
+    tcg_gen_shli_i64(tmp1, dt, 32);
+    tcg_gen_shri_i64(tmp2, dt, 32);
+    tcg_gen_or_i64(tmp1, tmp1, tmp2);
+    tcg_gen_st_i64(tmp1, cpu_env, offsetof(CPUState, fregs[reg]));
+
+    tcg_temp_free(tmp1);
+    tcg_temp_free(tmp2);
+}
+
 #define B3_0 (ctx->opcode & 0xf)
 #define B6_4 ((ctx->opcode >> 4) & 0x7)
 #define B7_4 ((ctx->opcode >> 4) & 0xf)
@@ -811,12 +857,14 @@
 	tcg_gen_xor_i32(cpu_gregs[REG(B11_8)], cpu_gregs[REG(B11_8)], cpu_gregs[REG(B7_4)]);
 	return;
     case 0xf00c: /* fmov {F,D,X}Rm,{F,D,X}Rn - FPSCR: Nothing */
+        /* 64 bit fmov code is not tested, because SH-Linux seems
+	   not to set FPSCR_SZ flag true. */
 	if (ctx->fpscr & FPSCR_SZ) {
-	    gen_op_fmov_drN_DT0(XREG(B7_4));
-	    gen_op_fmov_DT0_drN(XREG(B11_8));
+	    gen_ld_drN(cpu_DT[0], cpu_env, XREG(B7_4));
+	    gen_st_drN(cpu_DT[1], cpu_env, XREG(B11_8));
 	} else {
-	    gen_op_fmov_frN_FT0(FREG(B7_4));
-	    gen_op_fmov_FT0_frN(FREG(B11_8));
+	    gen_ld_frN(cpu_FT[0], cpu_env, FREG(B7_4));
+	    gen_st_frN(cpu_FT[0], cpu_env, FREG(B11_8));
 	}
 	return;
     case 0xf00a: /* fmov {F,D,X}Rm,@Rn - FPSCR: Nothing */
@@ -905,17 +953,22 @@
 	if (ctx->fpscr & FPSCR_PR) {
 	    if (ctx->opcode & 0x0110)
 		break; /* illegal instruction */
-	    gen_op_fmov_drN_DT1(DREG(B7_4));
-	    gen_op_fmov_drN_DT0(DREG(B11_8));
+	    gen_ld_drN(cpu_DT[1], cpu_env, DREG(B7_4));
+	    gen_ld_drN(cpu_DT[0], cpu_env, DREG(B11_8));
 	}
 	else {
-	    gen_op_fmov_frN_FT1(FREG(B7_4));
-	    gen_op_fmov_frN_FT0(FREG(B11_8));
+	    gen_ld_frN(cpu_FT[1], cpu_env, FREG(B7_4));
+	    gen_ld_frN(cpu_FT[0], cpu_env, FREG(B11_8));
 	}
 
 	switch (ctx->opcode & 0xf00f) {
 	case 0xf000:		/* fadd Rm,Rn */
-	    ctx->fpscr & FPSCR_PR ? gen_op_fadd_DT() : gen_op_fadd_FT();
+	    if (ctx->fpscr & FPSCR_PR)
+	        tcg_gen_helper_1_3(helper_fadd_DT, cpu_DT[0],
+				   cpu_DT[0], cpu_DT[1], cpu_env);
+	    else
+	        tcg_gen_helper_1_3(helper_fadd_FT, cpu_FT[0],
+				   cpu_FT[0], cpu_FT[1], cpu_env);
 	    break;
 	case 0xf001:		/* fsub Rm,Rn */
 	    ctx->fpscr & FPSCR_PR ? gen_op_fsub_DT() : gen_op_fsub_FT();
@@ -935,10 +988,10 @@
 	}
 
 	if (ctx->fpscr & FPSCR_PR) {
-	    gen_op_fmov_DT0_drN(DREG(B11_8));
+	    gen_st_drN(cpu_DT[0], cpu_env, DREG(B11_8));
 	}
 	else {
-	    gen_op_fmov_FT0_frN(FREG(B11_8));
+	    gen_st_frN(cpu_FT[0], cpu_env, FREG(B11_8));
 	}
 	return;
     }

^ permalink raw reply	[flat|nested] 6+ messages in thread

* Re: [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
  2008-08-30 19:36 [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG Shin-ichiro KAWASAKI
@ 2008-08-30 20:23 ` Blue Swirl
  2008-08-31 17:28   ` Shin-ichiro KAWASAKI
  0 siblings, 1 reply; 6+ messages in thread
From: Blue Swirl @ 2008-08-30 20:23 UTC (permalink / raw)
  To: qemu-devel

On 8/30/08, Shin-ichiro KAWASAKI <kawasaki@juno.dti.ne.jp> wrote:
> This patch converts two SH4 float instructions, 'fmov Rm,Rn' and
>  'fadd' into TCG.  Before converting other float instructions
>  into TCG, comments on it will be appreciated.
>
>  - TCG variables intorudced for float operation : FT[01], and DT[01].
>  - I think float registers 'fregs' are not to be mapped for
>   TCG variables, because TCG does not support float operations, now.

In TCG README Fabrice mentioned that he's working on a floating point
version. It would be nice to get that committed, already m68k has a
fake version. I did not use TCG variables for float just because I've
been waiting for that. It's not possible to pass env->fp_status
cleanly now (for example to call softfloat functions directly). And
for example on Sparc host, moving data from integer registers to
floating point registers must use memory in between them so there the
integer TCG registers should be separate from float TCG registers.

>  +uint32_t helper_fadd_FT(uint32_t t0, uint32_t t1, CPUState * env)
>  +{
>  +    float32 ret = float32_add(*(float32*)&t0, *(float32*)&t1, &env->fp_status);
>  +    return *(uint32_t*)(&ret);
>  +}

There is no need to pass env as a parameter, it's available to
op_helper.c code anyway.

>  +static inline void gen_ld_frN(TCGv ft, TCGv cpu_env, uint32_t reg)
>  +{
>  +    tcg_gen_ld_i32(ft, cpu_env, offsetof(CPUState, fregs[reg]));
>  +}
>  +
>  +static inline void gen_ld_drN(TCGv dt, TCGv cpu_env, uint32_t reg)
>  +{
>  +    TCGv tmp = tcg_temp_new(TCG_TYPE_I64);
>  +
>  +    tcg_gen_ld_i64(dt, cpu_env, offsetof(CPUState, fregs[reg]));
>  +    tcg_gen_shli_i64(tmp, dt, 32);
>  +    tcg_gen_shri_i64(dt, dt, 32);
>  +    tcg_gen_or_i64(dt, tmp, dt);
>  +
>  +    tcg_temp_free(tmp);
>  +}

I guess that like in Sparc, two 32 bit fregs can be combined to a 64
bit double. Please have a look at target-sparc/translate.c on the use
of CPU_DoubleU, there should be a safer way to access the registers.

Otherwise, good work!

^ permalink raw reply	[flat|nested] 6+ messages in thread

* Re: [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
  2008-08-30 20:23 ` Blue Swirl
@ 2008-08-31 17:28   ` Shin-ichiro KAWASAKI
  2008-08-31 18:28     ` Blue Swirl
  2008-08-31 19:32     ` Aurelien Jarno
  0 siblings, 2 replies; 6+ messages in thread
From: Shin-ichiro KAWASAKI @ 2008-08-31 17:28 UTC (permalink / raw)
  To: qemu-devel

Thank your for comments, Blue Swirl!
The new patch is shown at the end of this mail.
Reviews are welcome, again.

Blue Swirl wrote:
> > On 8/30/08, Shin-ichiro KAWASAKI <kawasaki@juno.dti.ne.jp> wrote:
>> >> This patch converts two SH4 float instructions, 'fmov Rm,Rn' and
>> >>  'fadd' into TCG.  Before converting other float instructions
>> >>  into TCG, comments on it will be appreciated.
>> >>
>> >>  - TCG variables intorudced for float operation : FT[01], and DT[01].
>> >>  - I think float registers 'fregs' are not to be mapped for
>> >>   TCG variables, because TCG does not support float operations, now.
> >
> > In TCG README Fabrice mentioned that he's working on a floating point
> > version. It would be nice to get that committed, already m68k has a
> > fake version. I did not use TCG variables for float just because I've
> > been waiting for that. It's not possible to pass env->fp_status
> > cleanly now (for example to call softfloat functions directly). And
> > for example on Sparc host, moving data from integer registers to
> > floating point registers must use memory in between them so there the
> > integer TCG registers should be separate from float TCG registers.

I agree that it is important to conisder mapping fregs ot TCG feature
like m68k implementation does. But I think this work will take too long
time, if I do it, and it will be some break for converting TCG work.
I think it is not too late to do this work after eliminating 'op.c'.

And I have a question on it.
As you pointed out below, two 32 bit registers are concatanated as one
64 bit register.  When floating point TCG variables introduced in the future,
it is straight to map one memory region for 32bit TCG variable and 64bit
TCG variable.  I wonder such two way mapping suit for TCG, or not.

> > There is no need to pass env as a parameter, it's available to
> > op_helper.c code anyway.

Indeed. Thanks!

> > I guess that like in Sparc, two 32 bit fregs can be combined to a 64
> > bit double. Please have a look at target-sparc/translate.c on the use
> > of CPU_DoubleU, there should be a safer way to access the registers.

Thanks. I wrote new codes for load/store function, following sparc.

Regards,
Shin-ichiro KAWASAKI


Index: trunk/target-sh4/op.c
===================================================================
--- trunk/target-sh4/op.c	(revision 5119)
+++ trunk/target-sh4/op.c	(working copy)
@@ -163,18 +163,6 @@
     RETURN();
 }
 
-void OPPROTO op_fadd_FT(void)
-{
-    FT0 = float32_add(FT0, FT1, &env->fp_status);
-    RETURN();
-}
-
-void OPPROTO op_fadd_DT(void)
-{
-    DT0 = float64_add(DT0, DT1, &env->fp_status);
-    RETURN();
-}
-
 void OPPROTO op_fsub_FT(void)
 {
     FT0 = float32_sub(FT0, FT1, &env->fp_status);
Index: trunk/target-sh4/helper.h
===================================================================
--- trunk/target-sh4/helper.h	(revision 5119)
+++ trunk/target-sh4/helper.h	(working copy)
@@ -18,3 +18,6 @@
 DEF_HELPER(void, helper_macw, (uint32_t, uint32_t))
 
 DEF_HELPER(void, helper_ld_fpscr, (uint32_t))
+DEF_HELPER(uint32_t, helper_fadd_FT, (uint32_t, uint32_t))
+DEF_HELPER(uint64_t, helper_fadd_DT, (uint64_t, uint64_t))
+
Index: trunk/target-sh4/op_helper.c
===================================================================
--- trunk/target-sh4/op_helper.c	(revision 5119)
+++ trunk/target-sh4/op_helper.c	(working copy)
@@ -397,3 +397,16 @@
     else
 	set_float_rounding_mode(float_round_nearest_even, &env->fp_status);
 }
+
+uint32_t helper_fadd_FT(uint32_t t0, uint32_t t1)
+{
+    float32 ret = float32_add(*(float32*)&t0, *(float32*)&t1, &env->fp_status);
+    return *(uint32_t*)(&ret);
+}
+
+uint64_t helper_fadd_DT(uint64_t t0, uint64_t t1)
+{
+    float64 ret = float64_add(*(float64*)&t0, *(float64*)&t1, &env->fp_status);
+    return *(uint64_t*)(&ret);
+}
+
Index: trunk/target-sh4/translate.c
===================================================================
--- trunk/target-sh4/translate.c	(revision 5119)
+++ trunk/target-sh4/translate.c	(working copy)
@@ -69,6 +69,8 @@
 
 /* dyngen register indexes */
 static TCGv cpu_T[2];
+static TCGv cpu_FT[2];
+static TCGv cpu_DT[2];
 
 #include "gen-icount.h"
 
@@ -90,6 +92,15 @@
     cpu_env = tcg_global_reg_new(TCG_TYPE_PTR, TCG_AREG0, "env");
     cpu_T[0] = tcg_global_reg_new(TCG_TYPE_I32, TCG_AREG1, "T0");
     cpu_T[1] = tcg_global_reg_new(TCG_TYPE_I32, TCG_AREG2, "T1");
+    cpu_FT[0] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
+				   offsetof(CPUState, ft0), "FT0");
+    cpu_FT[1] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
+				   offsetof(CPUState, ft1), "FT1");
+    cpu_DT[0] = tcg_global_mem_new(TCG_TYPE_I64, TCG_AREG0,
+				   offsetof(CPUState, dt0), "DT0");
+    printf("initial offset : %d\n", offsetof(CPUState, dt0));
+    cpu_DT[1] = tcg_global_mem_new(TCG_TYPE_I64, TCG_AREG0,
+				   offsetof(CPUState, dt1), "DT1");
 
     for (i = 0; i < 24; i++)
         cpu_gregs[i] = tcg_global_mem_new(TCG_TYPE_I32, TCG_AREG0,
@@ -337,6 +348,62 @@
     tcg_gen_ori_i32(cpu_flags, cpu_flags, flags);
 }
 
+
+#define DEF_gen_ld_frN_FTx(FTindex)                                           \
+static inline void gen_ld_frN_FT##FTindex(TCGv cpu_env, uint32_t reg)         \
+{                                                                             \
+    tcg_gen_ld_i32(cpu_FT[FTindex], cpu_env, offsetof(CPUState, fregs[reg])); \
+}
+
+DEF_gen_ld_frN_FTx(0)
+DEF_gen_ld_frN_FTx(1)
+
+#define DEF_gen_ld_drN_DTx(DTindex)                                           \
+static inline void gen_ld_drN_DT##DTindex(TCGv cpu_env, uint32_t reg)         \
+{                                                                             \
+    TCGv tmp = tcg_temp_new(TCG_TYPE_I32);                                    \
+    uint32_t offset = offsetof(CPUState, dt##DTindex);                        \
+                                                                              \
+    tcg_gen_ld_i32(tmp, cpu_env, offsetof(CPUState, fregs[reg]));             \
+    tcg_gen_st_i32(tmp, cpu_env, offset + offsetof(CPU_DoubleU, l.upper));    \
+    tcg_gen_ld_i32(tmp, cpu_env, offsetof(CPUState, fregs[reg + 1]));         \
+    tcg_gen_st_i32(tmp, cpu_env, offset + offsetof(CPU_DoubleU, l.lower));    \
+                                                                              \
+    tcg_temp_free(tmp);                                                       \
+}
+
+DEF_gen_ld_drN_DTx(0)
+DEF_gen_ld_drN_DTx(1)
+
+#define DEF_gen_st_FTx_frN(FTindex)                                           \
+static inline void gen_st_FT##FTindex##_frN(TCGv cpu_env, uint32_t reg)       \
+{                                                                             \
+    tcg_gen_st_i32(cpu_FT[FTindex], cpu_env, offsetof(CPUState, fregs[reg])); \
+}
+
+DEF_gen_st_FTx_frN(0)
+DEF_gen_st_FTx_frN(1)
+
+#define DEF_gen_st_DTx_drN(DTindex)                                           \
+static inline void gen_st_DT##DTindex##_drN(TCGv cpu_env, uint32_t reg)       \
+{                                                                             \
+    TCGv tmp = tcg_temp_new(TCG_TYPE_I32);                                    \
+    uint32_t offset = offsetof(CPUState, dt##DTindex);                        \
+                                                                              \
+    tcg_gen_st_i64(cpu_DT[DTindex], cpu_env, offset); /* keep DTx alive. */   \
+                                                                              \
+    tcg_gen_ld_i32(tmp, cpu_env, offset + offsetof(CPU_DoubleU, l.upper));    \
+    tcg_gen_st_i32(tmp, cpu_env, offsetof(CPUState, fregs[reg]));             \
+    tcg_gen_ld_i32(tmp, cpu_env, offset + offsetof(CPU_DoubleU, l.lower));    \
+    tcg_gen_st_i32(tmp, cpu_env, offsetof(CPUState, fregs[reg + 1]));         \
+                                                                              \
+    tcg_temp_free(tmp);                                                       \
+}
+
+DEF_gen_st_DTx_drN(0)
+DEF_gen_st_DTx_drN(1)
+
+
 #define B3_0 (ctx->opcode & 0xf)
 #define B6_4 ((ctx->opcode >> 4) & 0x7)
 #define B7_4 ((ctx->opcode >> 4) & 0xf)
@@ -788,12 +855,14 @@
 	tcg_gen_xor_i32(cpu_gregs[REG(B11_8)], cpu_gregs[REG(B11_8)], cpu_gregs[REG(B7_4)]);
 	return;
     case 0xf00c: /* fmov {F,D,X}Rm,{F,D,X}Rn - FPSCR: Nothing */
+        /* 64 bit fmov code is not tested, because SH-Linux seems
+	   not to set FPSCR_SZ flag true. */
 	if (ctx->fpscr & FPSCR_SZ) {
-	    gen_op_fmov_drN_DT0(XREG(B7_4));
-	    gen_op_fmov_DT0_drN(XREG(B11_8));
+	    gen_ld_drN_DT0(cpu_env, XREG(B7_4));
+	    gen_st_DT0_drN(cpu_env, XREG(B11_8));
 	} else {
-	    gen_op_fmov_frN_FT0(FREG(B7_4));
-	    gen_op_fmov_FT0_frN(FREG(B11_8));
+	    gen_ld_frN_FT0(cpu_env, FREG(B7_4));
+	    gen_st_FT0_frN(cpu_env, FREG(B11_8));
 	}
 	return;
     case 0xf00a: /* fmov {F,D,X}Rm,@Rn - FPSCR: Nothing */
@@ -882,17 +951,22 @@
 	if (ctx->fpscr & FPSCR_PR) {
 	    if (ctx->opcode & 0x0110)
 		break; /* illegal instruction */
-	    gen_op_fmov_drN_DT1(DREG(B7_4));
-	    gen_op_fmov_drN_DT0(DREG(B11_8));
+	    gen_ld_drN_DT1(cpu_env, DREG(B7_4));
+	    gen_ld_drN_DT0(cpu_env, DREG(B11_8));
 	}
 	else {
-	    gen_op_fmov_frN_FT1(FREG(B7_4));
-	    gen_op_fmov_frN_FT0(FREG(B11_8));
+	    gen_ld_frN_FT1(cpu_env, FREG(B7_4));
+	    gen_ld_frN_FT0(cpu_env, FREG(B11_8));
 	}
 
 	switch (ctx->opcode & 0xf00f) {
 	case 0xf000:		/* fadd Rm,Rn */
-	    ctx->fpscr & FPSCR_PR ? gen_op_fadd_DT() : gen_op_fadd_FT();
+	    if (ctx->fpscr & FPSCR_PR)
+	        tcg_gen_helper_1_2(helper_fadd_DT, cpu_DT[0],
+				   cpu_DT[0], cpu_DT[1]);
+	    else
+	        tcg_gen_helper_1_2(helper_fadd_FT, cpu_FT[0],
+				   cpu_FT[0], cpu_FT[1]);
 	    break;
 	case 0xf001:		/* fsub Rm,Rn */
 	    ctx->fpscr & FPSCR_PR ? gen_op_fsub_DT() : gen_op_fsub_FT();
@@ -912,10 +986,10 @@
 	}
 
 	if (ctx->fpscr & FPSCR_PR) {
-	    gen_op_fmov_DT0_drN(DREG(B11_8));
+	    gen_st_DT0_drN(cpu_env, DREG(B11_8));
 	}
 	else {
-	    gen_op_fmov_FT0_frN(FREG(B11_8));
+	    gen_st_FT0_frN(cpu_env, FREG(B11_8));
 	}
 	return;
     }

^ permalink raw reply	[flat|nested] 6+ messages in thread

* Re: [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
  2008-08-31 17:28   ` Shin-ichiro KAWASAKI
@ 2008-08-31 18:28     ` Blue Swirl
  2008-08-31 19:32     ` Aurelien Jarno
  1 sibling, 0 replies; 6+ messages in thread
From: Blue Swirl @ 2008-08-31 18:28 UTC (permalink / raw)
  To: qemu-devel

On 8/31/08, Shin-ichiro KAWASAKI <kawasaki@juno.dti.ne.jp> wrote:
> Thank your for comments, Blue Swirl!
>  The new patch is shown at the end of this mail.
>  Reviews are welcome, again.
>
>  Blue Swirl wrote:
>
> > > On 8/30/08, Shin-ichiro KAWASAKI <kawasaki@juno.dti.ne.jp> wrote:
> >
> > > >> This patch converts two SH4 float instructions, 'fmov Rm,Rn' and
> > > >>  'fadd' into TCG.  Before converting other float instructions
> > > >>  into TCG, comments on it will be appreciated.
> > > >>
> > > >>  - TCG variables intorudced for float operation : FT[01], and DT[01].
> > > >>  - I think float registers 'fregs' are not to be mapped for
> > > >>   TCG variables, because TCG does not support float operations, now.
> > >
> > >
> > > In TCG README Fabrice mentioned that he's working on a floating point
> > > version. It would be nice to get that committed, already m68k has a
> > > fake version. I did not use TCG variables for float just because I've
> > > been waiting for that. It's not possible to pass env->fp_status
> > > cleanly now (for example to call softfloat functions directly). And
> > > for example on Sparc host, moving data from integer registers to
> > > floating point registers must use memory in between them so there the
> > > integer TCG registers should be separate from float TCG registers.
> >
>
>  I agree that it is important to conisder mapping fregs ot TCG feature
>  like m68k implementation does. But I think this work will take too long
>  time, if I do it, and it will be some break for converting TCG work.
>  I think it is not too late to do this work after eliminating 'op.c'.

That's a valid approach, of course.

>  And I have a question on it.
>  As you pointed out below, two 32 bit registers are concatanated as one
>  64 bit register.  When floating point TCG variables introduced in the
> future,
>  it is straight to map one memory region for 32bit TCG variable and 64bit
>  TCG variable.  I wonder such two way mapping suit for TCG, or not.

I think it depends how well TCG can detect aliased variables. As i386
does not use TCG variables for AL, AX and EAX, I guess that it can't.
This is of course just speculation.

> > > There is no need to pass env as a parameter, it's available to
> > > op_helper.c code anyway.
> >
>
>  Indeed. Thanks!
>
>
> > > I guess that like in Sparc, two 32 bit fregs can be combined to a 64
> > > bit double. Please have a look at target-sparc/translate.c on the use
> > > of CPU_DoubleU, there should be a safer way to access the registers.
> >
>
>  Thanks. I wrote new codes for load/store function, following sparc.

Looks good, except this small thing below:
>  +    printf("initial offset : %d\n", offsetof(CPUState, dt0));

^ permalink raw reply	[flat|nested] 6+ messages in thread

* Re: [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
  2008-08-31 17:28   ` Shin-ichiro KAWASAKI
  2008-08-31 18:28     ` Blue Swirl
@ 2008-08-31 19:32     ` Aurelien Jarno
  2008-09-01 22:11       ` Aurelien Jarno
  1 sibling, 1 reply; 6+ messages in thread
From: Aurelien Jarno @ 2008-08-31 19:32 UTC (permalink / raw)
  To: Shin-ichiro KAWASAKI; +Cc: qemu-devel

On Mon, Sep 01, 2008 at 02:28:59AM +0900, Shin-ichiro KAWASAKI wrote:
> Thank your for comments, Blue Swirl!
> The new patch is shown at the end of this mail.
> Reviews are welcome, again.
>

Thanks for you patch. It looks good, but it doesn't work here (on an
amd64 host): while the kernel is booting correctly with qemu-system-sh4,
running /usr/bin/cal with qemu-sh4 causes a segfault.

-- 
  .''`.  Aurelien Jarno	            | GPG: 1024D/F1BCDB73
 : :' :  Debian developer           | Electrical Engineer
 `. `'   aurel32@debian.org         | aurelien@aurel32.net
   `-    people.debian.org/~aurel32 | www.aurel32.net

^ permalink raw reply	[flat|nested] 6+ messages in thread

* Re: [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG
  2008-08-31 19:32     ` Aurelien Jarno
@ 2008-09-01 22:11       ` Aurelien Jarno
  0 siblings, 0 replies; 6+ messages in thread
From: Aurelien Jarno @ 2008-09-01 22:11 UTC (permalink / raw)
  To: qemu-devel; +Cc: Shin-ichiro KAWASAKI

On Sun, Aug 31, 2008 at 09:32:03PM +0200, Aurelien Jarno wrote:
> On Mon, Sep 01, 2008 at 02:28:59AM +0900, Shin-ichiro KAWASAKI wrote:
> > Thank your for comments, Blue Swirl!
> > The new patch is shown at the end of this mail.
> > Reviews are welcome, again.
> >
> 
> Thanks for you patch. It looks good, but it doesn't work here (on an
> amd64 host): while the kernel is booting correctly with qemu-system-sh4,
> running /usr/bin/cal with qemu-sh4 causes a segfault.
> 

I have finally found the problem: the gen_ld_frN_FT and gen_st_frN_FT
already have access to cpu_env, this value does not needed to be passed
again. Passing it as a TCGv variable caused it to be truncated.

At the end, looking at what other targets do, I have decided to convert
the SH4 floating point ops the "MIPS way", which has the advantage of
only using TCG temp instead of global FT0, FT1, DT0 and DT1 variables.

I have committed that to the SVN, so the SH4 target is now fully
converted to TCG. I have tested my changes using /usr/bin/awk with
sh4-linux-user doing FP computations.

In the next days/weeks, I'll try to convert the alpha target to TCG, as
I need some more experience with TCG before doing the PowerPC one. I
have seen that Tristan already send patches about that, I'll have a look
later.

-- 
  .''`.  Aurelien Jarno	            | GPG: 1024D/F1BCDB73
 : :' :  Debian developer           | Electrical Engineer
 `. `'   aurel32@debian.org         | aurelien@aurel32.net
   `-    people.debian.org/~aurel32 | www.aurel32.net

^ permalink raw reply	[flat|nested] 6+ messages in thread

end of thread, other threads:[~2008-09-01 22:12 UTC | newest]

Thread overview: 6+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2008-08-30 19:36 [Qemu-devel] [PATCH] SH4: convert fmov/fadd to TCG Shin-ichiro KAWASAKI
2008-08-30 20:23 ` Blue Swirl
2008-08-31 17:28   ` Shin-ichiro KAWASAKI
2008-08-31 18:28     ` Blue Swirl
2008-08-31 19:32     ` Aurelien Jarno
2008-09-01 22:11       ` Aurelien Jarno

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).