diff mbox series

[2/2] target/arm: Fix do_predset for large VL

Message ID 20180705191929.30773-3-richard.henderson@linaro.org
State Superseded
Headers show
Series target/arm: SVE fixes | expand

Commit Message

Richard Henderson July 5, 2018, 7:19 p.m. UTC
Use MAKE_64BIT_MASK instead of open-coding the mask.  Remove an odd
vector size check that is unlikely to be more profitable
than 3 64-bit integer stores.  Correct the iteration for WORD
so that the loop stores only whole 64-bit words, to avoid writing
too much data.

Fixes RISU tests of PTRUE for VL 256.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>

---
 target/arm/translate-sve.c | 10 ++--------
 1 file changed, 2 insertions(+), 8 deletions(-)

-- 
2.17.1

Comments

Alex Bennée July 6, 2018, 8:14 a.m. UTC | #1
Richard Henderson <richard.henderson@linaro.org> writes:

> Use MAKE_64BIT_MASK instead of open-coding.  Remove an odd

> vector size check that is unlikely to be more profitable

> than 3 64-bit integer stores.  Correct the iteration for WORD

> to avoid writing too much data.

>

> Fixes RISU tests of PTRUE for VL 256.

>

> Signed-off-by: Richard Henderson <richard.henderson@linaro.org>


Reviewed-by: Alex Bennée <alex.bennee@linaro.org>

Tested-by: Alex Bennée <alex.bennee@linaro.org>


> ---

>  target/arm/translate-sve.c | 10 ++--------

>  1 file changed, 2 insertions(+), 8 deletions(-)

>

> diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c

> index d41f1155f9..374051cd20 100644

> --- a/target/arm/translate-sve.c

> +++ b/target/arm/translate-sve.c

> @@ -1438,7 +1438,7 @@ static bool do_predset(DisasContext *s, int esz, int rd, int pat, bool setflag)

>          setsz = numelem << esz;

>          lastword = word = pred_esz_masks[esz];

>          if (setsz % 64) {

> -            lastword &= ~(-1ull << (setsz % 64));

> +            lastword &= MAKE_64BIT_MASK(0, setsz % 64);

>          }

>      }

>

> @@ -1457,19 +1457,13 @@ static bool do_predset(DisasContext *s, int esz, int rd, int pat, bool setflag)

>              tcg_gen_gvec_dup64i(ofs, oprsz, maxsz, word);

>              goto done;

>          }

> -        if (oprsz * 8 == setsz + 8) {

> -            tcg_gen_gvec_dup64i(ofs, oprsz, maxsz, word);

> -            tcg_gen_movi_i64(t, 0);

> -            tcg_gen_st_i64(t, cpu_env, ofs + oprsz - 8);

> -            goto done;

> -        }

>      }

>

>      setsz /= 8;

>      fullsz /= 8;

>

>      tcg_gen_movi_i64(t, word);

> -    for (i = 0; i < setsz; i += 8) {

> +    for (i = 0; i < QEMU_ALIGN_DOWN(setsz, 8); i += 8) {

>          tcg_gen_st_i64(t, cpu_env, ofs + i);

>      }

>      if (lastword != word) {



--
Alex Bennée
diff mbox series

Patch

diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c
index d41f1155f9..374051cd20 100644
--- a/target/arm/translate-sve.c
+++ b/target/arm/translate-sve.c
@@ -1438,7 +1438,7 @@  static bool do_predset(DisasContext *s, int esz, int rd, int pat, bool setflag)
         setsz = numelem << esz;
         lastword = word = pred_esz_masks[esz];
         if (setsz % 64) {
-            lastword &= ~(-1ull << (setsz % 64));
+            lastword &= MAKE_64BIT_MASK(0, setsz % 64);
         }
     }
 
@@ -1457,19 +1457,13 @@  static bool do_predset(DisasContext *s, int esz, int rd, int pat, bool setflag)
             tcg_gen_gvec_dup64i(ofs, oprsz, maxsz, word);
             goto done;
         }
-        if (oprsz * 8 == setsz + 8) {
-            tcg_gen_gvec_dup64i(ofs, oprsz, maxsz, word);
-            tcg_gen_movi_i64(t, 0);
-            tcg_gen_st_i64(t, cpu_env, ofs + oprsz - 8);
-            goto done;
-        }
     }
 
     setsz /= 8;
     fullsz /= 8;
 
     tcg_gen_movi_i64(t, word);
-    for (i = 0; i < setsz; i += 8) {
+    for (i = 0; i < QEMU_ALIGN_DOWN(setsz, 8); i += 8) {
         tcg_gen_st_i64(t, cpu_env, ofs + i);
     }
     if (lastword != word) {