aboutsummaryrefslogtreecommitdiff
path: root/target-arm/translate.c
diff options
context:
space:
mode:
authorPaul Brook <paul@codesourcery.com>2010-06-11 20:01:00 +0100
committerPaul Brook <paul@codesourcery.com>2010-06-11 20:37:51 +0100
commit41ba834146f1d8b9cbc09a9f25f5c6b84bf405d9 (patch)
treed6981379bb90fa2d23b452641226a96e66ee1d28 /target-arm/translate.c
parent0e2029a063405091ee34170ef71aa321715e4357 (diff)
downloadqemu-41ba834146f1d8b9cbc09a9f25f5c6b84bf405d9.zip
qemu-41ba834146f1d8b9cbc09a9f25f5c6b84bf405d9.tar.gz
qemu-41ba834146f1d8b9cbc09a9f25f5c6b84bf405d9.tar.bz2
NEON vldN optimization
When combining multiple values as part of a NEON array load, do explcit shift/or rather than using gen_bfi. This voids redundant mask operations. Signed-off-by: Paul Brook <paul@codesourcery.com>
Diffstat (limited to 'target-arm/translate.c')
-rw-r--r--target-arm/translate.c6
1 files changed, 4 insertions, 2 deletions
diff --git a/target-arm/translate.c b/target-arm/translate.c
index 0eccca5..a28e2ff 100644
--- a/target-arm/translate.c
+++ b/target-arm/translate.c
@@ -3854,7 +3854,8 @@ static int disas_neon_ls_insn(CPUState * env, DisasContext *s, uint32_t insn)
tcg_gen_addi_i32(addr, addr, stride);
tmp2 = gen_ld16u(addr, IS_USER(s));
tcg_gen_addi_i32(addr, addr, stride);
- gen_bfi(tmp, tmp, tmp2, 16, 0xffff);
+ tcg_gen_shli_i32(tmp2, tmp2, 16);
+ tcg_gen_or_i32(tmp, tmp, tmp2);
dead_tmp(tmp2);
neon_store_reg(rd, pass, tmp);
} else {
@@ -3875,7 +3876,8 @@ static int disas_neon_ls_insn(CPUState * env, DisasContext *s, uint32_t insn)
if (n == 0) {
tmp2 = tmp;
} else {
- gen_bfi(tmp2, tmp2, tmp, n * 8, 0xff);
+ tcg_gen_shli_i32(tmp, tmp, n * 8);
+ tcg_gen_or_i32(tmp2, tmp2, tmp);
dead_tmp(tmp);
}
}