Commit 23b5d936 authored by Ng Zhi An's avatar Ng Zhi An Committed by Commit Bot

[wasm-simd] No need to mask immediates for i8x16.shuffle

The immediates would have been checked by the validation, so we can skip
masking them.

Bug: v8:10696
Change-Id: I18e4746b1eb08a2436311a633341be0c88f52139
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2453456
Commit-Queue: Zhi An Ng <zhin@chromium.org>
Reviewed-by: 's avatarBill Budge <bbudge@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70394}
parent b87db517
......@@ -3121,8 +3121,7 @@ CodeGenerator::CodeGenResult CodeGenerator::AssembleArchInstruction(
int scratch_s_base = scratch.code() * 4;
for (int j = 0; j < 4; j++) {
uint32_t four_lanes = i.InputUint32(2 + j);
// Ensure byte indices are in [0, 31] so masks are never NaNs.
four_lanes &= 0x1F1F1F1F;
DCHECK_EQ(0, four_lanes & (table_size == 2 ? 0xF0F0F0F0 : 0xE0E0E0E0));
__ vmov(SwVfpRegister::from_code(scratch_s_base + j),
Float32::FromBits(four_lanes));
}
......
......@@ -2560,17 +2560,15 @@ CodeGenerator::CodeGenResult CodeGenerator::AssembleArchInstruction(
src1 = i.InputSimd128Register(1).V16B();
// Unary shuffle table is in src0, binary shuffle table is in src0, src1,
// which must be consecutive.
uint32_t mask = 0;
if (src0 == src1) {
mask = 0x0F0F0F0F;
} else {
mask = 0x1F1F1F1F;
if (src0 != src1) {
DCHECK(AreConsecutive(src0, src1));
}
int64_t imm1 =
make_uint64(i.InputInt32(3) & mask, i.InputInt32(2) & mask);
int64_t imm2 =
make_uint64(i.InputInt32(5) & mask, i.InputInt32(4) & mask);
int64_t imm1 = make_uint64(i.InputInt32(3), i.InputInt32(2));
int64_t imm2 = make_uint64(i.InputInt32(5), i.InputInt32(4));
DCHECK_EQ(0, (imm1 | imm2) & (src0 == src1 ? 0xF0F0F0F0F0F0F0F0
: 0xE0E0E0E0E0E0E0E0));
UseScratchRegisterScope scope(tasm());
VRegister temp = scope.AcquireV(kFormat16B);
__ Movi(temp, imm2, imm1);
......
......@@ -3133,7 +3133,6 @@ void LiftoffAssembler::emit_i8x16_shuffle(LiftoffRegister dst,
}
int table_size = src1 == src2 ? 2 : 4;
uint32_t mask = table_size == 2 ? 0x0F0F0F0F : 0x1F1F1F1F;
int scratch_s_base = scratch.code() * 4;
for (int j = 0; j < 4; j++) {
......@@ -3141,11 +3140,9 @@ void LiftoffAssembler::emit_i8x16_shuffle(LiftoffRegister dst,
for (int i = 3; i >= 0; i--) {
imm = (imm << 8) | shuffle[j * 4 + i];
}
uint32_t four_lanes = imm;
DCHECK_EQ(0, imm & (table_size == 2 ? 0xF0F0F0F0 : 0xE0E0E0E0));
// Ensure indices are in [0,15] if table_size is 2, or [0,31] if 4.
four_lanes &= mask;
vmov(SwVfpRegister::from_code(scratch_s_base + j),
Float32::FromBits(four_lanes));
vmov(SwVfpRegister::from_code(scratch_s_base + j), Float32::FromBits(imm));
}
DwVfpRegister table_base = src1.low();
......
......@@ -2187,12 +2187,13 @@ void LiftoffAssembler::emit_i8x16_shuffle(LiftoffRegister dst,
Mov(src2.Q(), rhs.fp().Q());
}
uint8_t mask = lhs == rhs ? 0x0F : 0x1F;
int64_t imms[2] = {0, 0};
for (int i = 7; i >= 0; i--) {
imms[0] = (imms[0] << 8) | (shuffle[i] & mask);
imms[1] = (imms[1] << 8) | (shuffle[i + 8] & mask);
imms[0] = (imms[0] << 8) | (shuffle[i]);
imms[1] = (imms[1] << 8) | (shuffle[i + 8]);
}
DCHECK_EQ(0, (imms[0] | imms[1]) &
(lhs == rhs ? 0xF0F0F0F0F0F0F0F0 : 0xE0E0E0E0E0E0E0E0));
Movi(temp.V16B(), imms[1], imms[0]);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment