Commit 70f7557e authored by Ng Zhi An's avatar Ng Zhi An Committed by Commit Bot

[wasm simd] Implement F64x2Neg on x64

Bug: v8:8460
Change-Id: I3e649e1398be429b8aff5b57316e320f9ca5ae8f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/1703763
Commit-Queue: Zhi An Ng <zhin@chromium.org>
Reviewed-by: 's avatarMichael Starzinger <mstarzinger@chromium.org>
Reviewed-by: 's avatarBill Budge <bbudge@chromium.org>
Reviewed-by: 's avatarDeepti Gandluri <gdeepti@chromium.org>
Cr-Commit-Position: refs/heads/master@{#62817}
parent e9b00902
...@@ -1822,6 +1822,8 @@ void InstructionSelector::VisitNode(Node* node) { ...@@ -1822,6 +1822,8 @@ void InstructionSelector::VisitNode(Node* node) {
return MarkAsSimd128(node), VisitF64x2ReplaceLane(node); return MarkAsSimd128(node), VisitF64x2ReplaceLane(node);
case IrOpcode::kF64x2Abs: case IrOpcode::kF64x2Abs:
return MarkAsSimd128(node), VisitF64x2Abs(node); return MarkAsSimd128(node), VisitF64x2Abs(node);
case IrOpcode::kF64x2Neg:
return MarkAsSimd128(node), VisitF64x2Neg(node);
case IrOpcode::kF64x2Eq: case IrOpcode::kF64x2Eq:
return MarkAsSimd128(node), VisitF64x2Eq(node); return MarkAsSimd128(node), VisitF64x2Eq(node);
case IrOpcode::kF64x2Ne: case IrOpcode::kF64x2Ne:
...@@ -2552,6 +2554,7 @@ void InstructionSelector::VisitF64x2Splat(Node* node) { UNIMPLEMENTED(); } ...@@ -2552,6 +2554,7 @@ void InstructionSelector::VisitF64x2Splat(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2ExtractLane(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2ExtractLane(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2ReplaceLane(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2ReplaceLane(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Abs(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Abs(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Neg(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Eq(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Eq(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Ne(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Ne(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Lt(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Lt(Node* node) { UNIMPLEMENTED(); }
......
...@@ -2292,6 +2292,23 @@ CodeGenerator::CodeGenResult CodeGenerator::AssembleArchInstruction( ...@@ -2292,6 +2292,23 @@ CodeGenerator::CodeGenResult CodeGenerator::AssembleArchInstruction(
} }
break; break;
} }
case kX64F64x2Neg: {
// TODO(zhin): look at kSSEFloat64Neg instruction selection and codegen to
// avoid having 2 cases here, and potentially share code
CpuFeatureScope sse_scope(tasm(), SSE4_1);
XMMRegister dst = i.OutputSimd128Register();
XMMRegister src = i.InputSimd128Register(0);
if (dst == src) {
__ pcmpeqq(kScratchDoubleReg, kScratchDoubleReg);
__ psllq(kScratchDoubleReg, 63);
__ xorpd(dst, kScratchDoubleReg);
} else {
__ pcmpeqq(dst, dst);
__ psllq(dst, 63);
__ xorpd(dst, src);
}
break;
}
case kX64F64x2Eq: { case kX64F64x2Eq: {
DCHECK_EQ(i.OutputSimd128Register(), i.InputSimd128Register(0)); DCHECK_EQ(i.OutputSimd128Register(), i.InputSimd128Register(0));
__ cmpeqpd(i.OutputSimd128Register(), i.InputSimd128Register(1)); __ cmpeqpd(i.OutputSimd128Register(), i.InputSimd128Register(1));
......
...@@ -162,6 +162,7 @@ namespace compiler { ...@@ -162,6 +162,7 @@ namespace compiler {
V(X64F64x2ExtractLane) \ V(X64F64x2ExtractLane) \
V(X64F64x2ReplaceLane) \ V(X64F64x2ReplaceLane) \
V(X64F64x2Abs) \ V(X64F64x2Abs) \
V(X64F64x2Neg) \
V(X64F64x2Eq) \ V(X64F64x2Eq) \
V(X64F64x2Ne) \ V(X64F64x2Ne) \
V(X64F64x2Lt) \ V(X64F64x2Lt) \
......
...@@ -128,6 +128,7 @@ int InstructionScheduler::GetTargetInstructionFlags( ...@@ -128,6 +128,7 @@ int InstructionScheduler::GetTargetInstructionFlags(
case kX64F64x2ExtractLane: case kX64F64x2ExtractLane:
case kX64F64x2ReplaceLane: case kX64F64x2ReplaceLane:
case kX64F64x2Abs: case kX64F64x2Abs:
case kX64F64x2Neg:
case kX64F64x2Eq: case kX64F64x2Eq:
case kX64F64x2Ne: case kX64F64x2Ne:
case kX64F64x2Lt: case kX64F64x2Lt:
......
...@@ -2661,6 +2661,7 @@ VISIT_ATOMIC_BINOP(Xor) ...@@ -2661,6 +2661,7 @@ VISIT_ATOMIC_BINOP(Xor)
#define SIMD_UNOP_LIST(V) \ #define SIMD_UNOP_LIST(V) \
V(F64x2Abs) \ V(F64x2Abs) \
V(F64x2Neg) \
V(F32x4SConvertI32x4) \ V(F32x4SConvertI32x4) \
V(F32x4Abs) \ V(F32x4Abs) \
V(F32x4Neg) \ V(F32x4Neg) \
......
...@@ -247,6 +247,7 @@ MachineType AtomicOpType(Operator const* op) { ...@@ -247,6 +247,7 @@ MachineType AtomicOpType(Operator const* op) {
V(Word32PairSar, Operator::kNoProperties, 3, 0, 2) \ V(Word32PairSar, Operator::kNoProperties, 3, 0, 2) \
V(F64x2Splat, Operator::kNoProperties, 1, 0, 1) \ V(F64x2Splat, Operator::kNoProperties, 1, 0, 1) \
V(F64x2Abs, Operator::kNoProperties, 1, 0, 1) \ V(F64x2Abs, Operator::kNoProperties, 1, 0, 1) \
V(F64x2Neg, Operator::kNoProperties, 1, 0, 1) \
V(F64x2Eq, Operator::kCommutative, 2, 0, 1) \ V(F64x2Eq, Operator::kCommutative, 2, 0, 1) \
V(F64x2Ne, Operator::kCommutative, 2, 0, 1) \ V(F64x2Ne, Operator::kCommutative, 2, 0, 1) \
V(F64x2Lt, Operator::kNoProperties, 2, 0, 1) \ V(F64x2Lt, Operator::kNoProperties, 2, 0, 1) \
......
...@@ -470,6 +470,7 @@ class V8_EXPORT_PRIVATE MachineOperatorBuilder final ...@@ -470,6 +470,7 @@ class V8_EXPORT_PRIVATE MachineOperatorBuilder final
// SIMD operators. // SIMD operators.
const Operator* F64x2Splat(); const Operator* F64x2Splat();
const Operator* F64x2Abs(); const Operator* F64x2Abs();
const Operator* F64x2Neg();
const Operator* F64x2ExtractLane(int32_t); const Operator* F64x2ExtractLane(int32_t);
const Operator* F64x2ReplaceLane(int32_t); const Operator* F64x2ReplaceLane(int32_t);
const Operator* F64x2Eq(); const Operator* F64x2Eq();
......
...@@ -744,6 +744,7 @@ ...@@ -744,6 +744,7 @@
V(F64x2ExtractLane) \ V(F64x2ExtractLane) \
V(F64x2ReplaceLane) \ V(F64x2ReplaceLane) \
V(F64x2Abs) \ V(F64x2Abs) \
V(F64x2Neg) \
V(F64x2Eq) \ V(F64x2Eq) \
V(F64x2Ne) \ V(F64x2Ne) \
V(F64x2Lt) \ V(F64x2Lt) \
......
...@@ -3996,6 +3996,8 @@ Node* WasmGraphBuilder::SimdOp(wasm::WasmOpcode opcode, Node* const* inputs) { ...@@ -3996,6 +3996,8 @@ Node* WasmGraphBuilder::SimdOp(wasm::WasmOpcode opcode, Node* const* inputs) {
return graph()->NewNode(mcgraph()->machine()->F64x2Splat(), inputs[0]); return graph()->NewNode(mcgraph()->machine()->F64x2Splat(), inputs[0]);
case wasm::kExprF64x2Abs: case wasm::kExprF64x2Abs:
return graph()->NewNode(mcgraph()->machine()->F64x2Abs(), inputs[0]); return graph()->NewNode(mcgraph()->machine()->F64x2Abs(), inputs[0]);
case wasm::kExprF64x2Neg:
return graph()->NewNode(mcgraph()->machine()->F64x2Neg(), inputs[0]);
case wasm::kExprF64x2Eq: case wasm::kExprF64x2Eq:
return graph()->NewNode(mcgraph()->machine()->F64x2Eq(), inputs[0], return graph()->NewNode(mcgraph()->machine()->F64x2Eq(), inputs[0],
inputs[1]); inputs[1]);
......
...@@ -2299,6 +2299,7 @@ class ThreadImpl { ...@@ -2299,6 +2299,7 @@ class ThreadImpl {
return true; \ return true; \
} }
UNOP_CASE(F64x2Abs, f64x2, float2, 2, std::abs(a)) UNOP_CASE(F64x2Abs, f64x2, float2, 2, std::abs(a))
UNOP_CASE(F64x2Neg, f64x2, float2, 2, -a)
UNOP_CASE(F32x4Abs, f32x4, float4, 4, std::abs(a)) UNOP_CASE(F32x4Abs, f32x4, float4, 4, std::abs(a))
UNOP_CASE(F32x4Neg, f32x4, float4, 4, -a) UNOP_CASE(F32x4Neg, f32x4, float4, 4, -a)
UNOP_CASE(F32x4RecipApprox, f32x4, float4, 4, base::Recip(a)) UNOP_CASE(F32x4RecipApprox, f32x4, float4, 4, base::Recip(a))
......
...@@ -220,6 +220,7 @@ const char* WasmOpcodes::OpcodeName(WasmOpcode opcode) { ...@@ -220,6 +220,7 @@ const char* WasmOpcodes::OpcodeName(WasmOpcode opcode) {
// SIMD opcodes. // SIMD opcodes.
CASE_SIMD_OP(Splat, "splat") CASE_SIMD_OP(Splat, "splat")
CASE_SIMD_OP(Neg, "neg") CASE_SIMD_OP(Neg, "neg")
CASE_F64x2_OP(Neg, "neg")
CASE_I64x2_OP(Neg, "neg") CASE_I64x2_OP(Neg, "neg")
CASE_SIMD_OP(Eq, "eq") CASE_SIMD_OP(Eq, "eq")
CASE_F64x2_OP(Eq, "eq") CASE_F64x2_OP(Eq, "eq")
......
...@@ -386,6 +386,7 @@ bool IsJSCompatibleSignature(const FunctionSig* sig, bool hasBigIntFeature); ...@@ -386,6 +386,7 @@ bool IsJSCompatibleSignature(const FunctionSig* sig, bool hasBigIntFeature);
V(F32x4Min, 0xfd9e, s_ss) \ V(F32x4Min, 0xfd9e, s_ss) \
V(F32x4Max, 0xfd9f, s_ss) \ V(F32x4Max, 0xfd9f, s_ss) \
V(F64x2Abs, 0xfda0, s_s) \ V(F64x2Abs, 0xfda0, s_s) \
V(F64x2Neg, 0xfda1, s_s) \
V(I32x4SConvertF32x4, 0xfdab, s_s) \ V(I32x4SConvertF32x4, 0xfdab, s_s) \
V(I32x4UConvertF32x4, 0xfdac, s_s) \ V(I32x4UConvertF32x4, 0xfdac, s_s) \
V(F32x4SConvertI32x4, 0xfdaf, s_s) \ V(F32x4SConvertI32x4, 0xfdaf, s_s) \
......
...@@ -954,6 +954,10 @@ WASM_SIMD_TEST_NO_LOWERING(F64x2Abs) { ...@@ -954,6 +954,10 @@ WASM_SIMD_TEST_NO_LOWERING(F64x2Abs) {
RunF64x2UnOpTest(execution_tier, lower_simd, kExprF64x2Abs, std::abs); RunF64x2UnOpTest(execution_tier, lower_simd, kExprF64x2Abs, std::abs);
} }
WASM_SIMD_TEST_NO_LOWERING(F64x2Neg) {
RunF64x2UnOpTest(execution_tier, lower_simd, kExprF64x2Neg, Negate);
}
WASM_SIMD_TEST_NO_LOWERING(I64x2Splat) { WASM_SIMD_TEST_NO_LOWERING(I64x2Splat) {
WasmRunner<int32_t, int64_t> r(execution_tier, lower_simd); WasmRunner<int32_t, int64_t> r(execution_tier, lower_simd);
// Set up a global to hold output vector. // Set up a global to hold output vector.
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment