Implement F64x2Div for x64

Bug: v8:8460
Change-Id: I78cb2badab3f28621f91d6ff5f455967fdcbee44
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/1731782
Reviewed-by: Bill Budge <bbudge@chromium.org>
Reviewed-by: Michael Starzinger <mstarzinger@chromium.org>
Commit-Queue: Zhi An Ng <zhin@chromium.org>
Cr-Commit-Position: refs/heads/master@{#63171}
This commit is contained in:
Ng Zhi An 2019-08-02 10:28:04 -07:00 committed by Commit Bot
parent 390c430e6a
commit 7cefcded8e
16 changed files with 33 additions and 1 deletions

View File

@ -1334,7 +1334,7 @@ class V8_EXPORT_PRIVATE Assembler : public AssemblerBase {
AVX_S_3(vadd, 0x58) AVX_S_3(vadd, 0x58)
AVX_S_3(vsub, 0x5c) AVX_S_3(vsub, 0x5c)
AVX_S_3(vmul, 0x59) AVX_S_3(vmul, 0x59)
AVX_SP_3(vdiv, 0x5e) AVX_S_3(vdiv, 0x5e)
AVX_S_3(vmin, 0x5d) AVX_S_3(vmin, 0x5d)
AVX_S_3(vmax, 0x5f) AVX_S_3(vmax, 0x5f)
AVX_P_3(vand, 0x54) AVX_P_3(vand, 0x54)

View File

@ -13,6 +13,7 @@
V(subpd, 66, 0F, 5C) \ V(subpd, 66, 0F, 5C) \
V(minpd, 66, 0F, 5D) \ V(minpd, 66, 0F, 5D) \
V(maxpd, 66, 0F, 5F) \ V(maxpd, 66, 0F, 5F) \
V(divpd, 66, 0F, 5E) \
V(punpcklbw, 66, 0F, 60) \ V(punpcklbw, 66, 0F, 60) \
V(punpcklwd, 66, 0F, 61) \ V(punpcklwd, 66, 0F, 61) \
V(punpckldq, 66, 0F, 62) \ V(punpckldq, 66, 0F, 62) \

View File

@ -1853,6 +1853,8 @@ void InstructionSelector::VisitNode(Node* node) {
return MarkAsSimd128(node), VisitF64x2Sub(node); return MarkAsSimd128(node), VisitF64x2Sub(node);
case IrOpcode::kF64x2Mul: case IrOpcode::kF64x2Mul:
return MarkAsSimd128(node), VisitF64x2Mul(node); return MarkAsSimd128(node), VisitF64x2Mul(node);
case IrOpcode::kF64x2Div:
return MarkAsSimd128(node), VisitF64x2Div(node);
case IrOpcode::kF64x2Min: case IrOpcode::kF64x2Min:
return MarkAsSimd128(node), VisitF64x2Min(node); return MarkAsSimd128(node), VisitF64x2Min(node);
case IrOpcode::kF64x2Max: case IrOpcode::kF64x2Max:
@ -2600,6 +2602,7 @@ void InstructionSelector::VisitF64x2Neg(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Add(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Add(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Sub(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Sub(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Mul(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Mul(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Div(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Min(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Min(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Max(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Max(Node* node) { UNIMPLEMENTED(); }
void InstructionSelector::VisitF64x2Eq(Node* node) { UNIMPLEMENTED(); } void InstructionSelector::VisitF64x2Eq(Node* node) { UNIMPLEMENTED(); }

View File

@ -2310,6 +2310,10 @@ CodeGenerator::CodeGenResult CodeGenerator::AssembleArchInstruction(
ASSEMBLE_SSE_BINOP(mulpd); ASSEMBLE_SSE_BINOP(mulpd);
break; break;
} }
case kX64F64x2Div: {
ASSEMBLE_SSE_BINOP(divpd);
break;
}
case kX64F64x2Min: { case kX64F64x2Min: {
XMMRegister src1 = i.InputSimd128Register(1), XMMRegister src1 = i.InputSimd128Register(1),
dst = i.OutputSimd128Register(); dst = i.OutputSimd128Register();

View File

@ -166,6 +166,7 @@ namespace compiler {
V(X64F64x2Add) \ V(X64F64x2Add) \
V(X64F64x2Sub) \ V(X64F64x2Sub) \
V(X64F64x2Mul) \ V(X64F64x2Mul) \
V(X64F64x2Div) \
V(X64F64x2Min) \ V(X64F64x2Min) \
V(X64F64x2Max) \ V(X64F64x2Max) \
V(X64F64x2Eq) \ V(X64F64x2Eq) \

View File

@ -132,6 +132,7 @@ int InstructionScheduler::GetTargetInstructionFlags(
case kX64F64x2Add: case kX64F64x2Add:
case kX64F64x2Sub: case kX64F64x2Sub:
case kX64F64x2Mul: case kX64F64x2Mul:
case kX64F64x2Div:
case kX64F64x2Min: case kX64F64x2Min:
case kX64F64x2Max: case kX64F64x2Max:
case kX64F64x2Eq: case kX64F64x2Eq:

View File

@ -2599,6 +2599,7 @@ VISIT_ATOMIC_BINOP(Xor)
V(F64x2Add) \ V(F64x2Add) \
V(F64x2Sub) \ V(F64x2Sub) \
V(F64x2Mul) \ V(F64x2Mul) \
V(F64x2Div) \
V(F64x2Min) \ V(F64x2Min) \
V(F64x2Max) \ V(F64x2Max) \
V(F64x2Eq) \ V(F64x2Eq) \

View File

@ -256,6 +256,7 @@ MachineType AtomicOpType(Operator const* op) {
V(F64x2Add, Operator::kCommutative, 2, 0, 1) \ V(F64x2Add, Operator::kCommutative, 2, 0, 1) \
V(F64x2Sub, Operator::kNoProperties, 2, 0, 1) \ V(F64x2Sub, Operator::kNoProperties, 2, 0, 1) \
V(F64x2Mul, Operator::kCommutative, 2, 0, 1) \ V(F64x2Mul, Operator::kCommutative, 2, 0, 1) \
V(F64x2Div, Operator::kNoProperties, 2, 0, 1) \
V(F64x2Min, Operator::kCommutative, 2, 0, 1) \ V(F64x2Min, Operator::kCommutative, 2, 0, 1) \
V(F64x2Max, Operator::kCommutative, 2, 0, 1) \ V(F64x2Max, Operator::kCommutative, 2, 0, 1) \
V(F64x2Eq, Operator::kCommutative, 2, 0, 1) \ V(F64x2Eq, Operator::kCommutative, 2, 0, 1) \

View File

@ -474,6 +474,7 @@ class V8_EXPORT_PRIVATE MachineOperatorBuilder final
const Operator* F64x2Add(); const Operator* F64x2Add();
const Operator* F64x2Sub(); const Operator* F64x2Sub();
const Operator* F64x2Mul(); const Operator* F64x2Mul();
const Operator* F64x2Div();
const Operator* F64x2ExtractLane(int32_t); const Operator* F64x2ExtractLane(int32_t);
const Operator* F64x2Min(); const Operator* F64x2Min();
const Operator* F64x2Max(); const Operator* F64x2Max();

View File

@ -750,6 +750,7 @@
V(F64x2Add) \ V(F64x2Add) \
V(F64x2Sub) \ V(F64x2Sub) \
V(F64x2Mul) \ V(F64x2Mul) \
V(F64x2Div) \
V(F64x2Min) \ V(F64x2Min) \
V(F64x2Max) \ V(F64x2Max) \
V(F64x2Eq) \ V(F64x2Eq) \

View File

@ -4008,6 +4008,9 @@ Node* WasmGraphBuilder::SimdOp(wasm::WasmOpcode opcode, Node* const* inputs) {
case wasm::kExprF64x2Mul: case wasm::kExprF64x2Mul:
return graph()->NewNode(mcgraph()->machine()->F64x2Mul(), inputs[0], return graph()->NewNode(mcgraph()->machine()->F64x2Mul(), inputs[0],
inputs[1]); inputs[1]);
case wasm::kExprF64x2Div:
return graph()->NewNode(mcgraph()->machine()->F64x2Div(), inputs[0],
inputs[1]);
case wasm::kExprF64x2Min: case wasm::kExprF64x2Min:
return graph()->NewNode(mcgraph()->machine()->F64x2Min(), inputs[0], return graph()->NewNode(mcgraph()->machine()->F64x2Min(), inputs[0],
inputs[1]); inputs[1]);

View File

@ -1863,6 +1863,8 @@ int DisassemblerX64::TwoByteOpcodeInstruction(byte* data) {
mnemonic = "subpd"; mnemonic = "subpd";
} else if (opcode == 0x5D) { } else if (opcode == 0x5D) {
mnemonic = "minpd"; mnemonic = "minpd";
} else if (opcode == 0x5E) {
mnemonic = "divpd";
} else if (opcode == 0x5F) { } else if (opcode == 0x5F) {
mnemonic = "maxpd"; mnemonic = "maxpd";
} else if (opcode == 0x60) { } else if (opcode == 0x60) {

View File

@ -2244,6 +2244,7 @@ class ThreadImpl {
BINOP_CASE(F64x2Add, f64x2, float2, 2, a + b) BINOP_CASE(F64x2Add, f64x2, float2, 2, a + b)
BINOP_CASE(F64x2Sub, f64x2, float2, 2, a - b) BINOP_CASE(F64x2Sub, f64x2, float2, 2, a - b)
BINOP_CASE(F64x2Mul, f64x2, float2, 2, a * b) BINOP_CASE(F64x2Mul, f64x2, float2, 2, a * b)
BINOP_CASE(F64x2Div, f64x2, float2, 2, a / b)
BINOP_CASE(F64x2Min, f64x2, float2, 2, JSMin(a, b)) BINOP_CASE(F64x2Min, f64x2, float2, 2, JSMin(a, b))
BINOP_CASE(F64x2Max, f64x2, float2, 2, JSMax(a, b)) BINOP_CASE(F64x2Max, f64x2, float2, 2, JSMax(a, b))
BINOP_CASE(F32x4Add, f32x4, float4, 4, a + b) BINOP_CASE(F32x4Add, f32x4, float4, 4, a + b)

View File

@ -237,6 +237,7 @@ const char* WasmOpcodes::OpcodeName(WasmOpcode opcode) {
CASE_SIMD_OP(Mul, "mul") CASE_SIMD_OP(Mul, "mul")
CASE_F64x2_OP(Mul, "mul") CASE_F64x2_OP(Mul, "mul")
CASE_I64x2_OP(Mul, "mul") CASE_I64x2_OP(Mul, "mul")
CASE_F64x2_OP(Div, "div")
CASE_F64x2_OP(Splat, "splat") CASE_F64x2_OP(Splat, "splat")
CASE_F64x2_OP(Lt, "lt") CASE_F64x2_OP(Lt, "lt")
CASE_F64x2_OP(Le, "le") CASE_F64x2_OP(Le, "le")

View File

@ -406,6 +406,7 @@ bool IsJSCompatibleSignature(const FunctionSig* sig, bool hasBigIntFeature);
V(F64x2Add, 0xfda5, s_ss) \ V(F64x2Add, 0xfda5, s_ss) \
V(F64x2Sub, 0xfda6, s_ss) \ V(F64x2Sub, 0xfda6, s_ss) \
V(F64x2Mul, 0xfda7, s_ss) \ V(F64x2Mul, 0xfda7, s_ss) \
V(F64x2Div, 0xfda8, s_ss) \
V(F64x2Min, 0xfda9, s_ss) \ V(F64x2Min, 0xfda9, s_ss) \
V(F64x2Max, 0xfdaa, s_ss) \ V(F64x2Max, 0xfdaa, s_ss) \
V(I32x4SConvertF32x4, 0xfdab, s_s) \ V(I32x4SConvertF32x4, 0xfdab, s_s) \

View File

@ -86,6 +86,12 @@ T Mul(T a, T b) {
return a * b; return a * b;
} }
template <typename T, typename = typename std::enable_if<
std::is_floating_point<T>::value>::type>
T Div(T a, T b) {
return a / b;
}
template <typename T> template <typename T>
T Minimum(T a, T b) { T Minimum(T a, T b) {
return a <= b ? a : b; return a <= b ? a : b;
@ -1217,6 +1223,10 @@ WASM_SIMD_TEST_NO_LOWERING(F64x2Mul) {
RunF64x2BinOpTest(execution_tier, lower_simd, kExprF64x2Mul, Mul); RunF64x2BinOpTest(execution_tier, lower_simd, kExprF64x2Mul, Mul);
} }
WASM_SIMD_TEST_NO_LOWERING(F64x2Div) {
RunF64x2BinOpTest(execution_tier, lower_simd, kExprF64x2Div, Div);
}
WASM_SIMD_TEST_NO_LOWERING(F64x2Min) { WASM_SIMD_TEST_NO_LOWERING(F64x2Min) {
RunF64x2BinOpTest(execution_tier, lower_simd, kExprF64x2Min, JSMin); RunF64x2BinOpTest(execution_tier, lower_simd, kExprF64x2Min, JSMin);
} }