Commit d953d9fb authored by Clemens Hammacher's avatar Clemens Hammacher Committed by Commit Bot

[compiler] Add fast path for simple parallel moves

Most parallel moves do not actually require the heavy analysis in the
GapResolver since there is no overlap between source and destination
registers. Handle some of these cases by a fast-path to avoid the
quadratic behaviour in the general case.
The fast path is taken for about 2/3 of the non-empty parallel moves on
wasm workloads.

R=herhut@chromium.org, titzer@chromium.org

Bug: v8:8423
Change-Id: I026256fd6cf268f176fccc97f0f427e07629aeb3
Reviewed-on: https://chromium-review.googlesource.com/c/1400410
Commit-Queue: Clemens Hammacher <clemensh@chromium.org>
Reviewed-by: 's avatarStephan Herhut <herhut@chromium.org>
Reviewed-by: 's avatarBen Titzer <titzer@chromium.org>
Cr-Commit-Position: refs/heads/master@{#58644}
parent 78081872
...@@ -8,6 +8,7 @@ ...@@ -8,6 +8,7 @@
#include <set> #include <set>
#include "src/register-configuration.h" #include "src/register-configuration.h"
#include "src/utils.h"
namespace v8 { namespace v8 {
namespace internal { namespace internal {
...@@ -73,31 +74,54 @@ MoveOperands* Split(MoveOperands* move, MachineRepresentation smaller_rep, ...@@ -73,31 +74,54 @@ MoveOperands* Split(MoveOperands* move, MachineRepresentation smaller_rep,
return move; return move;
} }
enum MoveOperandKind : uint8_t { kConstant, kGpReg, kFpReg, kStack };
MoveOperandKind GetKind(const InstructionOperand& move) {
if (move.IsConstant()) return kConstant;
LocationOperand loc_op = LocationOperand::cast(move);
if (loc_op.location_kind() != LocationOperand::REGISTER) return kStack;
return IsFloatingPoint(loc_op.representation()) ? kFpReg : kGpReg;
}
} // namespace } // namespace
void GapResolver::Resolve(ParallelMove* moves) { void GapResolver::Resolve(ParallelMove* moves) {
// Clear redundant moves, and collect FP move representations if aliasing EnumSet<MoveOperandKind, uint8_t> source_kinds;
// is non-simple. EnumSet<MoveOperandKind, uint8_t> destination_kinds;
int reps = 0;
for (size_t i = 0; i < moves->size();) { // Remove redundant moves, collect source kinds and destination kinds to
MoveOperands* move = (*moves)[i]; // detect simple non-overlapping moves, and collect FP move representations if
// aliasing is non-simple.
int fp_reps = 0;
for (auto it = moves->begin(); it != moves->end();) {
MoveOperands* move = *it;
if (move->IsRedundant()) { if (move->IsRedundant()) {
(*moves)[i] = moves->back(); *it = moves->back();
moves->pop_back(); moves->pop_back();
continue; continue;
} }
i++; source_kinds.Add(GetKind(move->source()));
destination_kinds.Add(GetKind(move->destination()));
if (!kSimpleFPAliasing && move->destination().IsFPRegister()) { if (!kSimpleFPAliasing && move->destination().IsFPRegister()) {
reps |= RepresentationBit( fp_reps |= RepresentationBit(
LocationOperand::cast(move->destination()).representation()); LocationOperand::cast(move->destination()).representation());
} }
++it;
}
if ((source_kinds & destination_kinds).IsEmpty() || moves->size() < 2) {
// Fast path for non-conflicting parallel moves.
for (MoveOperands* move : *moves) {
assembler_->AssembleMove(&move->source(), &move->destination());
}
return;
} }
if (!kSimpleFPAliasing) { if (!kSimpleFPAliasing) {
if (reps && !base::bits::IsPowerOfTwo(reps)) { if (fp_reps && !base::bits::IsPowerOfTwo(fp_reps)) {
// Start with the smallest FP moves, so we never encounter smaller moves // Start with the smallest FP moves, so we never encounter smaller moves
// in the middle of a cycle of larger moves. // in the middle of a cycle of larger moves.
if ((reps & RepresentationBit(MachineRepresentation::kFloat32)) != 0) { if ((fp_reps & RepresentationBit(MachineRepresentation::kFloat32)) != 0) {
split_rep_ = MachineRepresentation::kFloat32; split_rep_ = MachineRepresentation::kFloat32;
for (size_t i = 0; i < moves->size(); ++i) { for (size_t i = 0; i < moves->size(); ++i) {
auto move = (*moves)[i]; auto move = (*moves)[i];
...@@ -105,7 +129,7 @@ void GapResolver::Resolve(ParallelMove* moves) { ...@@ -105,7 +129,7 @@ void GapResolver::Resolve(ParallelMove* moves) {
PerformMove(moves, move); PerformMove(moves, move);
} }
} }
if ((reps & RepresentationBit(MachineRepresentation::kFloat64)) != 0) { if ((fp_reps & RepresentationBit(MachineRepresentation::kFloat64)) != 0) {
split_rep_ = MachineRepresentation::kFloat64; split_rep_ = MachineRepresentation::kFloat64;
for (size_t i = 0; i < moves->size(); ++i) { for (size_t i = 0; i < moves->size(); ++i) {
auto move = (*moves)[i]; auto move = (*moves)[i];
......
...@@ -815,6 +815,9 @@ class EnumSet { ...@@ -815,6 +815,9 @@ class EnumSet {
EnumSet operator|(const EnumSet& set) const { EnumSet operator|(const EnumSet& set) const {
return EnumSet(bits_ | set.bits_); return EnumSet(bits_ | set.bits_);
} }
EnumSet operator&(const EnumSet& set) const {
return EnumSet(bits_ & set.bits_);
}
private: private:
static_assert(std::is_enum<E>::value, "EnumSet can only be used with enums"); static_assert(std::is_enum<E>::value, "EnumSet can only be used with enums");
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment