Commit 1096e031 authored by Jakob Gruber's avatar Jakob Gruber Committed by Commit Bot

[nci] Implement tier-up, part 2 (marking)

This is part two of the implementation (part 1: heuristics in NCI code
to call the runtime profiler, part 2: heuristics in the runtime
profiler to mark the function for optimization, part 3: the final
part, recognizing and acting upon the marked function).

The runtime profiler heuristics added here remain very similar to what
we have for ignition, except that we now inspect optimized frames with
NCI code, and that we (currently) do not OSR from NCI to TF.

Bug: v8:8888
Change-Id: Ie88b0a0dcee16334cea585c771a4b505035f2291
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2358748
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Reviewed-by: 's avatarMythri Alle <mythria@chromium.org>
Cr-Commit-Position: refs/heads/master@{#69484}
parent 8f87753f
...@@ -74,24 +74,52 @@ std::ostream& operator<<(std::ostream& os, OptimizationReason reason) { ...@@ -74,24 +74,52 @@ std::ostream& operator<<(std::ostream& os, OptimizationReason reason) {
return os << OptimizationReasonToString(reason); return os << OptimizationReasonToString(reason);
} }
RuntimeProfiler::RuntimeProfiler(Isolate* isolate) namespace {
: isolate_(isolate), any_ic_changed_(false) {}
void TraceInOptimizationQueue(JSFunction function) {
if (FLAG_trace_opt_verbose) {
PrintF("[function ");
function.PrintName();
PrintF(" has been marked manually for optimization]\n");
}
}
static void TraceRecompile(JSFunction function, const char* reason, void TraceHeuristicOptimizationDisallowed(JSFunction function) {
const char* type, Isolate* isolate) { if (FLAG_trace_opt_verbose) {
PrintF("[function ");
function.PrintName();
PrintF(" has been marked manually for optimization]\n");
}
}
void TraceRecompile(JSFunction function, OptimizationReason reason,
Isolate* isolate) {
if (FLAG_trace_opt) { if (FLAG_trace_opt) {
CodeTracer::Scope scope(isolate->GetCodeTracer()); CodeTracer::Scope scope(isolate->GetCodeTracer());
PrintF(scope.file(), "[marking "); PrintF(scope.file(), "[marking ");
function.ShortPrint(scope.file()); function.ShortPrint(scope.file());
PrintF(scope.file(), " for %s recompilation, reason: %s", type, reason); PrintF(scope.file(), " for optimized recompilation, reason: %s",
OptimizationReasonToString(reason));
PrintF(scope.file(), "]\n"); PrintF(scope.file(), "]\n");
} }
} }
void TraceNCIRecompile(JSFunction function, OptimizationReason reason) {
if (FLAG_trace_turbo_nci) {
StdoutStream os;
os << "NCI tierup mark: " << Brief(function) << ", "
<< OptimizationReasonToString(reason) << std::endl;
}
}
} // namespace
RuntimeProfiler::RuntimeProfiler(Isolate* isolate)
: isolate_(isolate), any_ic_changed_(false) {}
void RuntimeProfiler::Optimize(JSFunction function, OptimizationReason reason) { void RuntimeProfiler::Optimize(JSFunction function, OptimizationReason reason) {
DCHECK_NE(reason, OptimizationReason::kDoNotOptimize); DCHECK_NE(reason, OptimizationReason::kDoNotOptimize);
TraceRecompile(function, OptimizationReasonToString(reason), "optimized", TraceRecompile(function, reason, isolate_);
isolate_);
function.MarkForOptimization(ConcurrencyMode::kConcurrent); function.MarkForOptimization(ConcurrencyMode::kConcurrent);
} }
...@@ -122,27 +150,20 @@ void RuntimeProfiler::AttemptOnStackReplacement(InterpretedFrame* frame, ...@@ -122,27 +150,20 @@ void RuntimeProfiler::AttemptOnStackReplacement(InterpretedFrame* frame,
Min(level + loop_nesting_levels, AbstractCode::kMaxLoopNestingMarker)); Min(level + loop_nesting_levels, AbstractCode::kMaxLoopNestingMarker));
} }
void RuntimeProfiler::MaybeOptimize(JSFunction function, void RuntimeProfiler::MaybeOptimizeInterpretedFrame(JSFunction function,
InterpretedFrame* frame) { InterpretedFrame* frame) {
if (function.IsInOptimizationQueue()) { if (function.IsInOptimizationQueue()) {
if (FLAG_trace_opt_verbose) { TraceInOptimizationQueue(function);
PrintF("[function ");
function.PrintName();
PrintF(" is already in optimization queue]\n");
}
return; return;
} }
if (FLAG_testing_d8_test_runner) { if (FLAG_testing_d8_test_runner &&
if (!PendingOptimizationTable::IsHeuristicOptimizationAllowed(isolate_, !PendingOptimizationTable::IsHeuristicOptimizationAllowed(isolate_,
function)) { function)) {
if (FLAG_trace_opt_verbose) { TraceHeuristicOptimizationDisallowed(function);
PrintF("[function ");
function.PrintName();
PrintF(" has been marked manually for optimization]\n");
}
return; return;
} }
}
if (function.shared().optimization_disabled()) return;
if (FLAG_always_osr) { if (FLAG_always_osr) {
AttemptOnStackReplacement(frame, AbstractCode::kMaxLoopNestingMarker); AttemptOnStackReplacement(frame, AbstractCode::kMaxLoopNestingMarker);
...@@ -151,12 +172,38 @@ void RuntimeProfiler::MaybeOptimize(JSFunction function, ...@@ -151,12 +172,38 @@ void RuntimeProfiler::MaybeOptimize(JSFunction function,
return; return;
} }
OptimizationReason reason =
ShouldOptimize(function, function.shared().GetBytecodeArray());
if (reason != OptimizationReason::kDoNotOptimize) {
Optimize(function, reason);
}
}
void RuntimeProfiler::MaybeOptimizeNCIFrame(JSFunction function) {
DCHECK_EQ(function.code().kind(), CodeKind::NATIVE_CONTEXT_INDEPENDENT);
if (function.IsInOptimizationQueue()) {
TraceInOptimizationQueue(function);
return;
}
if (FLAG_testing_d8_test_runner &&
!PendingOptimizationTable::IsHeuristicOptimizationAllowed(isolate_,
function)) {
TraceHeuristicOptimizationDisallowed(function);
return;
}
if (function.shared().optimization_disabled()) return; if (function.shared().optimization_disabled()) return;
// Note: NCI code does not OSR except when FLAG_turbo_nci_as_highest_tier
// is enabled, in which case we do not tier up from NCI code.
OptimizationReason reason = OptimizationReason reason =
ShouldOptimize(function, function.shared().GetBytecodeArray()); ShouldOptimize(function, function.shared().GetBytecodeArray());
if (reason != OptimizationReason::kDoNotOptimize) { if (reason != OptimizationReason::kDoNotOptimize) {
TraceNCIRecompile(function, reason);
Optimize(function, reason); Optimize(function, reason);
} }
} }
...@@ -190,7 +237,7 @@ bool RuntimeProfiler::MaybeOSR(JSFunction function, InterpretedFrame* frame) { ...@@ -190,7 +237,7 @@ bool RuntimeProfiler::MaybeOSR(JSFunction function, InterpretedFrame* frame) {
OptimizationReason RuntimeProfiler::ShouldOptimize(JSFunction function, OptimizationReason RuntimeProfiler::ShouldOptimize(JSFunction function,
BytecodeArray bytecode) { BytecodeArray bytecode) {
if (function.HasAvailableOptimizedCode()) { if (function.ActiveTierIsTurbofan()) {
return OptimizationReason::kDoNotOptimize; return OptimizationReason::kDoNotOptimize;
} }
int ticks = function.feedback_vector().profiler_ticks(); int ticks = function.feedback_vector().profiler_ticks();
...@@ -219,22 +266,24 @@ OptimizationReason RuntimeProfiler::ShouldOptimize(JSFunction function, ...@@ -219,22 +266,24 @@ OptimizationReason RuntimeProfiler::ShouldOptimize(JSFunction function,
return OptimizationReason::kDoNotOptimize; return OptimizationReason::kDoNotOptimize;
} }
void RuntimeProfiler::MarkCandidatesForOptimizationFromBytecode() { RuntimeProfiler::MarkCandidatesForOptimizationScope::
HandleScope scope(isolate_); MarkCandidatesForOptimizationScope(RuntimeProfiler* profiler)
: handle_scope_(profiler->isolate_), profiler_(profiler) {
if (!isolate_->use_optimizer()) return;
DisallowHeapAllocation no_gc;
TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.compile"), TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.compile"),
"V8.MarkCandidatesForOptimization"); "V8.MarkCandidatesForOptimization");
}
// Run through the JavaScript frames and collect them. If we already RuntimeProfiler::MarkCandidatesForOptimizationScope::
// have a sample of the function, we mark it for optimizations ~MarkCandidatesForOptimizationScope() {
// (eagerly or lazily). profiler_->any_ic_changed_ = false;
int frame_count = 0; }
int frame_count_limit = FLAG_frame_count;
for (JavaScriptFrameIterator it(isolate_); void RuntimeProfiler::MarkCandidatesForOptimizationFromBytecode() {
frame_count++ < frame_count_limit && !it.done(); it.Advance()) { if (!isolate_->use_optimizer()) return;
MarkCandidatesForOptimizationScope scope(this);
int i = 0;
for (JavaScriptFrameIterator it(isolate_); i < FLAG_frame_count && !it.done();
i++, it.Advance()) {
JavaScriptFrame* frame = it.frame(); JavaScriptFrame* frame = it.frame();
if (!frame->is_interpreted()) continue; if (!frame->is_interpreted()) continue;
...@@ -244,24 +293,35 @@ void RuntimeProfiler::MarkCandidatesForOptimizationFromBytecode() { ...@@ -244,24 +293,35 @@ void RuntimeProfiler::MarkCandidatesForOptimizationFromBytecode() {
if (!function.has_feedback_vector()) continue; if (!function.has_feedback_vector()) continue;
MaybeOptimize(function, InterpretedFrame::cast(frame)); MaybeOptimizeInterpretedFrame(function, InterpretedFrame::cast(frame));
// TODO(leszeks): Move this increment to before the maybe optimize checks, // TODO(leszeks): Move this increment to before the maybe optimize checks,
// and update the tests to assume the increment has already happened. // and update the tests to assume the increment has already happened.
int ticks = function.feedback_vector().profiler_ticks(); function.feedback_vector().SaturatingIncrementProfilerTicks();
if (ticks < Smi::kMaxValue) {
function.feedback_vector().set_profiler_ticks(ticks + 1);
}
} }
any_ic_changed_ = false;
} }
void RuntimeProfiler::MarkCandidatesForOptimizationFromCode() { void RuntimeProfiler::MarkCandidatesForOptimizationFromCode() {
if (FLAG_trace_turbo_nci) { if (!isolate_->use_optimizer()) return;
StdoutStream os; MarkCandidatesForOptimizationScope scope(this);
os << "NCI tier-up: Marking candidates for optimization" << std::endl; int i = 0;
for (JavaScriptFrameIterator it(isolate_); i < FLAG_frame_count && !it.done();
i++, it.Advance()) {
JavaScriptFrame* frame = it.frame();
if (!frame->is_optimized()) continue;
JSFunction function = frame->function();
if (function.code().kind() != CodeKind::NATIVE_CONTEXT_INDEPENDENT) {
continue;
}
DCHECK(function.shared().is_compiled());
DCHECK(function.has_feedback_vector());
function.feedback_vector().SaturatingIncrementProfilerTicks();
MaybeOptimizeNCIFrame(function);
} }
// TODO(jgruber,v8:8888): Implement.
} }
} // namespace internal } // namespace internal
......
...@@ -5,6 +5,8 @@ ...@@ -5,6 +5,8 @@
#ifndef V8_EXECUTION_RUNTIME_PROFILER_H_ #ifndef V8_EXECUTION_RUNTIME_PROFILER_H_
#define V8_EXECUTION_RUNTIME_PROFILER_H_ #define V8_EXECUTION_RUNTIME_PROFILER_H_
#include "src/common/assert-scope.h"
#include "src/handles/handles.h"
#include "src/utils/allocation.h" #include "src/utils/allocation.h"
namespace v8 { namespace v8 {
...@@ -31,7 +33,11 @@ class RuntimeProfiler { ...@@ -31,7 +33,11 @@ class RuntimeProfiler {
int nesting_levels = 1); int nesting_levels = 1);
private: private:
void MaybeOptimize(JSFunction function, InterpretedFrame* frame); // Make the decision whether to optimize the given function, and mark it for
// optimization if the decision was 'yes'.
void MaybeOptimizeNCIFrame(JSFunction function);
void MaybeOptimizeInterpretedFrame(JSFunction function,
InterpretedFrame* frame);
// Potentially attempts OSR from and returns whether no other // Potentially attempts OSR from and returns whether no other
// optimization attempts should be made. // optimization attempts should be made.
bool MaybeOSR(JSFunction function, InterpretedFrame* frame); bool MaybeOSR(JSFunction function, InterpretedFrame* frame);
...@@ -40,6 +46,17 @@ class RuntimeProfiler { ...@@ -40,6 +46,17 @@ class RuntimeProfiler {
void Optimize(JSFunction function, OptimizationReason reason); void Optimize(JSFunction function, OptimizationReason reason);
void Baseline(JSFunction function, OptimizationReason reason); void Baseline(JSFunction function, OptimizationReason reason);
class MarkCandidatesForOptimizationScope final {
public:
explicit MarkCandidatesForOptimizationScope(RuntimeProfiler* profiler);
~MarkCandidatesForOptimizationScope();
private:
HandleScope handle_scope_;
RuntimeProfiler* const profiler_;
DisallowHeapAllocation no_gc;
};
Isolate* isolate_; Isolate* isolate_;
bool any_ic_changed_; bool any_ic_changed_;
}; };
......
...@@ -376,7 +376,8 @@ inline bool Code::is_interpreter_trampoline_builtin() const { ...@@ -376,7 +376,8 @@ inline bool Code::is_interpreter_trampoline_builtin() const {
inline bool Code::checks_optimization_marker() const { inline bool Code::checks_optimization_marker() const {
bool checks_marker = bool checks_marker =
(builtin_index() == Builtins::kCompileLazy || (builtin_index() == Builtins::kCompileLazy ||
builtin_index() == Builtins::kInterpreterEntryTrampoline); builtin_index() == Builtins::kInterpreterEntryTrampoline ||
CodeKindChecksOptimizationMarker(kind()));
return checks_marker || return checks_marker ||
(CodeKindCanDeoptimize(kind()) && marked_for_deoptimization()); (CodeKindCanDeoptimize(kind()) && marked_for_deoptimization());
} }
......
...@@ -72,6 +72,11 @@ inline constexpr bool CodeKindCanDeoptimize(CodeKind kind) { ...@@ -72,6 +72,11 @@ inline constexpr bool CodeKindCanDeoptimize(CodeKind kind) {
return CodeKindIsOptimizedJSFunction(kind); return CodeKindIsOptimizedJSFunction(kind);
} }
inline constexpr bool CodeKindChecksOptimizationMarker(CodeKind kind) {
return kind == CodeKind::INTERPRETED_FUNCTION ||
kind == CodeKind::NATIVE_CONTEXT_INDEPENDENT;
}
inline CodeKind CodeKindForTopTier() { inline CodeKind CodeKindForTopTier() {
return FLAG_turbo_nci_as_highest_tier ? CodeKind::NATIVE_CONTEXT_INDEPENDENT return FLAG_turbo_nci_as_highest_tier ? CodeKind::NATIVE_CONTEXT_INDEPENDENT
: CodeKind::OPTIMIZED_FUNCTION; : CodeKind::OPTIMIZED_FUNCTION;
......
...@@ -374,6 +374,11 @@ void FeedbackVector::AddToVectorsForProfilingTools( ...@@ -374,6 +374,11 @@ void FeedbackVector::AddToVectorsForProfilingTools(
isolate->SetFeedbackVectorsForProfilingTools(*list); isolate->SetFeedbackVectorsForProfilingTools(*list);
} }
void FeedbackVector::SaturatingIncrementProfilerTicks() {
int ticks = profiler_ticks();
if (ticks < Smi::kMaxValue) set_profiler_ticks(ticks + 1);
}
// static // static
void FeedbackVector::SetOptimizedCode(Handle<FeedbackVector> vector, void FeedbackVector::SetOptimizedCode(Handle<FeedbackVector> vector,
Handle<Code> code) { Handle<Code> code) {
......
...@@ -213,6 +213,9 @@ class FeedbackVector : public HeapObject { ...@@ -213,6 +213,9 @@ class FeedbackVector : public HeapObject {
// runtime profiler. // runtime profiler.
DECL_INT32_ACCESSORS(profiler_ticks) DECL_INT32_ACCESSORS(profiler_ticks)
// Increment profiler ticks, saturating at the maximal value.
void SaturatingIncrementProfilerTicks();
// Initialize the padding if necessary. // Initialize the padding if necessary.
inline void clear_padding(); inline void clear_padding();
......
...@@ -132,17 +132,13 @@ bool JSFunction::ActiveTierIsIgnition() const { ...@@ -132,17 +132,13 @@ bool JSFunction::ActiveTierIsIgnition() const {
bool JSFunction::ActiveTierIsTurbofan() const { bool JSFunction::ActiveTierIsTurbofan() const {
CodeKind highest_tier; CodeKind highest_tier;
if (!HighestTierOf(GetAvailableCodeKinds(), &highest_tier)) return false; if (!HighestTierOf(GetAvailableCodeKinds(), &highest_tier)) return false;
bool result = highest_tier == CodeKind::OPTIMIZED_FUNCTION; return highest_tier == CodeKind::OPTIMIZED_FUNCTION;
DCHECK_IMPLIES(result, !code().marked_for_deoptimization());
return result;
} }
bool JSFunction::ActiveTierIsNCI() const { bool JSFunction::ActiveTierIsNCI() const {
CodeKind highest_tier; CodeKind highest_tier;
if (!HighestTierOf(GetAvailableCodeKinds(), &highest_tier)) return false; if (!HighestTierOf(GetAvailableCodeKinds(), &highest_tier)) return false;
bool result = highest_tier == CodeKind::NATIVE_CONTEXT_INDEPENDENT; return highest_tier == CodeKind::NATIVE_CONTEXT_INDEPENDENT;
DCHECK_IMPLIES(result, !code().marked_for_deoptimization());
return result;
} }
bool JSFunction::HasOptimizationMarker() { bool JSFunction::HasOptimizationMarker() {
...@@ -237,7 +233,7 @@ void JSFunction::ClearOptimizedCodeSlot(const char* reason) { ...@@ -237,7 +233,7 @@ void JSFunction::ClearOptimizedCodeSlot(const char* reason) {
void JSFunction::SetOptimizationMarker(OptimizationMarker marker) { void JSFunction::SetOptimizationMarker(OptimizationMarker marker) {
DCHECK(has_feedback_vector()); DCHECK(has_feedback_vector());
DCHECK(ChecksOptimizationMarker()); DCHECK(ChecksOptimizationMarker());
DCHECK(!HasAvailableOptimizedCode()); DCHECK(!ActiveTierIsTurbofan());
feedback_vector().SetOptimizationMarker(marker); feedback_vector().SetOptimizationMarker(marker);
} }
...@@ -458,9 +454,9 @@ void JSFunction::MarkForOptimization(ConcurrencyMode mode) { ...@@ -458,9 +454,9 @@ void JSFunction::MarkForOptimization(ConcurrencyMode mode) {
mode = ConcurrencyMode::kNotConcurrent; mode = ConcurrencyMode::kNotConcurrent;
} }
DCHECK(!is_compiled() || ActiveTierIsIgnition()); DCHECK(!is_compiled() || ActiveTierIsIgnition() || ActiveTierIsNCI());
DCHECK(!ActiveTierIsTurbofan());
DCHECK(shared().IsInterpreted()); DCHECK(shared().IsInterpreted());
DCHECK(!HasAvailableOptimizedCode());
DCHECK(shared().allows_lazy_compilation() || DCHECK(shared().allows_lazy_compilation() ||
!shared().optimization_disabled()); !shared().optimization_disabled());
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment