ruby
diff --git a/‎test/ruby/test_yjit.rb
Lines changed: 41 additions & 11 deletions b/‎test/ruby/test_yjit.rb
Lines changed: 41 additions & 11 deletions
diff --git a/‎yjit.c
Lines changed: 85 additions & 0 deletions b/‎yjit.c
Lines changed: 85 additions & 0 deletions
diff --git a/‎yjit.rb
Lines changed: 91 additions & 0 deletions b/‎yjit.rb
Lines changed: 91 additions & 0 deletions
diff --git a/‎yjit/bindgen/src/main.rs
Lines changed: 4 additions & 0 deletions b/‎yjit/bindgen/src/main.rs
Lines changed: 4 additions & 0 deletions
@@ -56,6 +56,11 @@ def test_yjit_stats_and_v_no_error
     refute_includes(stderr, "NoMethodError")
   end
 
+  def test_yjit_trace_exits_and_v_no_error
+    _stdout, stderr, _status = EnvUtil.invoke_ruby(%w(-v --yjit-trace-exits), '', true, true)
+    refute_includes(stderr, "NoMethodError")
+  end
+
   def test_enable_from_env_var
     yjit_child_env = {'RUBY_YJIT_ENABLE' => '1'}
     assert_in_out_err([yjit_child_env, '--version'], '') do |stdout, stderr|
@@ -68,7 +73,7 @@ def test_enable_from_env_var
 
   def test_compile_setclassvariable
     script = 'class Foo; def self.foo; @@foo = 1; end; end; Foo.foo'
-    assert_compiles(script, insns: %i[setclassvariable], result: 1)
+    assert_compiles(script, insns: %i[setclassvariable], result: 1, trace_exits: true) # trace_exits: also validate RubyVM::YJIT.exit_locations
   end
 
   def test_compile_getclassvariable
@@ -81,20 +86,20 @@ def test_compile_putnil
   end
 
   def test_compile_putobject
-    assert_compiles('true', insns: %i[putobject], result: true)
-    assert_compiles('123', insns: %i[putobject], result: 123)
-    assert_compiles(':foo', insns: %i[putobject], result: :foo)
+    assert_compiles('true', insns: %i[putobject], result: true, trace_exits: true)
+    assert_compiles('123', insns: %i[putobject], result: 123, trace_exits: true)
+    assert_compiles(':foo', insns: %i[putobject], result: :foo, trace_exits: true)
   end
 
   def test_compile_opt_succ
     assert_compiles('1.succ', insns: %i[opt_succ], result: 2)
   end
 
   def test_compile_opt_not
-    assert_compiles('!false', insns: %i[opt_not], result: true)
-    assert_compiles('!nil', insns: %i[opt_not], result: true)
-    assert_compiles('!true', insns: %i[opt_not], result: false)
-    assert_compiles('![]', insns: %i[opt_not], result: false)
+    assert_compiles('!false', insns: %i[opt_not], result: true, trace_exits: true)
+    assert_compiles('!nil', insns: %i[opt_not], result: true, trace_exits: true)
+    assert_compiles('!true', insns: %i[opt_not], result: false, trace_exits: true)
+    assert_compiles('![]', insns: %i[opt_not], result: false, trace_exits: true)
   end
 
   def test_compile_opt_newarray
@@ -653,14 +658,15 @@ def assert_no_exits(script)
   end
 
   ANY = Object.new
-  def assert_compiles(test_script, insns: [], call_threshold: 1, stdout: nil, exits: {}, result: ANY, frozen_string_literal: nil)
+  def assert_compiles(test_script, insns: [], call_threshold: 1, stdout: nil, exits: {}, trace_exits: false, result: ANY, frozen_string_literal: nil)
     reset_stats = <<~RUBY
       RubyVM::YJIT.runtime_stats
       RubyVM::YJIT.reset_stats!
     RUBY
 
     write_results = <<~RUBY
       stats = RubyVM::YJIT.runtime_stats
+      exit_locations = #{trace_exits} ? RubyVM::YJIT.exit_locations : nil
 
       def collect_insns(iseq)
         insns = RubyVM::YJIT.insns_compiled(iseq)
@@ -673,7 +679,8 @@ def collect_insns(iseq)
         result: #{result == ANY ? "nil" : "result"},
         stats: stats,
         insns: collect_insns(iseq),
-        disasm: iseq.disasm
+        disasm: iseq.disasm,
+        exit_locations: exit_locations
       })
     RUBY
 
@@ -700,6 +707,7 @@ def collect_insns(iseq)
     runtime_stats = stats[:stats]
     insns_compiled = stats[:insns]
     disasm = stats[:disasm]
+    exit_locations = stats[:exit_locations]
 
     # Check that exit counts are as expected
     # Full stats are only available when --enable-yjit=dev
@@ -729,6 +737,27 @@ def collect_insns(iseq)
         flunk "Expected to compile instructions #{missed_insns.join(", ")} but didn't.\niseq:\n#{disasm}"
       end
     end
+
+    if exit_locations
+      assert exit_locations.key?(:raw)
+      assert exit_locations.key?(:frames)
+      assert exit_locations.key?(:lines)
+      assert exit_locations.key?(:samples)
+      assert exit_locations.key?(:missed_samples)
+      assert exit_locations.key?(:gc_samples)
+
+      assert_equal 0, exit_locations[:missed_samples]
+      assert_equal 0, exit_locations[:gc_samples]
+
+      assert_not_empty exit_locations[:raw]
+      assert_not_empty exit_locations[:frames]
+      assert_not_empty exit_locations[:lines]
+
+      exit_locations[:frames].each do |frame_id, frame|
+        assert frame.key?(:samples)
+        assert frame.key?(:edges)
+      end
+    end
   end
 
   def script_shell_encode(s)
@@ -740,7 +769,8 @@ def eval_with_jit(script, call_threshold: 1, timeout: 1000)
     args = [
       "--disable-gems",
       "--yjit-call-threshold=#{call_threshold}",
-      "--yjit-stats"
+      "--yjit-stats",
+      "--yjit-trace-exits"
     ]
     args << "-e" << script_shell_encode(script)
     stats_r, stats_w = IO.pipe
 
@@ -25,6 +25,7 @@
 #include "probes.h"
 #include "probes_helper.h"
 #include "iseq.h"
+#include "ruby/debug.h"
 
 // For mmapp(), sysconf()
 #ifndef _WIN32
@@ -83,6 +84,88 @@ rb_yjit_mark_executable(void *mem_block, uint32_t mem_size)
     }
 }
 
+# define PTR2NUM(x)   (rb_int2inum((intptr_t)(void *)(x)))
+
+// Register `frame` in the `hash` of known frames, keyed by the frame VALUE
+// converted to an Integer with PTR2NUM. A frame whose key already maps to a
+// truthy entry is skipped; otherwise a hash holding its :name, :file and
+// (when the first line number is not 0) :line is stored under that key.
+static void
+rb_yjit_add_frame(VALUE hash, VALUE frame)
+{
+    VALUE frame_id = PTR2NUM(frame);
+
+    // Already recorded: nothing more to do.
+    if (RTEST(rb_hash_aref(hash, frame_id))) {
+        return;
+    }
+
+    VALUE frame_info = rb_hash_new();
+    VALUE name = rb_profile_frame_full_label(frame);
+    VALUE file = rb_profile_frame_absolute_path(frame);
+    VALUE line = rb_profile_frame_first_lineno(frame);
+
+    // Fall back to the plain path when no absolute path is available.
+    if (NIL_P(file)) {
+        file = rb_profile_frame_path(frame);
+    }
+
+    rb_hash_aset(frame_info, ID2SYM(rb_intern("name")), name);
+    rb_hash_aset(frame_info, ID2SYM(rb_intern("file")), file);
+
+    // A first line number of 0 is left out of the frame info.
+    if (line != INT2FIX(0)) {
+        rb_hash_aset(frame_info, ID2SYM(rb_intern("line")), line);
+    }
+
+    rb_hash_aset(hash, frame_id, frame_info);
+}
+
+// Converts the flat yjit_raw_samples and yjit_line_samples buffers (walked in lockstep up to samples_len)
+// into a hash with :raw, :lines and :frames keys for RubyVM::YJIT.exit_locations. No per-record bounds checks.
+VALUE
+rb_yjit_exit_locations_dict(VALUE *yjit_raw_samples, int *yjit_line_samples, int samples_len)
+{
+    VALUE result = rb_hash_new();
+    VALUE raw_samples = rb_ary_new_capa(samples_len);
+    VALUE line_samples = rb_ary_new_capa(samples_len);
+    VALUE frames = rb_hash_new();
+    int idx = 0;
+
+    // One record per iteration, laid out as [num, num frame entries, 2 trailing entries].
+    // Every entry is copied to the raw_samples and line_samples arrays. yjit.rb reads the first
+    // trailing entry as one more frame id and adds the second to its sample count.
+    while (idx < samples_len) {
+        int num = (int)yjit_raw_samples[idx];
+        int line_num = (int)yjit_line_samples[idx];
+        idx++;
+
+        rb_ary_push(raw_samples, SIZET2NUM(num));
+        rb_ary_push(line_samples, INT2NUM(line_num));
+
+        // The next num entries are frames: register each in the frames hash (skipped when
+        // already present) and copy the frame value and its line entry onto the raw_samples
+        // and line_samples arrays respectively.
+        for (int o = 0; o < num; o++) {
+            rb_yjit_add_frame(frames, yjit_raw_samples[idx]);
+            rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx]));
+            rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));
+            idx++;
+        }
+
+        rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx])); // trailing entry 1 of 2
+        rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));
+        idx++;
+
+        rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx])); // trailing entry 2 of 2
+        rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));
+        idx++;
+    }
+
+    // Store raw_samples, line_samples and frames in the result hash
+    // under the :raw, :lines and :frames keys.
+    rb_hash_aset(result, ID2SYM(rb_intern("raw")), raw_samples);
+    rb_hash_aset(result, ID2SYM(rb_intern("lines")), line_samples);
+    rb_hash_aset(result, ID2SYM(rb_intern("frames")), frames);
+
+    return result;
+}
+
 uint32_t
 rb_yjit_get_page_size(void)
 {
@@ -860,12 +943,14 @@ rb_yjit_invalidate_all_method_lookup_assumptions(void)
 
 // Primitives used by yjit.rb
 VALUE rb_yjit_stats_enabled_p(rb_execution_context_t *ec, VALUE self);
+VALUE rb_yjit_trace_exit_locations_enabled_p(rb_execution_context_t *ec, VALUE self); // called by RubyVM::YJIT.trace_exit_locations_enabled?
 VALUE rb_yjit_get_stats(rb_execution_context_t *ec, VALUE self);
 VALUE rb_yjit_reset_stats_bang(rb_execution_context_t *ec, VALUE self);
 VALUE rb_yjit_disasm_iseq(rb_execution_context_t *ec, VALUE self, VALUE iseq);
 VALUE rb_yjit_insns_compiled(rb_execution_context_t *ec, VALUE self, VALUE iseq);
 VALUE rb_yjit_simulate_oom_bang(rb_execution_context_t *ec, VALUE self);
 VALUE rb_yjit_get_stats(rb_execution_context_t *ec, VALUE self);
+VALUE rb_yjit_get_exit_locations(rb_execution_context_t *ec, VALUE self); // called by RubyVM::YJIT.exit_locations
 
 // Preprocessed yjit.rb generated during build
 #include "yjit.rbinc"
 
@@ -18,11 +18,102 @@ def self.stats_enabled?
     Primitive.rb_yjit_stats_enabled_p
   end
 
+  # Return whether exit-location tracing is enabled, as reported by the rb_yjit_trace_exit_locations_enabled_p primitive.
+  def self.trace_exit_locations_enabled?
+    Primitive.rb_yjit_trace_exit_locations_enabled_p
+  end
+
   # Discard statistics collected for --yjit-stats.
   def self.reset_stats!
     Primitive.rb_yjit_reset_stats_bang
   end
 
+  # If --yjit-trace-exits is enabled parse the hashes from
+  # Primitive.rb_yjit_get_exit_locations into a format readable
+  # by StackProf. This will allow us to find the exact location of a
+  # side exit in YJIT based on the instruction that is exiting.
+  #
+  # Usage:
+  #
+  # In a script call:
+  #
+  #   File.write("my_file.dump", Marshal.dump(RubyVM::YJIT.exit_locations))
+  #
+  # Then run the file with the following options:
+  #
+  #   ruby --yjit --yjit-stats --yjit-trace-exits test.rb
+  #
+  # Once the code is done running, use StackProf to read the dump file.
+  # See StackProf documentation for options.
+  def self.exit_locations
+    return unless trace_exit_locations_enabled?
+
+    results = Primitive.rb_yjit_get_exit_locations
+    raw_samples = results[:raw].dup
+    line_samples = results[:lines].dup
+    frames = results[:frames].dup
+    samples_count = 0
+
+    frames.each do |frame_id, frame|
+      frame[:samples] = 0
+      frame[:edges] = {}
+    end
+
+    # Loop through the instructions and set the frame hash with the data.
+    # We use nonexistent.def for the file name, otherwise insns.def will be displayed
+    # and that information isn't useful in this context.
+    RubyVM::INSTRUCTION_NAMES.each_with_index do |name, frame_id|
+      frame_hash = { samples: 0, total_samples: 0, edges: {}, name: name, file: "nonexistent.def", line: nil }
+      results[:frames][frame_id] = frame_hash
+      frames[frame_id] = frame_hash
+    end
+
+    # Loop through the raw_samples and build the hashes for StackProf.
+    # The loop is based off an example in the StackProf documentation and therefore
+    # this functionality can only work with that library.
+    while raw_samples.length > 0
+      stack_trace = raw_samples.shift(raw_samples.shift + 1)
+      lines = line_samples.shift(line_samples.shift + 1)
+      prev_frame_id = nil
+
+      stack_trace.each_with_index do |frame_id, idx|
+        if prev_frame_id
+          prev_frame = frames[prev_frame_id]
+          prev_frame[:edges][frame_id] ||= 0
+          prev_frame[:edges][frame_id] += 1
+        end
+
+        frame_info = frames[frame_id]
+        frame_info[:total_samples] ||= 0
+        frame_info[:total_samples] += 1
+
+        frame_info[:lines] ||= {}
+        frame_info[:lines][lines[idx]] ||= [0, 0]
+        frame_info[:lines][lines[idx]][0] += 1
+
+        prev_frame_id = frame_id
+      end
+
+      top_frame_id = stack_trace.last
+      top_frame_line = 1
+
+      frames[top_frame_id][:samples] += 1
+      frames[top_frame_id][:lines] ||= {}
+      frames[top_frame_id][:lines][top_frame_line] ||= [0, 0]
+      frames[top_frame_id][:lines][top_frame_line][1] += 1
+
+      samples_count += raw_samples.shift
+      line_samples.shift
+    end
+
+    results[:samples] = samples_count
+    # Set missed_samples and gc_samples to 0 as their values
+    # don't matter to us in this context.
+    results[:missed_samples] = 0
+    results[:gc_samples] = 0
+    results
+  end
+
   # Return a hash for statistics generated for the --yjit-stats command line option.
   # Return nil when option is not passed or unavailable.
   def self.runtime_stats
 
@@ -239,6 +239,7 @@ fn main() {
         .allowlist_function("rb_yjit_obj_written")
         .allowlist_function("rb_yjit_str_simple_append")
         .allowlist_function("rb_ENCODING_GET")
+        .allowlist_function("rb_yjit_exit_locations_dict")
 
         // from vm_sync.h
         .allowlist_function("rb_vm_barrier")
@@ -273,6 +274,9 @@ fn main() {
         .allowlist_function("rb_class_allocate_instance")
         .allowlist_function("rb_obj_info")
 
+        // From include/ruby/debug.h
+        .allowlist_function("rb_profile_frames")
+
         // We define VALUE manually, don't import it
         .blocklist_type("VALUE")