ruby-bench/lib/benchmark_suite.rb at 64ce9ad6ceafc7364641ff2f4e4b10f98f399fc4 · Shopify/ruby-bench · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
# frozen_string_literal: true

require 'json'
require 'pathname'
require 'fileutils'
require 'shellwords'
require 'etc'
require 'yaml'
require 'rbconfig'
require_relative 'benchmark_filter'
require_relative 'benchmark_runner'
require_relative 'benchmark_discovery'

# BenchmarkSuite runs a collection of benchmarks and collects their results
class BenchmarkSuite
  BENCHMARKS_DIR = "benchmarks"
  RACTOR_CATEGORY = ["ractor"].freeze
  RACTOR_ONLY_CATEGORY = ["ractor-only"].freeze
  RACTOR_HARNESS = "harness-ractor"

  attr_reader :categories, :name_filters, :excludes, :out_path, :harness, :harness_explicit, :pre_init, :no_pinning, :force_pinning, :bench_dir

  def initialize(categories:, name_filters:, excludes: [], out_path:, harness:, harness_explicit: false, pre_init: nil, no_pinning: false, force_pinning: false)
    @categories = categories
    @name_filters = name_filters
    @excludes = excludes
    @out_path = out_path
    @harness = harness
    @harness_explicit = harness_explicit
    @pre_init = pre_init ? expand_pre_init(pre_init) : nil
    @no_pinning = no_pinning
    @force_pinning = force_pinning
    @bench_dir = BENCHMARKS_DIR
  end

  # Run all the benchmarks and record execution times
  # Returns [bench_data, bench_failures]
  def run(ruby:, ruby_description:)
    bench_data = {}
    bench_failures = {}

    benchmark_entries = discover_benchmarks
    env = benchmark_env(ruby)
    caller_json_path = ENV["RESULT_JSON_PATH"]

    # Capture quiet setting before entering unbundled env (which clears ENV)
    quiet = ENV['BENCHMARK_QUIET'] == '1'

    benchmark_entries.each_with_index do |entry, idx|
      puts("Running benchmark \"#{entry.name}\" (#{idx+1}/#{benchmark_entries.length})")

      result_json_path = caller_json_path || File.join(out_path, "temp#{Process.pid}.json")
      cmd_prefix = base_cmd(ruby_description, entry.name)

      # Clear project-level Bundler environment so benchmarks run in a clean context.
      # Benchmarks that need Bundler (e.g., railsbench) set up their own via use_gemfile.
      # This is important when running tests under `bundle exec rake test`.
      result = if defined?(Bundler)
        Bundler.with_unbundled_env do
          run_single_benchmark(entry.script_path, result_json_path, ruby, cmd_prefix, env, entry.name, quiet: quiet)
        end
      else
        run_single_benchmark(entry.script_path, result_json_path, ruby, cmd_prefix, env, entry.name, quiet: quiet)
      end

      if result[:success]
        bench_data[entry.name] = process_benchmark_result(result_json_path, result[:command], delete_file: !caller_json_path)
      else
        bench_failures[entry.name] = result[:status].exitstatus
        FileUtils.rm_f(result_json_path) unless caller_json_path
      end
    end

    [bench_data, bench_failures]
  end

  private

  def setup_benchmark_directories
    if @ractor_only
      @bench_dir = RACTOR_BENCHMARKS_DIR
      @ractor_bench_dir = RACTOR_BENCHMARKS_DIR
      @harness = RACTOR_HARNESS
      @categories = []
    else
      @bench_dir = BENCHMARKS_DIR
      @ractor_bench_dir = RACTOR_BENCHMARKS_DIR
    end
  end

  def process_benchmark_result(result_json_path, command, delete_file: true)
    JSON.parse(File.read(result_json_path)).tap do |json|
      json["command_line"] = command
      File.unlink(result_json_path) if delete_file
    end
  end

  def discover_benchmarks
    all_entries = discover_all_benchmark_entries
    directory_map = build_directory_map(all_entries)
    filter_benchmarks(all_entries, directory_map)
  end

  def discover_all_benchmark_entries
    discovery = BenchmarkDiscovery.new(bench_dir)
    { main: discovery.discover }
  end

  def build_directory_map(all_entries)
    all_entries[:main].each_with_object({}) do |entry, map|
      map[entry.name] = entry.directory
    end
  end

  def filter_benchmarks(all_entries, directory_map)
    filter_entries(
      all_entries[:main],
      categories: categories,
      name_filters: name_filters,
      excludes: excludes,
      directory_map: directory_map
    )
  end

  def filter_entries(entries, categories:, name_filters:, excludes:, directory_map:)
    filter = BenchmarkFilter.new(
      categories: categories,
      name_filters: name_filters,
      excludes: excludes,
      metadata: benchmarks_metadata,
      directory_map: directory_map
    )
    entries.select { |entry| filter.match?(entry.name) }
  end

  def run_single_benchmark(script_path, result_json_path, ruby, cmd_prefix, env, benchmark_name, quiet: false)
    # Fix for jruby/jruby#7394 in JRuby 9.4.2.0
    script_path = File.expand_path(script_path)

    # Save and restore ENV["RESULT_JSON_PATH"] to avoid polluting the environment
    # for subsequent runs (e.g., when running multiple executables)
    original_result_json_path = ENV["RESULT_JSON_PATH"]
    ENV["RESULT_JSON_PATH"] = result_json_path

    # Use per-benchmark default_harness if set, otherwise use global harness
    benchmark_harness = benchmark_harness_for(benchmark_name)

    # Set up the benchmarking command
    cmd = cmd_prefix + [
      *ruby,
      "-I", benchmark_harness,
      *pre_init,
      script_path,
    ].compact

    # Do the benchmarking
    result = BenchmarkRunner.check_call(cmd.shelljoin, env: env, raise_error: false, quiet: quiet)
    result[:command] = cmd.shelljoin
    result
  ensure
    if original_result_json_path
      ENV["RESULT_JSON_PATH"] = original_result_json_path
    else
      ENV.delete("RESULT_JSON_PATH")
    end
  end

  def benchmark_harness_for(benchmark_name)
    return harness if harness_explicit

    benchmark_meta = benchmarks_metadata[benchmark_name] || {}
    default = ractor_category_run? ? RACTOR_HARNESS : harness
    benchmark_meta.fetch('default_harness', default)
  end

  def benchmark_env(ruby)
    # When the Ruby running this script is not the first Ruby in PATH, shell commands
    # like `bundle install` in a child process will not use the Ruby being benchmarked.
    # It overrides PATH to guarantee the commands of the benchmarked Ruby will be used.
    env = {}
    ruby_path = `#{ruby.shelljoin} -e 'print RbConfig.ruby' 2> #{File::NULL}`

    if ruby_path != RbConfig.ruby
      env["PATH"] = "#{File.dirname(ruby_path)}:#{ENV["PATH"]}"

      # chruby sets GEM_HOME and GEM_PATH in your shell. We have to unset it in the child
      # process to avoid installing gems to the version that is running run_benchmarks.rb.
      ["GEM_HOME", "GEM_PATH"].each do |var|
        env[var] = nil if ENV.key?(var)
      end
    end

    # Pass benchmark configuration env vars to subprocess.
    # These may be set after bundler loads, so they'd be lost with with_unbundled_env.
    ["WARMUP_ITRS", "MIN_BENCH_ITRS", "MIN_BENCH_TIME", "YJIT_BENCH_STATS", "ZJIT_BENCH_STATS"].each do |var|
      env[var] = ENV[var] if ENV.key?(var)
    end

    env
  end

  def benchmarks_metadata
    @benchmarks_metadata ||= YAML.load_file('benchmarks.yml')
  end

  # Check if running on Linux
  def linux?
    @linux ||= RbConfig::CONFIG['host_os'] =~ /linux/
  end

  # Set up the base command with CPU pinning if needed
  def base_cmd(ruby_description, benchmark_name)
    if linux?
      cmd = setarch_prefix

      # Pin the process to one given core to improve caching and reduce variance on CRuby
      # Other Rubies need to use multiple cores, e.g., for JIT threads
      if ruby_description.start_with?('ruby ') && should_pin?(benchmark_name)
        # The last few cores of Intel CPU may be slow E-Cores, so avoid using the last one.
        cpu = [(Etc.nprocessors / 2) - 1, 0].max
        cmd.concat(["taskset", "-c", "#{cpu}"])
      end

      cmd
    else
      []
    end
  end

  def should_pin?(benchmark_name)
    return false if no_pinning
    return true if force_pinning
    return false if ractor_category_run?

    benchmark_meta = benchmarks_metadata[benchmark_name] || {}
    !benchmark_meta["no_pinning"]
  end

  def ractor_category_run?
    categories == RACTOR_CATEGORY || categories == RACTOR_ONLY_CATEGORY
  end

  # Generate setarch prefix for Linux
  def setarch_prefix
    # Disable address space randomization (for determinism)
    prefix = ["setarch", `uname -m`.strip, "-R"]

    # Abort if we don't have permission (perhaps in a docker container).
    return [] unless system(*prefix, "true", out: File::NULL, err: File::NULL)

    prefix
  end

  # Resolve the pre_init file path into a form that can be required
  def expand_pre_init(path)
    path = Pathname.new(path)

    unless path.exist?
      puts "--with-pre-init called with non-existent file!"
      exit(-1)
    end

    if path.directory?
      puts "--with-pre-init called with a directory, please pass a .rb file"
      exit(-1)
    end

    library_name = path.basename(path.extname)
    load_path = path.parent.expand_path

    [
      "-I", load_path,
      "-r", library_name
    ]
  end
end