ruby-bench/burn_in.rb at main · ruby/ruby-bench · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
#!/usr/bin/env ruby

require 'etc'
require 'optparse'
require 'ostruct'
require 'pathname'
require 'fileutils'
require 'shellwords'
require 'csv'
require 'json'
require 'rbconfig'
require 'etc'
require 'yaml'
require 'open3'

# Default values for command-line arguments
args = OpenStruct.new({
  logs_path: "./logs_burn_in",
  delete_old_logs: false,
  num_procs: Etc.nprocessors,
  num_long_runs: 4,
  categories: ['headline', 'other'],
  no_yjit: false,
})

# Parse the command-line options
OptionParser.new do |opts|
  opts.on("--logs_path=OUT_PATH", "directory where to store output data files") do |v|
    args.logs_path = v
  end

  opts.on("--delete_old_logs") do
    args.delete_old_logs = true
  end

  opts.on("--num_procs=N", "number of processes to use in total") do |v|
    args.num_procs = v.to_i
  end

  opts.on("--num_long_runs=N", "number of processes to use for long runs") do |v|
    args.num_long_runs = v.to_i
  end

  opts.on("--category=headline,other,micro,ractor,ractor-only", "when given, only benchmarks with specified categories will run") do |v|
    args.categories = v.split(",")
  end

  opts.on("--no_yjit", "when given, test with the CRuby interpreter, without enabling YJIT") do
    args.no_yjit = true
  end
end.parse!

def free_file_path(parent_dir, name_prefix)
  (1..).each do |file_no|
    out_path = File.join(parent_dir, "#{name_prefix}_%03d.txt" % file_no)
    if !File.exist?(out_path)
      return out_path
    end
  end
end

def run_benchmark(bench_name, no_yjit, logs_path, run_time, ruby_version, metadata)
  bench_dir = 'benchmarks'
  entry = metadata[bench_name] || {}
  harness = entry.fetch('default_harness', 'harness')

  script_path = File.join(bench_dir, bench_name, 'benchmark.rb')
  if not File.exist?(script_path)
    script_path = File.join(bench_dir, bench_name + '.rb')
  end

  # Assemble random environment variable options to test
  test_env_vars = {}
  if rand < 0.5
    test_env_vars["RUBY_GC_AUTO_COMPACT"] = "1"
  end

  env = {
    "WARMUP_ITRS"=> "0",
    "MIN_BENCH_TIME"=> run_time.to_s,
    "RUST_BACKTRACE"=> "1",
  }
  env.merge!(test_env_vars)

  # Assemble random command-line options to test
  if no_yjit
    test_options = []
  else
    test_options = [
      "--yjit-call-threshold=#{[1, 2, 10, 30].sample()}",
      "--yjit-cold-threshold=#{[1, 2, 5, 10, 500, 50_000].sample()}",
      [
        "--yjit-mem-size=#{[1, 2, 3, 4, 5, 10, 64, 128].sample()}",
        "--yjit-exec-mem-size=#{[1, 2, 3, 4, 5, 10, 64, 128].sample()}",
      ].sample(),
      ['--yjit-code-gc', nil].sample(),
      ['--yjit-perf', nil].sample(),
      ['--yjit-stats', nil].sample(),
      ['--yjit-log=/dev/null', nil].sample(),
    ].compact
  end

  # Assemble the command string
  cmd = [
    'ruby',
    *test_options,
    "-I#{harness}",
    script_path,
  ].compact
  cmd_str = cmd.shelljoin

  # Prepend the tested environment variables to the command string
  # that we show to the user. We produce this separate command string
  # because capture2e doesn't support this syntax.
  user_cmd_str = cmd_str.dup
  test_env_vars.each do |name, value|
    user_cmd_str = "export #{name}=#{value} && " + user_cmd_str
  end

  puts "pid #{Process.pid} running benchmark #{bench_name}:"
  puts user_cmd_str
  output, status = Open3.capture2e(env, cmd_str)

  # If we got an error
  if !status.success?
    # Lobsters can run into connection errors with multiprocessing (port already taken, etc.), ignore that
    if bench_name == "lobsters" && output.include?("HTTP status is")
      return false
    end

    # Hexapdf can run into errors due to multiprocessing due to filesystem side-effects, ignore that
    if bench_name == "hexapdf" && output.include?("Incorrect size")
      return false
    end

    puts "ERROR"

    # Write command executed and output
    out_path = free_file_path(logs_path, "error_#{bench_name.gsub('/', '_')}")
    puts "writing output file #{out_path}"
    contents = ruby_version + "\n\n" + "pid #{status.pid}\n" + user_cmd_str + "\n\n" + output
    File.write(out_path, contents)

    # Error
    return true
  end

  # No error
  return false
end

def test_loop(bench_names, no_yjit, logs_path, run_time, ruby_version, metadata)
  error_found = false

  while true
    bench_name = bench_names.sample()
    error = run_benchmark(bench_name, no_yjit, logs_path, run_time, ruby_version, metadata)
    error_found ||= error

    if error_found
      puts "ERROR ENCOUNTERED"
    end
  end
end

# Create the output directory
if Dir.exist?(args.logs_path)
  if args.delete_old_logs
    FileUtils.rm_r(args.logs_path)
  else
    puts("Logs directory already exists. Move or delete #{args.logs_path} before running.")
    exit(-1)
  end
end
FileUtils.mkdir_p(args.logs_path)

# Get Ruby version string
ruby_version = IO.popen("ruby -v --yjit", &:read).strip
puts ruby_version

# Check that YJIT is available
if !ruby_version.include?("+YJIT")
  puts("Ruby version string doesn't include +YJIT. You may want to run `chruby ruby-yjit`.")
  exit(-1)
end

# Check if debug info is included in Ruby binary (this only works on Linux, not macOS)
output = IO.popen("file `which ruby`", &:read).strip
if !output.include?("debug_info")
  puts("WARNING: could not detect debug info in ruby binary! You may want to rebuild in dev mode so you can produce useful core dumps!")
  puts()
  sleep(10)
end

# Extract the names of benchmarks in the categories we want
metadata = YAML.load_file('benchmarks.yml')
bench_names = []

if args.categories.include?('ractor-only')
  # Include only benchmarks with ractor_only: true
  metadata.each do |name, entry|
    if entry['ractor_only']
      bench_names << name
    end
  end
elsif args.categories.include?('ractor')
  # Include benchmarks with ractor: true or ractor_only: true
  metadata.each do |name, entry|
    if entry['ractor'] || entry['ractor_only']
      bench_names << name
    end
  end

  # Also include regular category benchmarks if other categories are specified
  if args.categories.any? { |cat| ['headline', 'other', 'micro'].include?(cat) }
    metadata.each do |name, entry|
      category = entry.fetch('category', 'other')
      if args.categories.include?(category) && !bench_names.include?(name)
        bench_names << name
      end
    end
  end
else
  # Regular category filtering - exclude ractor-only and ractor harness benchmarks
  metadata.each do |name, entry|
    category = entry.fetch('category', 'other')
    is_ractor_only = entry['ractor_only'] ||
      (entry['ractor'] && entry['default_harness'] == 'harness-ractor')
    if args.categories.include?(category) && !is_ractor_only
      bench_names << name
    end
  end
end

bench_names.sort!

# Fork the test processes
puts "num processes: #{args.num_procs}"
args.num_procs.times do |i|
  pid = Process.fork do
    run_time = (i < args.num_long_runs)? (3600 * 2):10
    test_loop(bench_names, args.no_yjit, args.logs_path, run_time, ruby_version, metadata)
  end
end

# We need some kind of busy loop to not exit?
# Loop and sleep, report if forked processes crashed?
while true
  sleep(50 * 0.001)
end