Fuzzer: Ignore fuzz testcases that make VMs run out of stack (#6376)

When the stack runs out is observable and optimizations can change it, so we must ignore such testcases. Also add some logic to help debug stuff like this, as suggested by tlively in the past, to add some metrics on the reasons we ignored a testcase. That emits something like this: (ignored 253 iters, for reasons {'too many errors vs calls': 230, '[host limit ': 20, 'uninitialized non-defaultable local': 3}) As a drive by make the metrics print wasm bytes/iter rather than by second (the former is easy to compute from the latter anyhow, and the latter is more interesting I think).
author: Alon Zakai <azakai@google.com> 2024-03-04 15:55:36 -0800
committer: GitHub <noreply@github.com> 2024-03-04 15:55:36 -0800
commit: 00ed4115fb89a0fac3231eba07f5f737cf721acd (patch)
tree: 6031d9747b8165cd5b079793a44adce5cc608d3a
parent: 53f8d5f7bd32c8b47ee235033f3f913a8f3f2d09 (diff)
download: binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.tar.gz
binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.tar.bz2
binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.zip
1 files changed, 19 insertions, 8 deletions
diff --git a/scripts/fuzz_opt.py b/scripts/fuzz_opt.py
index 448a00705..4b4439e4f 100755
--- a/scripts/fuzz_opt.py
+++ b/scripts/fuzz_opt.py
@@ -622,12 +622,17 @@ def fix_spec_output(out):
 
 
 ignored_vm_runs = 0
+ignored_vm_run_reasons = dict()
 
 
-def note_ignored_vm_run(text='(ignore VM run)'):
+# Notes a VM run that we ignore, and the reason for it (for metrics purposes).
+# Extra text can also be printed that is not included in the metrics.
+def note_ignored_vm_run(reason, extra_text=''):
     global ignored_vm_runs
-    print(text)
+    print(f'(ignore VM run: {reason}{extra_text})')
     ignored_vm_runs += 1
+    ignored_vm_run_reasons.setdefault(reason, 0)
+    ignored_vm_run_reasons[reason] += 1
 
 
 def run_vm(cmd):
@@ -644,6 +649,11 @@ def run_vm(cmd):
             # this text is emitted from V8 when it runs out of memory during a
             # GC allocation.
             'out of memory',
+            # if the call stack is exceeded we must ignore this, as
+            # optimizations can change whether this happens or not (e.g. by
+            # removing locals, which makes stack frames smaller), which is
+            # noticeable.
+            'Maximum call stack size exceeded',
             # all host limitations are arbitrary and may differ between VMs and
             # also be affected by optimizations, so ignore them.
             # this is the prefix that the binaryen interpreter emits. For V8,
@@ -656,7 +666,7 @@ def run_vm(cmd):
         ]
         for issue in known_issues:
             if issue in output:
-                note_ignored_vm_run()
+                note_ignored_vm_run(issue)
                 return IGNORE
         return output
 
@@ -769,7 +779,7 @@ class CompareVMs(TestCaseHandler):
                         # still be useful testing here (up to 50%), so we only
                         # note that this is a mostly-ignored run, but we do not
                         # ignore the parts that are useful.
-                        note_ignored_vm_run(f'(testcase mostly ignored: {calls} calls, {errors} errors)')
+                        note_ignored_vm_run('too many errors vs calls', extra_text=f' ({calls} calls, {errors} errors)')
                 return output
 
             def can_run(self, wasm):
@@ -1688,10 +1698,11 @@ if __name__ == '__main__':
         elapsed = max(0.000001, time.time() - start_time)
         print('ITERATION:', counter, 'seed:', seed, 'size:', input_size,
               '(mean:', str(mean) + ', stddev:', str(stddev) + ')',
-              'speed:', counter / elapsed,
-              'iters/sec, ', total_wasm_size / elapsed,
-              'wasm_bytes/sec, ', ignored_vm_runs,
-              'ignored\n')
+              'speed:', counter / elapsed, 'iters/sec, ',
+              total_wasm_size / counter, 'wasm_bytes/iter')
+        if ignored_vm_runs:
+            print(f'(ignored {ignored_vm_runs} iters, for reasons {ignored_vm_run_reasons})')
+        print()
         make_random_input(input_size, raw_input_data)
         assert os.path.getsize(raw_input_data) == input_size
         # remove the generated wasm file, so that we can tell if the fuzzer
author	Alon Zakai <azakai@google.com>	2024-03-04 15:55:36 -0800
committer	GitHub <noreply@github.com>	2024-03-04 15:55:36 -0800
commit	00ed4115fb89a0fac3231eba07f5f737cf721acd (patch)
tree	6031d9747b8165cd5b079793a44adce5cc608d3a
parent	53f8d5f7bd32c8b47ee235033f3f913a8f3f2d09 (diff)
download	binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.tar.gz binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.tar.bz2 binaryen-00ed4115fb89a0fac3231eba07f5f737cf721acd.zip