rems-project · bensimner · Apr 23, 2025 · Apr 17, 2025 · Apr 17, 2025 · Apr 17, 2025
diff --git a/Makefile b/Makefile
@@ -1,5 +1,5 @@
 .PHONY: build clean
-.PHONY: checks example-traces
+.PHONY: checks example-traces check-examples check-rocq
 .PHONY: casemate casemate-check casemate-lib
 .PHONY: help
 
@@ -53,5 +53,10 @@ clean:
 example-traces:
 	$(call build_subdir,RUN,examples,logs)
 
-checks:
-	$(call build_subdir,RUN,examples,checks)
+check-rocq:  # hands the examples/ check-rocq target to build_subdir (helper defined outside this hunk)
+	$(call build_subdir,RUN,examples,check-rocq)
+
+check-examples:  # hands the examples/ check-examples target to build_subdir
+	$(call build_subdir,RUN,examples,check-examples)
+
+checks: check-examples check-rocq  # umbrella target: requests both check suites
diff --git a/examples/Makefile b/examples/Makefile
@@ -1,4 +1,4 @@
-.PHONY: build clean logs list-build-objs
+.PHONY: build clean logs checks check-examples check-rocq list-build-objs  # check-* are commands, not files
 
 build-objs += simple
 build-objs += good_write
@@ -40,22 +40,20 @@ test_logs = $(patsubst %,$(src)/tests/%.log,$(build-objs))
 
 common_obj = $(src)/common.o
 
-test_checks = $(patsubst %,check-%,$(build-objs))
-
-checks: $(test_checks)
 expected: $(test_expects)
-logs: $(test_logs)
 
 .PRECIOUS: $(common_obj) $(test_objs) $(test_logs)
 
 $(src)/%: $(src)/tests/%.o $(common_obj) $(casemate_o)
 	$(call run_cmd,LD,$@,$(CC) $^ -o $@)
 
-$(src)/tests/%.log: FORCE
-	$(call run_cmd,RUN,$(src)/$*,test -f $(src)/$* && ($(src)/$* -at 1> $@ 2>/dev/null || true))
+check-examples: FORCE  # run_tests.py --examples: run each example, compare its output with expected/
+	$(call run_cmd,CHECK,examples,$(src)/scripts/run_tests.py --examples)
+
+check-rocq: FORCE  # run_tests.py --rocq: run `dune exec casemate` on each expected log
+	$(call run_cmd,CHECK,examples,$(src)/scripts/run_tests.py --rocq)
 
-check-%: $(src)/tests/%.log FORCE
-	$(call run_cmd,CHECK,$(src)/$*,$(src)/scripts/check_simulation.py $< $(src)/$(EXPECTEDDIR)/$*.log)
+checks: check-examples check-rocq  # umbrella target: both suites
 
 clean-%:
 	$(call run_clean,$(src)/$*,rm -f $(src)/$* $(src)/tests/$*.o $(src)/tests/$*.log)

diff --git a/examples/scripts/run_tests.py b/examples/scripts/run_tests.py
@@ -0,0 +1,86 @@
+#!/usr/bin/env python3
+import sys
+import pathlib
+import argparse
+import subprocess
+
+HERE = pathlib.Path(__file__).parent  # directory containing this script (examples/scripts)
+EXAMPLES_ROOT = HERE.parent  # examples/ — holds the example executables, tests/ and expected/
+CASEMATE_ROOT = EXAMPLES_ROOT.parent  # parent of examples/ (top of the checkout)
+CASEMATE_CHECK_ROCQ_ROOT = CASEMATE_ROOT / "src" / "casemate-check-rocq"  # cwd used for `dune exec`
+
+# Example names: the whitespace-separated stdout of `make list-build-objs` run in examples/.
+# --no-print-directory: when this script is launched from a make recipe, the nested make may
+# otherwise print "Entering/Leaving directory" lines on stdout, which would be parsed as names.
+EXAMPLES = subprocess.run(
+    ["make", "--no-print-directory", "list-build-objs"],
+    cwd=EXAMPLES_ROOT,
+    capture_output=True,
+    text=True, check=True,  # check=True: a failing make aborts the script at import time
+).stdout.split()
+
+
+def runmsg(prefix, s):  # one progress line on stderr: prefix left-justified to 8 columns, tabs, then s
+    sys.stderr.write(f'  {prefix:<8}\t\t\t{s}' + '\n')
+
+def check_expected(test_name):
+    """Run one example and compare the output it prints with its expected log.
+
+    The example's stdout is written to tests/<test_name>.log. Raises
+    subprocess.CalledProcessError if check_simulation.py exits non-zero.
+    """
+    example_exe = EXAMPLES_ROOT / test_name
+    out_path = (EXAMPLES_ROOT / "tests" / test_name).with_suffix(".log")
+    expected = (EXAMPLES_ROOT / "expected" / test_name).with_suffix(".log")
+
+    runmsg("RUN", test_name)
+    with open(out_path, "wb") as logf:
+        # check=False: a non-zero exit status from the example does not abort the run here.
+        # NOTE(review): the make recipe this replaces passed "-at" and discarded stderr — confirm.
+        subprocess.run([str(example_exe)], cwd=EXAMPLES_ROOT, stdout=logf, check=False)
+
+    runmsg("CHECK", test_name)
+    # sys.executable keeps the checker on the same interpreter that is running this script.
+    checker = [sys.executable, "./scripts/check_simulation.py", str(out_path), str(expected)]
+    subprocess.run(checker, cwd=EXAMPLES_ROOT, check=True)
+
+def check_rocq_trace(test_name):
+    """Run `dune exec casemate` on an example's expected log and check its exit status.
+
+    The expected status is 121 when the log's last line starts with "!" and
+    0 otherwise (including an empty log); a mismatch raises ValueError.
+    """
+    expected_log = (EXAMPLES_ROOT / "expected" / test_name).with_suffix(".log")
+
+    runmsg("CHECK", test_name)
+
+    # An empty or whitespace-only log has no last line; treat it as carrying no "!" marker.
+    lines = expected_log.read_text().strip().splitlines()
+    expected_status = 121 if lines and lines[-1].startswith("!") else 0
+
+    cmd = ["dune", "exec", "casemate", "--", str(expected_log)]
+    cp = subprocess.run(cmd, cwd=CASEMATE_CHECK_ROCQ_ROOT, check=False)
+    if cp.returncode != expected_status:
+        raise ValueError(f"Fail check on {test_name}")
+
+
+def main(argv):
+    """Parse argv, then run the selected check on every example that has an expected log."""
+    args = parser.parse_args(argv)
+    run_check = check_rocq_trace if args.rocq else check_expected
+    expected_dir = EXAMPLES_ROOT / "expected"
+
+    for example in EXAMPLES:
+        # Examples with no log under expected/ are skipped.
+        if not (expected_dir / example).with_suffix(".log").exists():
+            continue
+        run_check(example)
+
+
+parser = argparse.ArgumentParser()
+grp = parser.add_mutually_exclusive_group(required=True)  # exactly one mode flag must be passed
+grp.add_argument("--rocq", action="store_true")  # store_true already defaults to False
+grp.add_argument("--examples", action="store_true")  # main() takes this path whenever --rocq is unset
+
+if __name__ == "__main__":
+    raise SystemExit(main(sys.argv[1:]))