Skip to content

Commit 288e77e

Browse files
authored
Merge pull request #3 from eval-protocol/codex/trim-down-deepcoder-tests-for-performance
Trim deepcoder tests
2 parents bacce91 + c35e426 commit 288e77e

File tree

1 file changed: +6 -2 lines changed

tests/test_deepcoder_reward.py

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -83,6 +83,7 @@ def test_python_one_test_fails_local(self):
 83   83   details = json.loads(result.metrics["test_results"].reason)
 84   84   self.assertFalse(details[0].get("passed")) # First test case (5 -> expected 6, actual 7) should fail
 85   85
      86 + @unittest.skip("Trimmed slow test")
 86   87   def test_python_syntax_error_local(self):
 87   88   """Test Python code with a syntax error locally."""
 88   89   if not self.SAMPLES:
@@ -108,6 +109,7 @@ def test_python_syntax_error_local(self):
108  109   details = json.loads(result.metrics["test_results"].reason)
109  110   self.assertTrue(any("error" in tc for tc in details))
110  111
     112 + @unittest.skip("Trimmed slow test")
111  113   def test_python_timeout_local(self):
112  114   """Test Python code that times out locally."""
113  115   if not self.SAMPLES:
@@ -156,6 +158,7 @@ def test_no_code_block(self):
156  158   if "error" in result.metrics:
157  159   self.assertIn("No python code block found", result.metrics["error"].reason)
158  160
     161 + @unittest.skip("Trimmed slow test")
159  162   def test_javascript_all_tests_pass_local(self):
160  163   """Test JavaScript code that passes all test cases locally."""
161  164   js_test_cases = [
@@ -179,6 +182,7 @@ def test_javascript_all_tests_pass_local(self):
179  182   self.assertIsInstance(result, EvaluateResult)
180  183   self.assertEqual(result.score, 1.0)
181  184
     185 + @unittest.skip("Trimmed slow test")
182  186   def test_javascript_one_test_fails_local(self):
183  187   """Test JavaScript code where one test case fails locally."""
184  188   js_test_cases = [
@@ -202,7 +206,7 @@ def test_javascript_one_test_fails_local(self):
202  206   self.assertIsInstance(result, EvaluateResult)
203  207   self.assertEqual(result.score, 0.0)
204  208
205      - @unittest.skipUnless(E2B_AVAILABLE, "E2B_API_KEY not set, skipping E2B tests.")
     209 + @unittest.skip("Trimmed slow test")
206  210   def test_python_all_tests_pass_e2b(self):
207  211   """Test Python code that passes all test cases in E2B."""
208  212   if not self.SAMPLES:
@@ -262,7 +266,7 @@ def test_python_all_tests_pass_e2b(self):
262  266   else:
263  267   raise
264  268
265      - @unittest.skipUnless(E2B_AVAILABLE, "E2B_API_KEY not set, skipping E2B tests.")
     269 + @unittest.skip("Trimmed slow test")
266  270   def test_python_one_test_fails_e2b(self):
267  271   """Test Python code where one test case fails in E2B."""
268  272   if not self.SAMPLES:

0 commit comments

Comments (0)