We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cff7e3e · commit 3dfebb3 · Copy full SHA for 3dfebb3
tests/pipeline/rlvr_pipeline_meg_critic.py
@@ -347,7 +347,11 @@ def run(self):
347
actor_infer_response_timer = _Timer(window_size=5)
348
actor_train_timer = _Timer(window_size=5)
349
350
- for global_step in range(self.pipeline_config.max_steps):
+ # Modified for testing: Run only 5 steps
351
+ test_max_steps = min(5, self.pipeline_config.max_steps)
352
+ logger.info(f"TEST MODE: Running only {test_max_steps} steps for critic comparison")
353
+
354
+ for global_step in range(test_max_steps):
355
if global_step <= self.state.step:
356
global_step += 1
357
continue
0 commit comments