@@ -178,7 +178,7 @@ def teardown_method(self, method):
178178 # ((2, 1), 2, 2),
179179 ],
180180 )
181- @pytest .mark .skip ( reason = "Tests are flaky and need to be debugged" )
181+ @pytest .mark .flaky
182182 def test_dp_sharding (self , tmp_path_dist_ckpt , tp_pp , src_dp , dest_dp , use_fpsl , initialize_fn ):
183183 src_world_size = tp_pp [0 ] * tp_pp [1 ] * src_dp
184184 dest_world_size = tp_pp [0 ] * tp_pp [1 ] * dest_dp
@@ -256,7 +256,7 @@ def test_dp_sharding(self, tmp_path_dist_ckpt, tp_pp, src_dp, dest_dp, use_fpsl,
256256 ('src_tp_pp' , 'dest_tp_pp' , 'use_glu' ),
257257 [((2 , 2 ), (2 , 4 ), False ), ((1 , 8 ), (4 , 1 ), True ), ((2 , 4 ), (4 , 2 ), False )],
258258 )
259- @pytest .mark .skip ( reason = "Tests are flaky and need to be debugged" )
259+ @pytest .mark .flaky
260260 def test_finetune_doesnt_load_optimizer (
261261 self , tmp_path_dist_ckpt , src_tp_pp , dest_tp_pp , use_glu
262262 ):
@@ -329,7 +329,7 @@ def test_finetune_doesnt_load_optimizer(
329329 assert not diffs [0 ] and not diffs [1 ] and diffs [2 ]
330330 assert not any (diff (optimizer .state_dict (), optim_unloaded_state_dict ))
331331
332- @pytest .mark .skip ( reason = "Tests are flaky and need to be debugged" )
332+ @pytest .mark .flaky
333333 def test_can_load_deprecated_bucket_space_format (self , tmp_path_dist_ckpt ):
334334 # sync=True to make sure other ranks wait for rank 0 to finish creating directory.
335335 tp = 4
@@ -398,7 +398,7 @@ def teardown_method(self, method):
398398 @pytest .mark .parametrize (
399399 ('src_tp_pp' , 'dest_tp_pp' ), [((2 , 4 ), (2 , 4 )), ((2 , 4 ), (4 , 2 )), ((8 , 1 ), (1 , 2 ))]
400400 )
401- @pytest .mark .skip ( reason = "Tests are flaky and need to be debugged" )
401+ @pytest .mark .flaky
402402 def test_fp32_optimizer_resharding (self , tmp_path_dist_ckpt , src_tp_pp , dest_tp_pp ):
403403 # sync=True to make sure other ranks wait for rank 0 to finish creating directory.
404404 Utils .initialize_model_parallel (* src_tp_pp )
@@ -465,7 +465,7 @@ def teardown_method(self, method):
465465 ('src_tp_pp' , 'dest_tp_pp' ),
466466 [((2 , 4 ), (2 , 4 )), ((2 , 4 ), (2 , 2 )), ((2 , 4 ), (4 , 2 )), ((8 , 1 ), (1 , 2 ))],
467467 )
468- @pytest .mark .skip ( reason = "Tests are flaky and need to be debugged" )
468+ @pytest .mark .flaky
469469 def test_optimizer_resharding (
470470 self , tmp_path_dist_ckpt , src_tp_pp , dest_tp_pp , use_dist_opt , bf16
471471 ):
0 commit comments