Skip to content

Commit 855b40e

Browse files
authored
Merge pull request #454 from malay-nagda/340b_duplicate_params
remove duplicate 340b params
2 parents 5730fac + 10120db commit 855b40e

File tree

1 file changed

+0
-2
lines changed

1 file changed

+0
-2
lines changed

launcher_scripts/conf/training/nemotron/nemotron_340b.yaml

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -135,7 +135,6 @@ model:
135 135
defer_embedding_wgrad_compute: True
136 136
wgrad_deferral_limit: 22
137 137
cross_entropy_loss_fusion: True
138 -
enable_vboost: True
139 138
ub_tp_comm_overlap: True
140 139
apply_rope_fusion: True
141 140
deteministic_mode: False
@@ -161,7 +160,6 @@ model:
161 160
fp8_amax_history_len: 1024 # Number of steps for which amax history is recorded per tensor
162 161
fp8_amax_compute_algo: max # 'most_recent' or 'max'. Algorithm for computing amax from history
163 162
fp8_wgrad: True
164 -
ub_tp_comm_overlap: False
165 163

166 164
optim:
167 165
name: mcore_distributed_optim

0 commit comments

Comments
 (0)