File tree Expand file tree Collapse file tree 1 file changed +1
-5
lines changed Expand file tree Collapse file tree 1 file changed +1
-5
lines changed Original file line number Diff line number Diff line change @@ -34,7 +34,7 @@ usage() {
3434 1. test-maxtext.sh -b 2 --model-name=gpt3-52k
3535 2. test-maxtext.sh -b 2 --model-name=gemma-2b --dtype=fp8
3636 3. test-maxtext.sh -n 1 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --steps=10 --fsdp=8 --output train_output --multiprocess
37- 4. test-maxtext.sh -n 1 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --steps=10 --fsdp=8 --output train_output --multiprocess -a " scan_layers=false max_target_length=4096 use_iota_embed=true logits_dot_in_fp32=false"
37+ 4. test-maxtext.sh -n 1 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --steps=10 --fsdp=8 --output train_output --multiprocess -a ' scan_layers=false max_target_length=4096 use_iota_embed=true logits_dot_in_fp32=false'
3838 5. test-maxtext.sh -n 1 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --dtype=fp8 --steps=10 --fsdp=8 --output train_output --multiprocess
3939 6. test-maxtext.sh -n 8 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --steps=10 --output train_output --fsdp=8 --data-parallel=8 --multiprocess
4040 7. test-maxtext.sh -n 8 -b 2 --model-name=llama2-7b --attn-type=cudnn_flash_te --remat-policy=minimal_flash --steps=10 --output train_output --fsdp=4 --tensor-parallel=2 --data-parallel=8 --multiprocess
@@ -107,10 +107,6 @@ while [ : ]; do
107107 DTYPE=" $2 "
108108 shift 2
109109 ;;
110- --enable-te)
111- ENABLE_TE=1
112- shift 1
113- ;;
114110 -s | --steps)
115111 STEPS=" $2 "
116112 shift 2
You can’t perform that action at this time.
0 commit comments