Skip to content

Commit 7fe863f

Browse files
committed
Merge branch 'hn-tokenizer-imports' into 'main'
Fix some more imports from the refactor. See merge request ADLR/megatron-lm!1325.
2 parents e6fb9b1 + eba39bb commit 7fe863f

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

megatron/training/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@
1414
from .global_vars import get_adlr_autoresume
1515
from .global_vars import get_timers
1616
from .initialize import initialize_megatron
17-
from .training import pretrain, get_model
17+
from .training import pretrain, get_model, get_train_valid_test_num_samples
1818

1919
from .utils import (print_rank_0,
2020
is_last_rank,

tools/retro/preprocess_data.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@
3636
get_config_path,
3737
get_gpt_data_dir,
3838
)
39-
from megatron.tokenizer.tokenizer import (
39+
from megatron.training.tokenizer.tokenizer import (
4040
_BertWordPieceTokenizer,
4141
_GPT2BPETokenizer,
4242
_GPTSentencePieceTokenizer,

0 commit comments

Comments
 (0)