Skip to content

Commit 565202f

Browse files
committed
Fixes of Merge main into dev
Signed-off-by: oliver könig <[email protected]>
1 parent bfbf13f commit 565202f

File tree

5 files changed

+1099
-571
lines changed

5 files changed

+1099
-571
lines changed

.gitlab/stages/04.functional-tests.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -172,15 +172,15 @@ functional:run_dev_dgx_h100:
172172
functional:run_nemo:
173173
extends: [.functional_tests_rules]
174174
trigger:
175-
project: "dl/joc/nemo-ci"
175+
project: 'dl/joc/nemo-ci'
176176
branch: main-mirror
177177
strategy: depend
178178
inherit:
179179
variables: true
180180
variables:
181181
MCORE_MR_COMMIT: $CI_COMMIT_SHA
182-
TEST_NEMO2_MODULE: "True"
183-
ALLOW_FAILURE_DEPENDENCY: "True"
182+
TEST_NEMO2_MODULE: 'True'
183+
ALLOW_FAILURE_DEPENDENCY: 'True'
184184
TESTS_TO_RUN_ON_THIS_COMMIT: nightly
185185
rules:
186186
- if: $FUNCTIONAL_TEST == "yes"
@@ -217,7 +217,7 @@ functional:x_notify:
217217
- export RO_API_TOKEN=${PROJECT_ACCESS_TOKEN_MCORE}
218218
- export GITLAB_ENDPOINT
219219
- export CONTEXT=$FUNCTIONAL_TEST_SCOPE
220-
- export TAG_TEAM=$([[ "$CI_COMMIT_BRANCH" == "main" ]] && echo "1" || "0")
220+
# TAG_TEAM is "1" on the main and dev branches and "0" everywhere else; the fallback must `echo` the value, otherwise the shell tries to run `0` as a command and TAG_TEAM ends up empty.
- export TAG_TEAM=$([[ "$CI_COMMIT_BRANCH" == "main" || "$CI_COMMIT_BRANCH" == "dev" ]] && echo "1" || echo "0")
221221
- export TEAM_SLUG=$SLACK_ADMIN
222222
- |
223223
python tests/test_utils/python_scripts/notify.py \

examples/inference/gpt/gpt_static_inference.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -104,7 +104,7 @@ def get_inference_engine(args: Namespace, model: MegatronModule) -> StaticInfere
104104
text_generation_controller = TextGenerationController(
105105
inference_wrapped_model=inference_wrapped_model, tokenizer=tokenizer
106106
)
107-
return StaticInferenceEngine(text_generation_controller=text_generation_controller, legacy=args.use_legacy_static_engine)
107+
return StaticInferenceEngine(text_generation_controller=text_generation_controller, legacy=True)
108108

109109

110110
async def generate(

pyproject.toml

Lines changed: 6 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -69,7 +69,7 @@ mlm = ["flask-restful", "sentencepiece", "tiktoken", "wandb", "transformers"]
6969
dev = [
7070
"nvidia-modelopt[torch]>=0.33.0a0,<0.34.0; sys_platform != 'darwin'",
7171
"transformer-engine[pytorch]>=2.9.0a0,<2.10.0",
72-
"nvidia-resiliency-ext",
72+
"nvidia-resiliency-ext>=0.4.0a0,<0.5.0",
7373
"tqdm",
7474
"einops~=0.8",
7575
"tensorstore~=0.1,!=0.1.46,!=0.1.72",
@@ -91,20 +91,13 @@ dev = [
9191

9292
lts = [
9393
"tqdm",
94-
"einops~=0.8",
95-
"tensorstore~=0.1,!=0.1.46,!=0.1.72",
96-
"nvtx~=0.2",
97-
"multi-storage-client~=0.27",
98-
"opentelemetry-api~=1.33.1",
94+
"einops",
95+
"tensorstore!=0.1.46,!=0.1.72",
96+
"nvtx",
97+
"transformers",
98+
"zarr",
9999
"setuptools<80.0.0",
100-
"mamba-ssm~=2.2",
101-
"causal-conv1d~=1.5",
102-
"nv-grouped-gemm~=1.1",
103-
"megatron-energon[av_decode]~=6.0",
104-
"av<16.0.0", # At the time, av 16.0.0 is not compatible with Python 3.12
105-
"flashinfer-python",
106100
"wget",
107-
"onnxscript",
108101
]
109102

110103
[dependency-groups]

tests/unit_tests/inference/engines/test_dynamic_engine.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -102,7 +102,7 @@ class DynamicEngineTestConfig:
102102
model_provider: str = "gpt"
103103
return_log_probs: bool = False
104104
materialize_only_last_token_logits: bool = True
105-
skip_prompt_log_probs_for_dynamic_inference: bool = False
105+
skip_prompt_log_probs: bool = False
106106
cuda_graph_scope: List[str] = None
107107
force_build_cuda_graphs: bool = False
108108
# If False, do not build cuda graphs in the tests, even if

0 commit comments

Comments
 (0)