Skip to content
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .github/container/Dockerfile.axlearn
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
# syntax=docker/dockerfile:1-labs
ARG BASE_IMAGE=ghcr.io/nvidia/jax-mealkit:jax
ARG URLREF_AXLEARN=https://github.com/Steboss/axlearn.git#main
ARG URLREF_AXLEARN=https://github.com/Steboss/axlearn.git#sbosisio/tree_util
ARG SRC_PATH_AXLEARN=/opt/axlearn

###############################################################################
Expand Down
2 changes: 2 additions & 0 deletions .github/eks-workflow-files/axlearn/axlearn-fuji-model.yml
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,8 @@ spec:
mkdir -p ${TRAINER_DIR}
OUTPUT_LOG_FILE=${TRAINER_DIR}/output.log

export XLA_FLAGS="--xla_gpu_enable_command_buffer="

python3 /usr/local/bin/fuji-train-perf.py \
--module=text.gpt.c4_trainer \
--config=${CONFIG} \
Expand Down
Loading