diff --git a/pretrain/scripts/v4-8b-phase1/base/params.sh b/pretrain/scripts/v4-8b-phase1/base/params.sh index 57a307d..6b28681 100644 --- a/pretrain/scripts/v4-8b-phase1/base/params.sh +++ b/pretrain/scripts/v4-8b-phase1/base/params.sh @@ -112,4 +112,5 @@ ALL_PARAMS+=( # NOTE(odashi): # https://docs.nvidia.com/nemo-framework/user-guide/latest/performance/performance-guide.html#communication-overlaps-and-tuning export NVTE_FWD_LAYERNORM_SM_MARGIN=16 -export NVTE_BWD_LAYERNORM_SM_MARGIN=16 \ No newline at end of file +export NVTE_BWD_LAYERNORM_SM_MARGIN=16 +