From 42d164e558555669fd96ba9a56e9afb6c1bc1ee1 Mon Sep 17 00:00:00 2001 From: Hemil Desai Date: Mon, 25 Nov 2024 02:25:51 -0800 Subject: [PATCH] Fix environment variables in torchrun executor (#11363) Signed-off-by: Hemil Desai Co-authored-by: Marc Romeyn --- nemo/collections/llm/recipes/run/executor.py | 4 ---- 1 file changed, 4 deletions(-) diff --git a/nemo/collections/llm/recipes/run/executor.py b/nemo/collections/llm/recipes/run/executor.py index 305fa6b0a3c7..fe14a4f55bd2 100644 --- a/nemo/collections/llm/recipes/run/executor.py +++ b/nemo/collections/llm/recipes/run/executor.py @@ -18,11 +18,7 @@ def torchrun(devices: int = 8) -> run.Config[run.LocalExecutor]: """Local executor using torchrun.""" env_vars = { - "TRANSFORMERS_OFFLINE": "1", "TORCH_NCCL_AVOID_RECORD_STREAMS": "1", - "NCCL_NVLS_ENABLE": "0", - "NVTE_DP_AMAX_REDUCE_INTERVAL": "0", - "NVTE_ASYNC_AMAX_REDUCTION": "1", } executor = run.Config(