diff --git a/test/cpp_extensions/test/dispatch_allreduce.py b/test/cpp_extensions/test/dispatch_allreduce.py index 0502401db53799e5b5690d2af75b13c959188827..9a1578ce3b5a5e849aced7919e7418971c53845c 100644 --- a/test/cpp_extensions/test/dispatch_allreduce.py +++ b/test/cpp_extensions/test/dispatch_allreduce.py @@ -3,6 +3,7 @@ import os os.environ["TASK_QUEUE_ENABLE"] = "1" os.environ["ASCEND_LAUNCH_BLOCKING"] = "0" os.environ["ASCEND_SLOG_PRINT_TO_STDOUT"] = "1" +os.environ["ASCEND_GLOBAL_LOG_LEVEL"] = "1" os.environ["HCCL_EXEC_TIMEOUT"] = "160" import torch diff --git a/torch_npu/csrc/distributed/ProcessGroupHCCL.cpp b/torch_npu/csrc/distributed/ProcessGroupHCCL.cpp index 61c018dda393e895b421d2811610e428989ec28a..e50d2c78dd74384377850f0da2421fe54c83a21b 100644 --- a/torch_npu/csrc/distributed/ProcessGroupHCCL.cpp +++ b/torch_npu/csrc/distributed/ProcessGroupHCCL.cpp @@ -452,11 +452,11 @@ void ProcessGroupHCCL::WorkHCCL::checkDispatch() auto timeElapsed = std::chrono::duration_cast(currentTimepoint - workStartTime_); if (timeElapsed > dispatchTimeout_) { std::string repo_info = c10_npu::getRepoInfo(); - ASCEND_LOGE("Process group work %s, seq_num %u dispatch timeout. %s", opTypeToString(opType_).c_str(), seq_, repo_info.c_str()); + ASCEND_LOGI("Process group work %s, seq_num %u dispatch timeout. %s", opTypeToString(opType_).c_str(), seq_, repo_info.c_str()); is_reported = true; } } else if (*is_dispatched && is_reported) { - ASCEND_LOGE("Process group work %s, seq_num %u dispatch sucess. This error log can be ignored.", opTypeToString(opType_).c_str(), seq_); + ASCEND_LOGI("Process group work %s, seq_num %u dispatch sucess. This error log can be ignored.", opTypeToString(opType_).c_str(), seq_); is_reported = false; } } @@ -926,7 +926,7 @@ void ProcessGroupHCCL::workCleanupLoop() // Clean up completed work if (work.isCompleted()) { if (*(work.is_dispatched) && work.is_reported) { - ASCEND_LOGE("Process group work %s, seq_num %u dispatch sucess. This error log can be ignored.", opTypeToString(work.opType_).c_str(), work.seq_); + ASCEND_LOGI("Process group work %s, seq_num %u dispatch sucess. This error log can be ignored.", opTypeToString(work.opType_).c_str(), work.seq_); work.is_reported = false; } it = workMetaList_.erase(it);