From 0822f571618a49c582106ff7cd2aadc01fe07640 Mon Sep 17 00:00:00 2001 From: Aravind Gopalakrishnan Date: Wed, 20 Dec 2017 14:58:49 -0800 Subject: [PATCH] MTL OFI: Allow retries in MTL progress for interrupted syscalls This fixes a regression in the sockets provider, which could return -EINTR from fi_cq_read() when a syscall is interrupted. The error value is currently interpreted as a fatal condition. Relax the rule so that we can retry the fi_cq_read() operation. Signed-off-by: Aravind Gopalakrishnan (cherry picked from commit fb68726baf0aa482e53ffb1f4e4490949c7e0e05) --- ompi/mca/mtl/ofi/mtl_ofi.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ompi/mca/mtl/ofi/mtl_ofi.h b/ompi/mca/mtl/ofi/mtl_ofi.h index a20c9d4a5fb..263c39ceac5 100644 --- a/ompi/mca/mtl/ofi/mtl_ofi.h +++ b/ompi/mca/mtl/ofi/mtl_ofi.h @@ -116,7 +116,7 @@ ompi_mtl_ofi_progress(void) exit(1); } } else { - if (ret == -FI_EAGAIN) { + if (ret == -FI_EAGAIN || ret == -EINTR) { break; } else { opal_output(0, "%s:%d: Error returned from fi_cq_read: %s(%zd).\n"