From 2a632df681125923c4b9e8d4426df76c0eb8db69 Mon Sep 17 00:00:00 2001 From: Devendar Bureddy Date: Wed, 16 Oct 2024 20:14:09 +0300 Subject: [PATCH] Fix ece check --- src/ib_plugin.c | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/ib_plugin.c b/src/ib_plugin.c index e6d6db2..edccd51 100644 --- a/src/ib_plugin.c +++ b/src/ib_plugin.c @@ -762,6 +762,7 @@ ncclResult_t ncclIbConnect(int dev, void* opaqueHandle, void** sendComm, ncclNet } struct ncclIbConnectionMetadata meta; + memset(&meta, 0, sizeof(meta)); meta.ndevs = comm->base.ndevs; // Alternate QPs between devices @@ -1003,6 +1004,7 @@ ncclResult_t ncclIbAccept(void* listenComm, void** recvComm, ncclNetDeviceHandl // Metadata to send back to requestor (sender) struct ncclIbConnectionMetadata meta; + memset(&meta, 0, sizeof(meta)); for (int i = 0; i < rComm->base.ndevs; i++) { rCommDev = rComm->devs + i; ibDevN = mergedDev->devs[i]; @@ -1050,6 +1052,8 @@ ncclResult_t ncclIbAccept(void* listenComm, void** recvComm, ncclNetDeviceHandl // Store this in our own qpInfo for returning to the requestor if (meta.qpInfo[q].ece_supported) NCCLCHECKGOTO(wrap_ibv_query_ece(qp->qp, &meta.qpInfo[q].ece, &meta.qpInfo[q].ece_supported), ret, fail); + } else { + meta.qpInfo[q].ece_supported = 0; } bool override_tc = (q == 0) ? true : false; NCCLCHECKGOTO(ncclIbRtrQp(qp->qp, &rCommDev->base.gidInfo, remMeta.qpInfo[q].qpn, remDevInfo, override_tc), ret, fail);