Add timeout for distributed tests. (#10315)

This commit is contained in:
Jiaming Yuan
2024-05-23 11:11:49 +08:00
committed by GitHub
parent b8a7773736
commit d5fcbee44b
2 changed files with 14 additions and 8 deletions

View File

@@ -191,7 +191,7 @@ Result BroadcastAllgatherV(NCCLComm const* comm, common::Span<std::int8_t const>
for (std::int32_t r = 0; r < comm->World(); ++r) {
auto as_bytes = sizes[r];
auto rc = stub->Broadcast(data.data(), recv.subspan(offset, as_bytes).data(), as_bytes,
- ncclInt8, r, comm->Handle(), dh::DefaultStream());
+ ncclInt8, r, comm->Handle(), comm->Stream());
if (!rc.OK()) {
return rc;
}