Skip to content

Commit

Permalink
Post gemm after comm
Browse files (browse the repository at this point in the history)
  • Loading branch information
Nicholas Sarkauskas committed Dec 10, 2024
1 parent 08073ef commit c482ec9
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion tests/cpp/test_multidevice_overlap.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1084,13 +1084,13 @@ TEST_F(
// send & matmul current index
std::vector<at::Tensor> src = {ta_j_curr_slice};
std::vector<at::Tensor> dst = {ta_j_next_slice};
- torch::matmul_out(tc_j, ta_j_curr_slice, tb_unsharded_);
if (j < number_of_steps_per_ring_ - 1) {
world_communicator_->startCoalescing();
world_communicator_->send(src, send_rank, 0);
world_communicator_->recv(dst, recv_rank, 0);
comms_req = world_communicator_->endCoalescing();
}
+ torch::matmul_out(tc_j, ta_j_curr_slice, tb_unsharded_);
}
}
synchronizeStreams(streams);
Expand Down

0 comments on commit c482ec9

Please sign in to comment.