Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions aiter/dist/device_communicators/communicator_cuda.py
Original file line number Diff line number Diff line change
Expand Up @@ -149,6 +149,8 @@ def all_reduce(
qr_comm is not None
and not qr_comm.disabled
and qr_comm.should_quick_allreduce(input_)
and (input_.nelement() * input_.element_size()) >= 4*1024*1024 # input shape should be such that quick reduce will show benefits.
# Input size threshold is estimated at 2 * max concurrency for now; subject to change if performance issues arise.
):
out = qr_comm.quick_all_reduce(input_)
assert out is not None
Expand Down