Skip to content

Commit 950c0e2

Browse files
r-barnes authored and
facebook-github-bot committed
Use emplace_back for more speed
Summary: Prevents a copy. Reviewed By: rohan-varma. Differential Revision: D37418718. fbshipit-source-id: 9475a5817cc461066a2b462eea1242fdee175042
1 parent 96cec6b commit 950c0e2

File tree

2 files changed

+3
-4
lines changed

2 files changed

+3
-4
lines changed

gloo/cuda_collectives_nccl.h

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -23,12 +23,11 @@ std::vector<nccl::NCCLElement<T> > toDeviceElements(
2323
std::vector<nccl::NCCLElement<T> > elements;
2424
elements.reserve(ptrs.size());
2525
for (auto i = 0; i < ptrs.size(); i++) {
26-
elements.push_back(
27-
nccl::NCCLElement<T>(
26+
elements.emplace_back(
2827
ptrs[i].range(offset, count),
2928
streams[i],
3029
ptrs[i].range(offset, count),
31-
streams[i]));
30+
streams[i]);
3231
}
3332
return elements;
3433
}

gloo/cuda_private.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -148,7 +148,7 @@ class CudaDeviceStreams {
148148
const int numDevices = getDeviceCount();
149149
streams_.reserve(numDevices);
150150
for (auto i = 0; i < numDevices; i++) {
151-
streams_.push_back(CudaStream(i));
151+
streams_.emplace_back(i);
152152
}
153153
}
154154
cudaStream_t operator[](const int i) {

0 commit comments

Comments
 (0)