Skip to content
This repository has been archived by the owner on Nov 25, 2024. It is now read-only.

[Bugfix] Sync stream for scatter_op #235

Merged
merged 3 commits into from
Nov 21, 2024
Merged
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions cpp/src/wholememory_ops/scatter_op_impl_mapped.cu
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@
#include <wholememory/env_func_ptrs.h>
#include <wholememory/wholememory.h>

#include "cuda_macros.hpp"
#include "wholememory_ops/functions/gather_scatter_func.h"

namespace wholememory_ops {
Expand All @@ -41,6 +42,7 @@ wholememory_error_code_t wholememory_scatter_mapped(
wholememory_desc,
stream,
scatter_sms);
WM_CUDA_CHECK(cudaStreamSynchronize(stream));
}

} // namespace wholememory_ops