Skip to content

Commit

Permalink
Fix CUDA async stream. (dmlc#8380)
Browse files: browse the repository at this point in the history
  • Loading branch information
trivialfis committed Oct 26, 2022
1 parent 153d995 commit c4ab762
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions src/objective/adaptive.cu
Expand Up @@ -67,6 +67,10 @@ void EncodeTreeLeafDevice(Context const* ctx, common::Span<bst_node_t const> pos
auto pinned = pinned_pool.GetSpan<char>(sizeof(size_t) + sizeof(bst_node_t));
dh::CUDAStream copy_stream;
size_t* h_num_runs = reinterpret_cast<size_t*>(pinned.subspan(0, sizeof(size_t)).data());

dh::CUDAEvent e;
e.Record(dh::DefaultStream());
copy_stream.View().Wait(e);
// flag for whether there's ignored position
bst_node_t* h_first_unique =
reinterpret_cast<bst_node_t*>(pinned.subspan(sizeof(size_t), sizeof(bst_node_t)).data());
Expand Down

0 comments on commit c4ab762

Please sign in to comment.