Bugfix gpu output data copy
This commit is contained in:
@@ -66,6 +66,8 @@ struct GPUBackend::Impl {
|
|||||||
launch_sincosf_kernel(d_x, d_s, d_c, n);
|
launch_sincosf_kernel(d_x, d_s, d_c, n);
|
||||||
cudaMemcpy(h_s, d_s, bytes, cudaMemcpyDeviceToHost);
|
cudaMemcpy(h_s, d_s, bytes, cudaMemcpyDeviceToHost);
|
||||||
cudaMemcpy(h_c, d_c, bytes, cudaMemcpyDeviceToHost);
|
cudaMemcpy(h_c, d_c, bytes, cudaMemcpyDeviceToHost);
|
||||||
|
std::memcpy(s, h_s, bytes);
|
||||||
|
std::memcpy(c, h_c, bytes);
|
||||||
}
|
}
|
||||||
|
|
||||||
float *h_x = nullptr;
|
float *h_x = nullptr;
|
||||||
|
|||||||
Reference in New Issue
Block a user