summary | refs | log | tree | commit | diff
path: root/samples/sgemm_cuda.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'samples/sgemm_cuda.cpp')
-rw-r--r-- samples/sgemm_cuda.cpp 4
1 files changed, 2 insertions, 2 deletions
diff --git a/samples/sgemm_cuda.cpp b/samples/sgemm_cuda.cpp
index f1138316..8e4397df 100644
--- a/samples/sgemm_cuda.cpp
+++ b/samples/sgemm_cuda.cpp
@@ -69,8 +69,8 @@ int main() {
cuMemAlloc(&device_b, host_b.size()*sizeof(float));
cuMemAlloc(&device_c, host_c.size()*sizeof(float));
cuMemcpyHtoDAsync(device_a, host_a.data(), host_a.size()*sizeof(float), stream);
- cuMemcpyHtoDAsync(device_b, host_c.data(), host_b.size()*sizeof(float), stream);
- cuMemcpyHtoDAsync(device_c, host_b.data(), host_c.size()*sizeof(float), stream);
+ cuMemcpyHtoDAsync(device_b, host_b.data(), host_b.size()*sizeof(float), stream);
+ cuMemcpyHtoDAsync(device_c, host_c.data(), host_c.size()*sizeof(float), stream);
// Start the timer
auto start_time = std::chrono::steady_clock::now();