blob: abba1cd230266e35fe11bd9b086857455210cf4f (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
|
This fixes a problem in the upstream code. The call to x_buffer.CopyToAsync in
src/routines/level3/xtrsm.cpp passes an extra trailing argument (event_) that
must be removed; otherwise the build fails when CUDA is enabled.
--- CLBlast/src/routines/level3/xtrsm.cpp 2022-05-21 08:44:13.815816361 -0600
+++ CLBlast_fixed/src/routines/level3/xtrsm.cpp 2022-05-21 08:28:06.756355738 -0600
@@ -246,7 +246,7 @@
}
// Retrieves the results
- x_buffer.CopyToAsync(queue_, b_size, b_buffer, event_);
+ x_buffer.CopyToAsync(queue_, b_size, b_buffer);
}
// =================================================================================================
|