Spaces:
Running
Running
Commit
·
4168dda
1
Parent(s):
db87c9d
musa: fix failures in test-backend-ops for mul_mat_id op (llama/15236)
Browse files
* musa: fix failures in test-backend-ops for mul_mat_id op
Signed-off-by: Xiaodong Ye <[email protected]>
* Address review comments
Signed-off-by: Xiaodong Ye <[email protected]>
---------
Signed-off-by: Xiaodong Ye <[email protected]>
ggml/src/ggml-cuda/common.cuh
CHANGED
|
@@ -312,11 +312,11 @@ static bool turing_mma_available(const int cc) {
|
|
| 312 |
}
|
| 313 |
|
| 314 |
static bool ampere_mma_available(const int cc) {
|
| 315 |
-
return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
|
| 316 |
}
|
| 317 |
|
| 318 |
static bool cp_async_available(const int cc) {
|
| 319 |
-
return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
|
| 320 |
}
|
| 321 |
|
| 322 |
static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
|
|
|
|
| 312 |
}
|
| 313 |
|
| 314 |
static bool ampere_mma_available(const int cc) {
|
| 315 |
+
return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
|
| 316 |
}
|
| 317 |
|
| 318 |
static bool cp_async_available(const int cc) {
|
| 319 |
+
return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
|
| 320 |
}
|
| 321 |
|
| 322 |
static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
|