yeahdongcn committed on
Commit
4168dda
·
1 Parent(s): db87c9d

musa: fix failures in test-backend-ops for mul_mat_id op (llama/15236)

Browse files

* musa: fix failures in test-backend-ops for mul_mat_id op

Signed-off-by: Xiaodong Ye <[email protected]>

* Address review comments

Signed-off-by: Xiaodong Ye <[email protected]>

---------

Signed-off-by: Xiaodong Ye <[email protected]>

Files changed (1)
  1. ggml/src/ggml-cuda/common.cuh +2 -2
ggml/src/ggml-cuda/common.cuh CHANGED
@@ -312,11 +312,11 @@ static bool turing_mma_available(const int cc) {
312
  }
313
 
314
  static bool ampere_mma_available(const int cc) {
315
- return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
316
  }
317
 
318
  static bool cp_async_available(const int cc) {
319
- return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
320
  }
321
 
322
  static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
 
312
  }
313
 
314
  static bool ampere_mma_available(const int cc) {
315
+ return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
316
  }
317
 
318
  static bool cp_async_available(const int cc) {
319
+ return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
320
  }
321
 
322
  static constexpr __device__ int ggml_cuda_get_physical_warp_size() {