whisper.cpp

Running

yeahdongcn committed on Aug 12

Commit

4168dda

1 Parent(s): db87c9d

musa: fix failures in test-backend-ops for mul_mat_id op (llama/15236)

* musa: fix failures in test-backend-ops for mul_mat_id op

Signed-off-by: Xiaodong Ye <[email protected]>

* Address review comments

Signed-off-by: Xiaodong Ye <[email protected]>

---------

Signed-off-by: Xiaodong Ye <[email protected]>

Files changed (1) hide show

ggml/src/ggml-cuda/common.cuh +2 -2

ggml/src/ggml-cuda/common.cuh CHANGED Viewed

@@ -312,11 +312,11 @@ static bool turing_mma_available(const int cc) {
 }
 static bool ampere_mma_available(const int cc) {
-    return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 static bool cp_async_available(const int cc) {
-    return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 static constexpr __device__ int ggml_cuda_get_physical_warp_size() {

 }
 static bool ampere_mma_available(const int cc) {
+    return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 static bool cp_async_available(const int cc) {
+    return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 static constexpr __device__ int ggml_cuda_get_physical_warp_size() {