lhez committed on
Commit
e6a209e
·
1 Parent(s): 9e85264

opencl: fix adreno compiler detection logic (llama/15029)

Browse files
ggml/src/ggml-opencl/ggml-opencl.cpp CHANGED
@@ -2046,8 +2046,8 @@ static ggml_backend_opencl_context * ggml_cl2_init(ggml_backend_dev_t dev) {
2046
 
2047
  backend_ctx->adreno_cl_compiler_version = get_adreno_cl_compiler_version(driver_version);
2048
  backend_ctx->has_vector_subgroup_broadcast =
2049
- backend_ctx->adreno_cl_compiler_version.major >= 47 ||
2050
- backend_ctx->adreno_cl_compiler_version.major == 17;
2051
  GGML_LOG_INFO("ggml_opencl: vector subgroup broadcast support: %s\n",
2052
  backend_ctx->has_vector_subgroup_broadcast ? "true" : "false");
2053
 
 
2046
 
2047
  backend_ctx->adreno_cl_compiler_version = get_adreno_cl_compiler_version(driver_version);
2048
  backend_ctx->has_vector_subgroup_broadcast =
2049
+ (backend_ctx->adreno_cl_compiler_version.type == E031 && backend_ctx->adreno_cl_compiler_version.major >= 47) ||
2050
+ (backend_ctx->adreno_cl_compiler_version.type == DX && backend_ctx->adreno_cl_compiler_version.major >= 17);
2051
  GGML_LOG_INFO("ggml_opencl: vector subgroup broadcast support: %s\n",
2052
  backend_ctx->has_vector_subgroup_broadcast ? "true" : "false");
2053