|
1 | 1 | /*
|
2 |
| - * MIT license |
3 |
| - * Copyright (C) 2024 GGML Authors |
4 |
| - * SPDX-License-Identifier: MIT |
5 |
| - * |
6 | 2 | * this is the implementation of the ggml QNN (Qualcomm Neural Network, aka AI Engine Direct) backend
|
7 | 3 | *
|
8 | 4 | * status:
|
@@ -959,7 +955,7 @@ static int free_qnn_tensor(Qnn_Tensor_t & tensor) {
|
959 | 955 | QNN_LOG_INFO("it should not happen, pls check");
|
960 | 956 | } else {
|
961 | 957 | //TODO:why crash in here? why pointer changed with mul_mat?
|
962 |
| - //memory leak after comment above line |
| 958 | + //memory leak after commenting out the line below |
963 | 959 | //free(QNN_TENSOR_GET_DIMENSIONS(tensor));
|
964 | 960 | }
|
965 | 961 |
|
@@ -1464,7 +1460,7 @@ static void ggml_qnn_log_internal(ggml_log_level level, const char * file, const
|
1464 | 1460 | #if (defined __ANDROID__) || (defined ANDROID)
|
1465 | 1461 | __android_log_print(level, "llamacpp", "%s", s_ggml_qnn_log_internal_buf);
|
1466 | 1462 | #else
|
1467 |
| - printf("%s", buffer); //Qualcomm's QNN could running on Window over ARM |
| 1463 | + printf("%s", buffer); //Qualcomm's QNN can also run on Windows on ARM (aka WoA) |
1468 | 1464 | #endif
|
1469 | 1465 | }
|
1470 | 1466 | va_end(args);
|
@@ -2108,11 +2104,11 @@ int qnn_instance::load_system() {
|
2108 | 2104 |
|
2109 | 2105 | _system_lib_handle = dlopen(system_lib_path.c_str(), RTLD_NOW | RTLD_LOCAL);
|
2110 | 2106 | if (nullptr == _system_lib_handle) {
|
2111 |
| - QNN_LOG_WARN("can not pen QNN library %s, error: %s\n", system_lib_path.c_str(), dlerror()); |
| 2107 | + QNN_LOG_WARN("can not open QNN library %s, error: %s\n", system_lib_path.c_str(), dlerror()); |
2112 | 2108 | return 1;
|
2113 | 2109 | }
|
2114 | 2110 |
|
2115 |
| - auto *get_providers = reinterpret_cast<_pfn_QnnSystemInterface_getProviders *>(dlsym( |
| 2111 | + auto * get_providers = reinterpret_cast<_pfn_QnnSystemInterface_getProviders *>(dlsym( |
2116 | 2112 | _system_lib_handle, "QnnSystemInterface_getProviders"));
|
2117 | 2113 | if (nullptr == get_providers) {
|
2118 | 2114 | QNN_LOG_WARN("can not load QNN symbol QnnSystemInterface_getProviders: %s\n", dlerror());
|
@@ -3605,7 +3601,6 @@ bool ggml_qnn_compute_forward(struct ggml_compute_params * params, struct ggml_t
|
3605 | 3601 | }
|
3606 | 3602 |
|
3607 | 3603 |
|
3608 |
| - //ok, real show time in Qualcomm's QNN internal |
3609 | 3604 | if (nullptr != func)
|
3610 | 3605 | func(tensor->src[0], tensor->src[1], tensor);
|
3611 | 3606 | if (nullptr != func_common)
|
@@ -3845,7 +3840,7 @@ static size_t ggml_backend_qnn_buffer_type_get_alignment(ggml_backend_buffer_typ
|
3845 | 3840 | static size_t ggml_backend_qnn_buffer_type_get_max_size(ggml_backend_buffer_type_t buft) {
|
3846 | 3841 | GGML_UNUSED(buft);
|
3847 | 3842 |
|
3848 |
| - return (38 * 1024 * 1024); |
| 3843 | + return (96 * 1024 * 1024); |
3849 | 3844 | }
|
3850 | 3845 |
|
3851 | 3846 |
|
|
0 commit comments