about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Georgi Gerganov <ggerganov@gmail.com>, 2023-04-22 16:31:56 +0300
committer: Georgi Gerganov <ggerganov@gmail.com>, 2023-04-22 16:32:07 +0300
commit: 0e018fe008eacebdbcfa2d61b6c988c245c961cd (patch)
tree: 5a2051e9896f120527484732b9a9a14f0107f547
parent: 857308d1e8fb6afe33edb481d48560eee8fe7d7c (diff)
ggml : fix Q4_3 cuBLAS
-rw-r--r-- CMakeLists.txt 2
-rw-r--r-- ggml.c 3
2 files changed, 5 insertions, 0 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 2d4e30e..11ebe9e 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -312,6 +312,7 @@ add_library(ggml OBJECT
target_include_directories(ggml PUBLIC .)
target_compile_features(ggml PUBLIC c_std_11) # don't bump
target_link_libraries(ggml PUBLIC Threads::Threads ${LLAMA_EXTRA_LIBS})
+
if (BUILD_SHARED_LIBS)
set_target_properties(ggml PROPERTIES POSITION_INDEPENDENT_CODE ON)
endif()
@@ -324,6 +325,7 @@ add_library(llama
target_include_directories(llama PUBLIC .)
target_compile_features(llama PUBLIC cxx_std_11) # don't bump
target_link_libraries(llama PRIVATE ggml ${LLAMA_EXTRA_LIBS})
+
if (BUILD_SHARED_LIBS)
set_target_properties(llama PROPERTIES POSITION_INDEPENDENT_CODE ON)
target_compile_definitions(llama PRIVATE LLAMA_SHARED LLAMA_BUILD)
diff --git a/ggml.c b/ggml.c
index d9a95af..281b202 100644
--- a/ggml.c
+++ b/ggml.c
@@ -7992,6 +7992,9 @@ static void ggml_compute_forward_mul_mat_q_f32(
else if (type == GGML_TYPE_Q4_2) {
dequantize_row_q_cuda = dequantize_row_q4_2_cuda;
}
+ else if (type == GGML_TYPE_Q4_3) {
+ dequantize_row_q_cuda = dequantize_row_q4_3_cuda;
+ }
else {
GGML_ASSERT(false);
}