Compare commits

...

2 Commits

Author SHA1 Message Date
cebtenzzre
9a19c740ee
kompute: fix library loading issues with kp_logger (#1517) 2023-10-16 16:58:17 -04:00
Aaron Miller
f79557d2aa speedup: just use mat*vec shaders for mat*mat
So far my from-scratch mat*mat shaders are still slower than just running more
invocations of the existing Metal-ported mat*vec shaders. It should be
theoretically possible to make a mat*mat that's faster (for actual
mat*mat cases) than an optimal mat*vec, but it will need to be at
*least* as fast as the mat*vec op and then take special care to be
cache-friendly and save memory bandwidth, as the number of compute ops is the
same.
2023-10-16 13:45:51 -04:00
2 changed files with 2 additions and 11 deletions

@ -1 +1 @@
Subproject commit 500689ad356a81a471a7fb68cc70f7aee5a5f56e Subproject commit ffe96e1ebf9cdae1dc82b2049d9e45c1875472ab

View File

@ -222,6 +222,7 @@ if (LLAMA_KOMPUTE)
if (EXISTS "${LLAMA_DIR}/kompute/CMakeLists.txt") if (EXISTS "${LLAMA_DIR}/kompute/CMakeLists.txt")
message(STATUS "Kompute found") message(STATUS "Kompute found")
set(KOMPUTE_OPT_LOG_LEVEL Error CACHE STRING "Kompute log level")
add_subdirectory(${LLAMA_DIR}/kompute) add_subdirectory(${LLAMA_DIR}/kompute)
# Compile our shaders # Compile our shaders
@ -239,11 +240,6 @@ if (LLAMA_KOMPUTE)
kompute/op_rmsnorm.comp kompute/op_rmsnorm.comp
kompute/op_diagmask.comp kompute/op_diagmask.comp
kompute/op_mul_mat_mat_f32.comp kompute/op_mul_mat_mat_f32.comp
kompute/op_mul_mat_mat_f16.comp
kompute/op_mul_mat_mat_q8_0.comp
kompute/op_mul_mat_mat_q4_0.comp
kompute/op_mul_mat_mat_q4_1.comp
kompute/op_mul_mat_mat_q6_k.comp
kompute/op_mul_mat_f16.comp kompute/op_mul_mat_f16.comp
kompute/op_mul_mat_q8_0.comp kompute/op_mul_mat_q8_0.comp
kompute/op_mul_mat_q4_0.comp kompute/op_mul_mat_q4_0.comp
@ -275,11 +271,6 @@ if (LLAMA_KOMPUTE)
shaderop_rmsnorm.h shaderop_rmsnorm.h
shaderop_diagmask.h shaderop_diagmask.h
shaderop_mul_mat_mat_f32.h shaderop_mul_mat_mat_f32.h
shaderop_mul_mat_mat_f16.h
shaderop_mul_mat_mat_q8_0.h
shaderop_mul_mat_mat_q4_0.h
shaderop_mul_mat_mat_q4_1.h
shaderop_mul_mat_mat_q6_k.h
shaderop_mul_mat_f16.h shaderop_mul_mat_f16.h
shaderop_mul_mat_q8_0.h shaderop_mul_mat_q8_0.h
shaderop_mul_mat_q4_0.h shaderop_mul_mat_q4_0.h