feat: Update llama.cpp

abetlen · abetlen · commit c032fc65b087 · 2024-09-06T04:12:29.000-04:00
diff --git a/llama_cpp/llama_cpp.py b/llama_cpp/llama_cpp.py
@@ -443,6 +443,8 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 #     LLAMA_FTYPE_MOSTLY_Q4_0_4_4      = 33, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_Q4_0_4_8      = 34, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_Q4_0_8_8      = 35, // except 1d tensors
+#     LLAMA_FTYPE_MOSTLY_TQ1_0         = 36, // except 1d tensors
+#     LLAMA_FTYPE_MOSTLY_TQ2_0         = 37, // except 1d tensors
 #
 #     LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
 # };
@@ -479,6 +481,8 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 LLAMA_FTYPE_MOSTLY_Q4_0_4_4 = 33
 LLAMA_FTYPE_MOSTLY_Q4_0_4_8 = 34
 LLAMA_FTYPE_MOSTLY_Q4_0_8_8 = 35
+LLAMA_FTYPE_MOSTLY_TQ1_0 = 36
+LLAMA_FTYPE_MOSTLY_TQ2_0 = 37
 LLAMA_FTYPE_GUESSED = 1024
 
 # enum llama_rope_scaling_type {
diff --git a/vendor/llama.cpp b/vendor/llama.cpp
@@ -1 +1 @@
-Subproject commit 581c305186a0ff93f360346c57e21fe16e967bb7
+Subproject commit 8ebe8ddebd68526757c631cd019de009697c63c2