feat: Update llama.cpp · coderonion/llama-cpp-python@748c0ce · GitHub
[go: up one dir, main page]

Skip to content

Commit 748c0ce

Browse files
committed
feat: Update llama.cpp
1 parent 53f6f5f commit 748c0ce

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

llama_cpp/llama_cpp.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -190,6 +190,7 @@ def _load_shared_library(lib_base_name: str):
190190
# LLAMA_FTYPE_MOSTLY_Q2_K_S = 21, // except 1d tensors
191191
# LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22, // except 1d tensors
192192
# LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23, // except 1d tensors
193+
# LLAMA_FTYPE_MOSTLY_IQ1_S = 24, // except 1d tensors
193194

194195
# LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
195196
# };
@@ -215,6 +216,7 @@ def _load_shared_library(lib_base_name: str):
215216
LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
216217
LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22
217218
LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23
219+
LLAMA_FTYPE_MOSTLY_IQ1_S = 24
218220
LLAMA_FTYPE_GUESSED = 1024
219221

220222
# enum llama_rope_scaling_type {

vendor/llama.cpp

0 commit comments

Comments
 (0)
0