feat: Update llama.cpp · sunnykim1206/llama-cpp-python@4edde21 · GitHub
[go: up one dir, main page]

Skip to content

Commit 4edde21

Browse files
committed
feat: Update llama.cpp
1 parent f57b01a commit 4edde21

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

llama_cpp/llama_cpp.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -191,6 +191,7 @@ def _load_shared_library(lib_base_name: str):
191191
# LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22, // except 1d tensors
192192
# LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23, // except 1d tensors
193193
# LLAMA_FTYPE_MOSTLY_IQ1_S = 24, // except 1d tensors
194+
# LLAMA_FTYPE_MOSTLY_IQ4_NL = 25, // except 1d tensors
194195

195196
# LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
196197
# };
@@ -217,6 +218,7 @@ def _load_shared_library(lib_base_name: str):
217218
LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22
218219
LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23
219220
LLAMA_FTYPE_MOSTLY_IQ1_S = 24
221+
LLAMA_FTYPE_MOSTLY_IQ4_NL = 25
220222
LLAMA_FTYPE_GUESSED = 1024
221223

222224
# enum llama_rope_scaling_type {

vendor/llama.cpp

0 commit comments

Comments
 (0)
0