8000
We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
embeddings=False
1 parent 117cbb2, commit bf5e0bb (Copy full SHA for bf5e0bb)
llama_cpp/server/settings.py
@@ -96,7 +96,7 @@ class ModelSettings(BaseSettings):
96
default=True, description="if true, use experimental mul_mat_q kernels"
97
)
98
logits_all: bool = Field(default=True, description="Whether to return logits.")
99
- embedding: bool = Field(default=True, description="Whether to use embeddings.")
+ embedding: bool = Field(default=False, description="Whether to use embeddings.")
100
offload_kqv: bool = Field(
101
default=True, description="Whether to offload kqv to the GPU."
102
0 commit comments