diff --git a/llama_cpp/llama.py b/llama_cpp/llama.py index a37a62aef..b780ef6c6 100644 --- a/llama_cpp/llama.py +++ b/llama_cpp/llama.py @@ -1523,7 +1523,8 @@ def logit_bias_processor( if self.verbose: print("Llama._create_completion: cache save", file=sys.stderr) self.cache[prompt_tokens + completion_tokens] = self.save_state() - print("Llama._create_completion: cache saved", file=sys.stderr) + if self.verbose: + print("Llama._create_completion: cache saved", file=sys.stderr) return if self.cache: