1 parent d938e59 commit fd9f294
llama_cpp/llama.py
@@ -814,7 +814,7 @@ def _create_completion(
         llama_cpp.llama_reset_timings(self.ctx)

         if len(prompt_tokens) > self._n_ctx:
-            raise ValueError(f"Requested tokens exceed context window of {self._n_ctx}")
+            raise ValueError(f"Requested tokens ({len(prompt_tokens)}) exceed context window of {self._n_ctx}")

         # Truncate max_tokens if requested tokens would exceed the context window
         max_tokens = (
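For context, a minimal sketch of the guard this commit touches: the check rejects prompts longer than the context window, and the new message includes the offending token count. The values of prompt_tokens and n_ctx below are hypothetical stand-ins for the tokenized prompt and the model's context size.

    # Hypothetical values; in llama.py these come from the tokenized prompt and self._n_ctx.
    prompt_tokens = list(range(600))  # pretend the prompt tokenized to 600 tokens
    n_ctx = 512                       # pretend the model was loaded with a 512-token context window

    if len(prompt_tokens) > n_ctx:
        # After this commit, the error reports the actual token count, which makes
        # it easier to see how far over the limit the request was.
        raise ValueError(
            f"Requested tokens ({len(prompt_tokens)}) exceed context window of {n_ctx}"
        )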