mirror of
https://github.com/abetlen/llama-cpp-python.git
synced 2023-09-07 17:34:22 +03:00
Update llama.py: Added how many input tokens in ValueError exception
This commit is contained in:
@@ -814,7 +814,7 @@ class Llama:
|
|||||||
llama_cpp.llama_reset_timings(self.ctx)
|
llama_cpp.llama_reset_timings(self.ctx)
|
||||||
|
|
||||||
if len(prompt_tokens) > self._n_ctx:
|
if len(prompt_tokens) > self._n_ctx:
|
||||||
raise ValueError(f"Requested tokens exceed context window of {self._n_ctx}")
|
raise ValueError(f"Requested tokens ({len(prompt_tokens)}) exceed context window of {self._n_ctx}")
|
||||||
|
|
||||||
# Truncate max_tokens if requested tokens would exceed the context window
|
# Truncate max_tokens if requested tokens would exceed the context window
|
||||||
max_tokens = (
|
max_tokens = (
|
||||||
|
|||||||
Reference in New Issue
Block a user