mirror of
https://github.com/abetlen/llama-cpp-python.git
synced 2023-09-07 17:34:22 +03:00
Bugfix: n_batch should always be <= n_ctx
This commit is contained in:
@@ -68,7 +68,7 @@ class Llama:
 maxlen=self.last_n_tokens_size,
 )
 self.tokens_consumed = 0
-self.n_batch = n_batch
+self.n_batch = min(n_ctx, n_batch)
 
 self.n_threads = n_threads or multiprocessing.cpu_count()
 
Reference in New Issue
Block a user