diff --git a/examples/high_level_api_basic_inference.py b/examples/high_level_api_inference.py
similarity index 78%
rename from examples/high_level_api_basic_inference.py
rename to examples/high_level_api_inference.py
index a72adf1..136f22c 100644
--- a/examples/high_level_api_basic_inference.py
+++ b/examples/high_level_api_inference.py
@@ -4,14 +4,14 @@ import argparse
 from llama_cpp import Llama
 
 parser = argparse.ArgumentParser()
-parser.add_argument("-m", "--model", type=str, default=".//models/...")
+parser.add_argument("-m", "--model", type=str, default="./models/...")
 args = parser.parse_args()
 
 llm = Llama(model_path=args.model)
 
 output = llm(
     "Question: What are the names of the planets in the solar system? Answer: ",
-    max_tokens=48,
+    max_tokens=1,
     stop=["Q:", "\n"],
     echo=True,
 )