Commit e6832e69 authored by Max Kimmich

Use Llama3.1 as default for llamachat

parent f2fd6467
@@ -240,14 +240,14 @@ class Llama(LLMModel):
         group.add_argument(
             "--llama-model",
             type=str,
-            default="QuantFactory/Meta-Llama-3-8B-Instruct-GGUF",
+            default="QuantFactory/Meta-Llama-3.1-8B-Instruct-GGUF",
             help="A pre-trained model from HF hub",
         ),
         group.add_argument(
             "--llama-model-file",
             type=str,
             # TODO provide some help for selecting model files, and point user to set this argument if needed
-            default="Meta-Llama-3-8B-Instruct.Q5_K_M.gguf",
+            default="Meta-Llama-3.1-8B-Instruct.Q8_0.gguf",
             help="Specify the model file in case of a pre-trained model from HF hub, e.g., a specific quantized version",
         ),
         group.add_argument(
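For context, here is a minimal sketch (not taken from this repository) of how defaults like --llama-model and --llama-model-file are typically consumed: the repo id selects a GGUF model on the HF hub, and the model file picks one quantized variant inside that repo. The sketch assumes llama-cpp-python and huggingface_hub; the parser setup and generation parameters are illustrative only.

import argparse

from huggingface_hub import hf_hub_download
from llama_cpp import Llama

# Illustrative argument group mirroring the options changed in this commit.
parser = argparse.ArgumentParser()
group = parser.add_argument_group("llama")
group.add_argument(
    "--llama-model",
    type=str,
    default="QuantFactory/Meta-Llama-3.1-8B-Instruct-GGUF",
    help="A pre-trained model from HF hub",
)
group.add_argument(
    "--llama-model-file",
    type=str,
    default="Meta-Llama-3.1-8B-Instruct.Q8_0.gguf",
    help="Specific file within the HF repo, e.g. a particular quantization",
)
args = parser.parse_args()

# Download the single GGUF file from the hub and load it with llama-cpp-python.
# n_ctx and max_tokens below are placeholder values, not project settings.
model_path = hf_hub_download(repo_id=args.llama_model, filename=args.llama_model_file)
llm = Llama(model_path=model_path, n_ctx=4096)
result = llm("Q: What is the capital of France? A:", max_tokens=16)
print(result["choices"][0]["text"])

The Q8_0 file chosen as the new default is a larger, less aggressively quantized variant than the previous Q5_K_M file, so it trades disk and memory footprint for output quality.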