Commit dafc5c2f authored by jbreton

Update Mistral hyper parameters and results

parent c1653711
@@ -57,7 +57,8 @@ def fine_tune(base_model, new_model):
     # Hyperparameters should be adjusted based on the hardware you are using
     training_arguments = TrainingArguments(
         per_device_train_batch_size=2,
-        gradient_accumulation_steps=1,
+        gradient_accumulation_steps=2,
+        num_train_epochs=6,
         learning_rate=1e-4,
         logging_steps=2,
         optim="adamw_torch",
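For reference, a minimal sketch of how the updated arguments fit together after this commit, assuming the standard Hugging Face transformers API. The output_dir value and the elided remainder of fine_tune are illustrative assumptions, not taken from the repository. Raising gradient_accumulation_steps to 2 means gradients are accumulated over two forward/backward passes before each optimizer step, for an effective batch size of per_device_train_batch_size * gradient_accumulation_steps = 4.

from transformers import TrainingArguments

def fine_tune(base_model, new_model):
    # Hyperparameters should be adjusted based on the hardware you are using
    training_arguments = TrainingArguments(
        output_dir=new_model,             # assumption: checkpoints named after the new model
        per_device_train_batch_size=2,
        gradient_accumulation_steps=2,    # effective batch size: 2 * 2 = 4
        num_train_epochs=6,
        learning_rate=1e-4,
        logging_steps=2,
        optim="adamw_torch",
    )
    # ... rest of the function (model loading, trainer setup) elided here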
Source diff for the results file could not be displayed: it is too large.