Switch the dataset_mixer entry in the Mistral-7B-Instruct SimPO training
config from snorkelai/Snorkel-Mistral-PairRM-DPO-Dataset to
princeton-nlp/mistral-instruct-ultrafeedback (mixing weight 1.0 unchanged).

NOTE(review): line breaks and leading whitespace in the hunk below were
reconstructed from a whitespace-collapsed copy of this patch; confirm the
indentation against the target file before applying.

diff --git a/training_configs/mistral-7b-instruct-simpo.yaml b/training_configs/mistral-7b-instruct-simpo.yaml
index cc42119..8808423 100644
--- a/training_configs/mistral-7b-instruct-simpo.yaml
+++ b/training_configs/mistral-7b-instruct-simpo.yaml
@@ -5,7 +5,7 @@ use_flash_attention_2: true
 
 # Data training arguments
 dataset_mixer:
-  snorkelai/Snorkel-Mistral-PairRM-DPO-Dataset: 1.0
+  princeton-nlp/mistral-instruct-ultrafeedback: 1.0
 dataset_splits:
 - train
 - test