diff --git a/model/supervised_finetuning/custom_datasets/formatting.py b/model/supervised_finetuning/custom_datasets/formatting.py
index 2f0adecd..a6c1c0d8 100644
--- a/model/supervised_finetuning/custom_datasets/formatting.py
+++ b/model/supervised_finetuning/custom_datasets/formatting.py
@@ -2,4 +2,4 @@ QA_SPECIAL_TOKENS = {"Question": "", "Answer": "", "StartPrefix": "<
 
 
 def format_pair(pair):
-    return "{} {} {}".format(QA_SPECIAL_TOKENS["Question"], pair[0], QA_SPECIAL_TOKENS["Answer"]), pair[1]
+    return "{}{}{}".format(QA_SPECIAL_TOKENS["Question"], pair[0], QA_SPECIAL_TOKENS["Answer"]), pair[1]