Fix on-policy data order: sort the de-duplicated prompts so their order is deterministic across runs

This commit is contained in:
Yu Meng
2024-08-22 16:06:04 -04:00
parent 54545e803b
commit 2dcc4350f8
+1 -1
View File
@@ -30,7 +30,7 @@ tokenizer = llm.get_tokenizer()
train_dataset= load_dataset(data_dir, split='train_prefs') train_dataset= load_dataset(data_dir, split='train_prefs')
prompts = list(set(train_dataset['prompt'])) prompts = sorted(list(set(train_dataset['prompt'])))
conversations = [tokenizer.apply_chat_template([{'role': 'user', 'content': prompt}], tokenize=False, add_generation_prompt=True) for prompt in prompts] conversations = [tokenizer.apply_chat_template([{'role': 'user', 'content': prompt}], tokenize=False, add_generation_prompt=True) for prompt in prompts]