mirror of
https://github.com/wassname/SimPO.git
synced 2026-06-27 15:13:50 +08:00
fix on-policy data order
This commit is contained in:
@@ -30,7 +30,7 @@ tokenizer = llm.get_tokenizer()
|
||||
|
||||
train_dataset= load_dataset(data_dir, split='train_prefs')
|
||||
|
||||
prompts = list(set(train_dataset['prompt']))
|
||||
prompts = sorted(list(set(train_dataset['prompt'])))
|
||||
|
||||
conversations = [tokenizer.apply_chat_template([{'role': 'user', 'content': prompt}], tokenize=False, add_generation_prompt=True) for prompt in prompts]
|
||||
|
||||
|
||||
Reference in New Issue
Block a user