We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 54545e8 commit 2dcc435 (Copy full SHA for 2dcc435)
on_policy_data_gen/decode.py
@@ -30,7 +30,7 @@
30
31
train_dataset= load_dataset(data_dir, split='train_prefs')
32
33
-prompts = list(set(train_dataset['prompt']))
+prompts = sorted(list(set(train_dataset['prompt'])))
34
35
conversations = [tokenizer.apply_chat_template([{'role': 'user', 'content': prompt}], tokenize=False, add_generation_prompt=True) for prompt in prompts]
36
0 commit comments