Enhancement to mitigate the assistant response being included in the user message

#1
by dvilasuero HF staff - opened
src/distilabel_dataset_generator/sft.py CHANGED
@@ -151,6 +151,13 @@ def _run_pipeline(result_queue, num_turns, num_rows, system_prompt, token: str =
151
  generation_kwargs={
152
  "temperature": 0.8, # it's the best value for Llama 3.1 70B Instruct
153
  "do_sample": True,
 
 
 
 
 
 
 
154
  },
155
  api_key=token,
156
  ),
 
151
  generation_kwargs={
152
  "temperature": 0.8, # it's the best value for Llama 3.1 70B Instruct
153
  "do_sample": True,
154
+ "stop_sequences": [
155
+ "<|eot_id|>",
156
+ "<|end_of_text|>",
157
+ "<|start_header_id|>",
158
+ "<|end_header_id|>",
159
+ "assistant"
160
+ ]
161
  },
162
  api_key=token,
163
  ),