Skip to content

Commit 03531bb

Browse files
committed
dpo nb lightly cleaned
1 parent 1bf4e45 commit 03531bb

File tree

1 file changed

+3
-10
lines changed

1 file changed

+3
-10
lines changed

dpo.ipynb

+3 -10
Original file line number | Diff line number | Diff line change
@@ -223,10 +223,6 @@
223223
"metadata": {},
224224
"outputs": [],
225225
"source": [
226-
"# Define template: `response_template_ids`, `collator`, `format_prompt`\n",
227-
"response_template_ids = tokenizer.encode(response_template, add_special_tokens=False)[1:]\n",
228-
"collator = DataCollatorForCompletionOnlyLM(response_template_ids, tokenizer=tokenizer)\n",
229-
"\n",
230226
"def format_prompt(example) -> Tuple[str, str]:\n",
231227
" return f\"{example['context']} \\n-- Question: {example['question']}{response_template}\", example['answer']"
232228
]
@@ -323,7 +319,7 @@
323319
" return out\n",
324320
"\n",
325321
" dataset.set_transform(batched_mutate)\n",
326-
" return dataset # dataset.map(batched_mutate, batched=True, num_proc=num_proc, remove_columns=original_columns)"
322+
" return dataset"
327323
]
328324
},
329325
{
@@ -427,18 +423,15 @@
427423
" model_ref, # The model with peft adapters turned off will be used as a reference model if not provided\n",
428424
" tokenizer=tokenizer,\n",
429425
" train_dataset=ds,\n",
430-
" # eval_dataset=eval_dataset,\n",
431-
" beta=0.2, # TODO: determine\n",
426+
" beta=0.2, \n",
432427
" max_length=2048,\n",
433-
" # max_target_length=248,\n",
434428
" max_prompt_length=1500,\n",
435429
" args=TrainingArguments(\n",
436430
" output_dir=\"./dpo_results\",\n",
437431
" optim=\"paged_adamw_32bit\",\n",
438432
"\n",
439433
" max_grad_norm=0.3,\n",
440434
" warmup_ratio=0.03,\n",
441-
" # group_by_length=True,\n",
442435
" \n",
443436
" learning_rate=2e-4,\n",
444437
" weight_decay=0.001,\n",
@@ -533,7 +526,7 @@
533526
"metadata": {},
534527
"outputs": [],
535528
"source": [
536-
"# Fine-tuned model\n",
529+
"# Save trained model\n",
537530
"new_model = \"open_llama_3b_v2_sft_plus_dpo\"\n",
538531
"trainer.model.save_pretrained(new_model)"
539532
]

0 commit comments

Comments
 (0)