dvilasuero committed on
Commit
a932ff3
1 Parent(s): bdaa8f7

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +55 -0
README.md ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
4
+
5
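+ Experiment with distilabel: filter the preference pairs (drop ties, keep only rows with `chosen_score` > 5) and format them as ChatML prompt/chosen/rejected triples: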
6
+
7
+ ```python
8
+
9
+ dataset = load_dataset("argilla/distilabel-intel-orca-dpo-pairs", split="train", token=hf_token)
10
+ dataset = dataset.filter(lambda r: r["status"]!="tie" and r["chosen_score"]>5)
11
+
12
+ def chatml_format(example):
13
+ # Format system
14
+ if len(example['system']) > 0:
15
+ message = {"role": "system", "content": example['system']}
16
+ system = tokenizer.apply_chat_template([message], tokenize=False)
17
+ else:
18
+ system = ""
19
+
20
+ # Format instruction
21
+ message = {"role": "user", "content": example['input']}
22
+ prompt = tokenizer.apply_chat_template([message], tokenize=False, add_generation_prompt=True)
23
+
24
+ # Format chosen answer
25
+ chosen = example['chosen'] + "<|im_end|>\n"
26
+
27
+ # Format rejected answer
28
+ rejected = example['rejected'] + "<|im_end|>\n"
29
+
30
+ return {
31
+ "prompt": system + prompt,
32
+ "chosen": chosen,
33
+ "rejected": rejected,
34
+ }
35
+
36
+ # Load dataset
37
+ #dataset = load_dataset("Intel/orca_dpo_pairs")['train']
38
+
39
+ # Save columns
40
+ original_columns = dataset.column_names
41
+
42
+ # Tokenizer
43
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
44
+ tokenizer.pad_token = tokenizer.eos_token
45
+ tokenizer.padding_side = "left"
46
+
47
+ # Format dataset
48
+ dataset = dataset.map(
49
+ chatml_format,
50
+ remove_columns=original_columns
51
+ )
52
+
53
+ # Print sample
54
+ dataset[1]
55
+ ```