Husnain committed on
Commit
11d1015
1 Parent(s): e51b66c

⚡ [Enhance] Upgrade gemma-7b to 1.1

Browse files
Files changed (1) hide show
  1. messagers/message_composer.py +6 -6
messagers/message_composer.py CHANGED
@@ -52,7 +52,7 @@ class MessageComposer:
52
  # - https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1#instruction-format
53
  # - https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO#prompt-format
54
  # - https://huggingface.co/openchat/openchat-3.5-0106
55
- # - https://huggingface.co/google/gemma-1.1-7b-it#chat-template
56
 
57
  # Mistral and Mixtral:
58
  # <s> [INST] Instruction [/INST] Model answer </s> [INST] Follow-up instruction [/INST]
@@ -126,7 +126,7 @@ class MessageComposer:
126
  self.merged_str_list.append(f"GPT4 Correct Assistant:\n")
127
  self.merged_str = "\n".join(self.merged_str_list)
128
  # https://huggingface.co/google/gemma-1.1-7b-it#chat-template
129
- elif self.model in ["gemma-1.1-7b"]:
130
  self.messages = self.concat_messages_by_role(messages)
131
  self.merged_str_list = []
132
  self.end_of_turn = "<end_of_turn>"
@@ -147,11 +147,11 @@ class MessageComposer:
147
  f"{self.start_of_turn}user\n{content}{self.end_of_turn}"
148
  )
149
  self.merged_str_list.append(f"{self.start_of_turn}model\n")
150
- self.merged_str = "\n".join(self.merged_str_list)
151
  # https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO#prompt-format
152
  # https://huggingface.co/openchat/openchat-3.5-0106
153
  # elif self.model in ["openchat-3.5", "nous-mixtral-8x7b"]:
154
- elif self.model in ["openchat-3.5", "command-r-plus"]:
155
  tokenizer = AutoTokenizer.from_pretrained(self.model_fullname)
156
  self.merged_str = tokenizer.apply_chat_template(
157
  messages, tokenize=False, add_generation_prompt=True
@@ -167,9 +167,9 @@ class MessageComposer:
167
  if __name__ == "__main__":
168
  # model = "mixtral-8x7b"
169
  # model = "nous-mixtral-8x7b"
170
- # model = "gemma-1.1-7b"
171
  # model = "openchat-3.5"
172
- model = "command-r-plus"
173
  composer = MessageComposer(model)
174
  messages = [
175
  {
 
52
  # - https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1#instruction-format
53
  # - https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO#prompt-format
54
  # - https://huggingface.co/openchat/openchat-3.5-0106
55
+ # - https://huggingface.co/google/gemma-7b-it#chat-template
56
 
57
  # Mistral and Mixtral:
58
  # <s> [INST] Instruction [/INST] Model answer </s> [INST] Follow-up instruction [/INST]
 
126
  self.merged_str_list.append(f"GPT4 Correct Assistant:\n")
127
  self.merged_str = "\n".join(self.merged_str_list)
128
  # https://huggingface.co/google/gemma-1.1-7b-it#chat-template
129
+ elif self.model in ["gemma-7b"]:
130
  self.messages = self.concat_messages_by_role(messages)
131
  self.merged_str_list = []
132
  self.end_of_turn = "<end_of_turn>"
 
147
  f"{self.start_of_turn}user\n{content}{self.end_of_turn}"
148
  )
149
  self.merged_str_list.append(f"{self.start_of_turn}model\n")
150
+ self.merged_str = "<bos>" + "\n".join(self.merged_str_list)
151
  # https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO#prompt-format
152
  # https://huggingface.co/openchat/openchat-3.5-0106
153
  # elif self.model in ["openchat-3.5", "nous-mixtral-8x7b"]:
154
+ elif self.model in ["openchat-3.5", "command-r-plus", "gemma-7b"]:
155
  tokenizer = AutoTokenizer.from_pretrained(self.model_fullname)
156
  self.merged_str = tokenizer.apply_chat_template(
157
  messages, tokenize=False, add_generation_prompt=True
 
167
  if __name__ == "__main__":
168
  # model = "mixtral-8x7b"
169
  # model = "nous-mixtral-8x7b"
170
+ model = "gemma-7b"
171
  # model = "openchat-3.5"
172
+ # model = "command-r-plus"
173
  composer = MessageComposer(model)
174
  messages = [
175
  {