Add support for Meta Llama 3 70B in HuggingChat (#1029)
.env.template CHANGED

@@ -27,6 +27,31 @@ MODELS=`[
       }
     ]
   },
+  {
+    "name" : "meta-llama/Meta-Llama-3-70B-Instruct",
+    "description": "Generation over generation, Meta Llama 3 demonstrates state-of-the-art performance on a wide range of industry benchmarks and offers new capabilities, including improved reasoning.",
+    "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
+    "modelUrl": "https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instruct",
+    "websiteUrl": "https://llama.meta.com/llama3/",
+    "tokenizer" : "meta-llama/Meta-Llama-3-70B-Instruct",
+    "promptExamples" : [
+      {
+        "title": "Write an email from bullet list",
+        "prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
+      }, {
+        "title": "Code a snake game",
+        "prompt": "Code a basic snake game in python, give explanations for each step."
+      }, {
+        "title": "Assist in a task",
+        "prompt": "How do I make a delicious lemon cheesecake?"
+      }
+    ],
+    "parameters": {
+      "stop": ["<|eot_id|>"],
+      "truncate": 6144,
+      "max_new_tokens": 2047
+    }
+  },
   {
     "name" : "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
     "tokenizer": "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",

@@ -51,7 +76,7 @@ MODELS=`[
         "prompt": "How do I make a delicious lemon cheesecake?"
       }
     ]
-
+  },
   {
     "name" : "mistralai/Mixtral-8x7B-Instruct-v0.1",
     "description" : "The latest MoE model from Mistral AI! 8x7B and outperforms Llama 2 70B in most benchmarks.",
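The `parameters` block is what makes the new entry work end to end: `<|eot_id|>` is Llama 3's end-of-turn marker, and the token budgets (`truncate`, presumably the prompt-side limit, plus `max_new_tokens`) keep prompt and completion inside the model's 8192-token context window (6144 + 2047 < 8192). As a rough illustration of the config's shape, here is a standalone sketch, not chat-ui's actual model loader, assuming `process.env.MODELS` holds the backtick-quoted block above and that a JSON5-tolerant parser is acceptable:

// Standalone sketch (assumed shapes, not chat-ui's real loader):
// parse the MODELS template string and inspect the new entry.
import JSON5 from "json5";

interface ModelConfig {
	name: string;
	tokenizer?: string;
	parameters?: {
		stop?: string[];
		truncate?: number;
		max_new_tokens?: number;
	};
}

const models = JSON5.parse(process.env.MODELS ?? "[]") as ModelConfig[];
const llama3 = models.find((m) => m.name === "meta-llama/Meta-Llama-3-70B-Instruct");

// 6144 prompt tokens + 2047 generated tokens stays under the 8192 context.
console.log(llama3?.parameters);
// { stop: ["<|eot_id|>"], truncate: 6144, max_new_tokens: 2047 }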
src/lib/components/ModelCardMetadata.svelte CHANGED

@@ -1,6 +1,7 @@
 <script lang="ts">
 	import CarbonEarth from "~icons/carbon/earth";
 	import CarbonArrowUpRight from "~icons/carbon/arrow-up-right";
+	import BIMeta from "~icons/bi/meta";
 	import type { Model } from "$lib/types/Model";

 	export let model: Pick<Model, "name" | "datasetName" | "websiteUrl" | "modelUrl" | "datasetUrl">;

@@ -41,8 +42,13 @@
 		class="ml-auto flex items-center hover:underline"
 		rel="noreferrer"
 	>
-		<CarbonEarth class="mr-1.5 shrink-0 text-xs text-gray-400" />
-		Website
+		{#if model.name === "meta-llama/Meta-Llama-3-70B-Instruct"}
+			<BIMeta class="mr-1.5 shrink-0 text-xs text-gray-400" />
+			Built with Meta Llama 3
+		{:else}
+			<CarbonEarth class="mr-1.5 shrink-0 text-xs text-gray-400" />
+			Website
+		{/if}
 	</a>
 {/if}
 </div>

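The badge swap is not purely cosmetic: Meta's Llama 3 license asks products built on the model to display "Built with Meta Llama 3" attribution, which is why the link icon and text change for exactly this model id. If more Meta Llama 3 checkpoints were added later (e.g. the 8B variant), one could imagine generalizing the hard-coded check; a hypothetical helper, not part of this PR:

// Hypothetical helper (not in the PR): match any Meta Llama 3 checkpoint
// instead of hard-coding the single 70B model id.
const needsLlama3Badge = (name: string): boolean =>
	name.startsWith("meta-llama/Meta-Llama-3");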
src/routes/conversation/[id]/+server.ts CHANGED

@@ -447,7 +447,8 @@ export async function POST({ request, locals, params, getClientAddress }) {
 					messageToWriteTo.content += output.token.text;
 				}
 			} else {
-				messageToWriteTo.interrupted = !output.token.special;
+				messageToWriteTo.interrupted =
+					!output.token.special && !model.parameters.stop?.includes(output.token.text);
 				// add output.generated text to the last message
 				// strip end tokens from the output.generated_text
 				const text = (model.parameters.stop ?? []).reduce((acc: string, curr: string) => {
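This change closes the loop with the `stop` array configured above: previously the final message was flagged as interrupted whenever the last streamed token was not a special token, so a Llama 3 completion that ends by emitting the plain-text `<|eot_id|>` stop string would be mislabeled as cut off. A minimal sketch of the new check, with simplified types standing in for the real streaming-output shapes:

// Simplified shapes; the real ones come from the streaming generation output.
interface FinalToken {
	text: string;
	special: boolean;
}

// A completion counts as "interrupted" only when its last token is neither
// a special token nor one of the model's configured stop strings.
function isInterrupted(token: FinalToken, stop?: string[]): boolean {
	return !token.special && !stop?.includes(token.text);
}

isInterrupted({ text: "<|eot_id|>", special: false }, ["<|eot_id|>"]); // false: clean stop
isInterrupted({ text: "and", special: false }, ["<|eot_id|>"]); // true: cut off mid-sentence

The lines that follow then strip those same stop strings from `output.generated_text`, so `<|eot_id|>` never appears in the rendered message.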