HF-Chat-with-domain-filters

Sleeping

olivierdehaene committed on Apr 26, 2023

Commit

ffa4f55

unverified ·

1 Parent(s): b56bba1

✨ Add preprompt (#124)

Co-authored-by: OlivierDehaene <Olivier.dehaene@gmail.com>

Files changed (3) hide show

.env CHANGED Viewed

@@ -13,6 +13,7 @@ PUBLIC_DISABLE_INTRO_TILES=false
 PUBLIC_USER_MESSAGE_TOKEN=<|prompter|>
 PUBLIC_ASSISTANT_MESSAGE_TOKEN=<|assistant|>
 PUBLIC_SEP_TOKEN=<|endoftext|>
 # [{"endpoint": "https://api-inference.huggingface.co/models/...", "authorization": "Bearer hf_<token>", "weight": 1}] to load balance
 # E.g., if one endpoint has weight 2 and the other has weight 1, the first endpoint will be called twice as often

 PUBLIC_USER_MESSAGE_TOKEN=<|prompter|>
 PUBLIC_ASSISTANT_MESSAGE_TOKEN=<|assistant|>
 PUBLIC_SEP_TOKEN=<|endoftext|>
+PUBLIC_PREPROMPT="Below are a series of dialogues between various people and an AI assistant. The AI tries to be helpful, polite, honest, sophisticated, emotionally aware, and humble-but-knowledgeable. The assistant is happy to help with almost anything, and will do its best to understand exactly what is needed. It also tries to avoid giving false or misleading information, and it caveats when it isn't entirely sure about the right answer. That said, the assistant is practical and really does its best, and doesn't let caution get too much in the way of being useful."
 # [{"endpoint": "https://api-inference.huggingface.co/models/...", "authorization": "Bearer hf_<token>", "weight": 1}] to load balance
 # E.g., if one endpoint has weight 2 and the other has weight 1, the first endpoint will be called twice as often

src/lib/buildPrompt.ts CHANGED Viewed

@@ -1,6 +1,7 @@
 import {
 	PUBLIC_ASSISTANT_MESSAGE_TOKEN,
 	PUBLIC_MAX_INPUT_TOKENS,
 	PUBLIC_SEP_TOKEN,
 	PUBLIC_USER_MESSAGE_TOKEN,
 } from "$env/static/public";
@@ -24,5 +25,9 @@ export function buildPrompt(messages: Message[]): string {
 			.join("") + PUBLIC_ASSISTANT_MESSAGE_TOKEN;
 	// Not super precise, but it's truncated in the model's backend anyway
-	return prompt.split(" ").slice(-parseInt(PUBLIC_MAX_INPUT_TOKENS)).join(" ");
 }

 import {
 	PUBLIC_ASSISTANT_MESSAGE_TOKEN,
 	PUBLIC_MAX_INPUT_TOKENS,
+	PUBLIC_PREPROMPT,
 	PUBLIC_SEP_TOKEN,
 	PUBLIC_USER_MESSAGE_TOKEN,
 } from "$env/static/public";
 			.join("") + PUBLIC_ASSISTANT_MESSAGE_TOKEN;
 	// Not super precise, but it's truncated in the model's backend anyway
+	return (
+		PUBLIC_PREPROMPT +
+		"\n-----\n" +
+		prompt.split(" ").slice(-parseInt(PUBLIC_MAX_INPUT_TOKENS)).join(" ")
+	);
 }

src/routes/conversation/[id]/summarize/+server.ts CHANGED Viewed

@@ -21,7 +21,7 @@ export async function POST({ params, locals, fetch }) {
 	const firstMessage = conversation.messages.find((m) => m.from === "user");
 	const userPrompt =
-		`You are a summarizing assistant. Please summarize the following message as a single sentence of less than 5 words:\n` +
 		firstMessage?.content;
 	const prompt = buildPrompt([{ from: "user", content: userPrompt }]);

 	const firstMessage = conversation.messages.find((m) => m.from === "user");
 	const userPrompt =
+		`Please summarize the following message as a single sentence of less than 5 words:\n` +
 		firstMessage?.content;
 	const prompt = buildPrompt([{ from: "user", content: userPrompt }]);