huggi / src /lib /buildPrompt.ts
andreasmadsen's picture
allow different user and assistant end-token (#375)
f209301 unverified
raw
history blame
1.67 kB
import type { BackendModel } from "./server/models";
import type { Message } from "./types/Message";
import { collections } from "$lib/server/database";
import { ObjectId } from "mongodb";
/**
* Convert [{user: "assistant", content: "hi"}, {user: "user", content: "hello"}] to:
*
* <|assistant|>hi<|endoftext|><|prompter|>hello<|endoftext|><|assistant|>
*/
export async function buildPrompt(
messages: Pick<Message, "from" | "content">[],
model: BackendModel,
webSearchId?: string
): Promise<string> {
const userEndToken = model.userMessageEndToken ?? model.messageEndToken;
const assistantEndToken = model.assistantMessageEndToken ?? model.messageEndToken;
const prompt =
messages
.map((m) =>
m.from === "user"
? model.userMessageToken +
m.content +
(m.content.endsWith(userEndToken) ? "" : userEndToken)
: model.assistantMessageToken +
m.content +
(m.content.endsWith(assistantEndToken) ? "" : assistantEndToken)
)
.join("") + model.assistantMessageToken;
let webPrompt = "";
if (webSearchId) {
const webSearch = await collections.webSearches.findOne({
_id: new ObjectId(webSearchId),
});
if (!webSearch) throw new Error("Web search not found");
if (webSearch.summary) {
webPrompt =
model.assistantMessageToken +
`The following context was found while searching the internet: ${webSearch.summary}` +
model.assistantMessageEndToken;
}
}
const finalPrompt =
model.preprompt +
webPrompt +
prompt
.split(" ")
.slice(-(model.parameters?.truncate ?? 0))
.join(" ");
// Not super precise, but it's truncated in the model's backend anyway
return finalPrompt;
}