|
import { PUBLIC_SEP_TOKEN } from "$env/static/public"; |
|
import { buildPrompt } from "$lib/buildPrompt.js"; |
|
import { abortedGenerations } from "$lib/server/abortedGenerations.js"; |
|
import { collections } from "$lib/server/database.js"; |
|
import { modelEndpoint } from "$lib/server/modelEndpoint.js"; |
|
import type { Message } from "$lib/types/Message.js"; |
|
import { concatUint8Arrays } from "$lib/utils/concatUint8Arrays.js"; |
|
import { streamToAsyncIterable } from "$lib/utils/streamToAsyncIterable"; |
|
import { trimPrefix } from "$lib/utils/trimPrefix.js"; |
|
import { trimSuffix } from "$lib/utils/trimSuffix.js"; |
|
import type { TextGenerationStreamOutput } from "@huggingface/inference"; |
|
import { error } from "@sveltejs/kit"; |
|
import { ObjectId } from "mongodb"; |
|
|
|
/**
 * Handles a new user message for an existing conversation.
 *
 * Looks up the conversation by id and session, builds a prompt from the stored
 * messages plus the new user input, forwards it to a model endpoint and streams
 * the endpoint's response back to the caller. In parallel, a second copy of the
 * stream is parsed so that the assistant's answer can be stored on the
 * conversation once generation finishes (or is aborted).
 *
 * @throws a 404 error when no conversation matches the id and session.
 * @throws Error when the model endpoint answers without a response body.
 */
export async function POST({ request, fetch, locals, params }) {
	const convId = new ObjectId(params.id);
	// Taken before generation starts; parseGeneratedText compares it against
	// the abort timestamp recorded for this conversation.
	const date = new Date();

	const conv = await collections.conversations.findOne({
		_id: convId,
		sessionId: locals.sessionId,
	});

	if (!conv) {
		throw error(404, "Conversation not found");
	}

	const json = await request.json();

	const messages = [...conv.messages, { from: "user", content: json.inputs }] satisfies Message[];
	const prompt = buildPrompt(messages);

	const randomEndpoint = modelEndpoint();

	const abortController = new AbortController();

	const resp = await fetch(randomEndpoint.endpoint, {
		headers: {
			"Content-Type": request.headers.get("Content-Type") ?? "application/json",
			Authorization: randomEndpoint.authorization,
		},
		method: "POST",
		body: JSON.stringify({
			// Forward the caller's payload as-is, but replace the raw user input
			// with the full prompt built from the conversation history.
			...json,
			inputs: prompt,
		}),
		signal: abortController.signal,
	});

	// `Response.body` is null for body-less responses; fail with a clear message
	// instead of a TypeError from calling `.tee()` on null.
	if (!resp.body) {
		throw new Error("Response body is empty");
	}

	// One branch is streamed to the client, the other is consumed server-side
	// to extract and persist the generated text.
	const [stream1, stream2] = resp.body.tee();

	/** Reads the second stream branch to completion and stores the assistant's answer. */
	async function saveMessage() {
		let generated_text = await parseGeneratedText(stream2, convId, date, abortController);

		// Drop the prompt when the endpoint echoes it at the start of its output.
		if (generated_text.startsWith(prompt)) {
			generated_text = generated_text.slice(prompt.length);
		}

		generated_text = trimSuffix(trimPrefix(generated_text, "<|startoftext|>"), PUBLIC_SEP_TOKEN);

		messages.push({ from: "assistant", content: generated_text });

		await collections.conversations.updateOne(
			{
				_id: convId,
			},
			{
				$set: {
					messages,
					updatedAt: new Date(),
				},
			}
		);
	}

	// Fire-and-forget: persistence must not delay the streamed response; failures are only logged.
	saveMessage().catch(console.error);

	// Mirror the endpoint's headers and status while streaming its body through.
	return new Response(stream1, {
		headers: Object.fromEntries(resp.headers.entries()),
		status: resp.status,
		statusText: resp.statusText,
	});
}
|
|
|
/**
 * Removes a conversation.
 *
 * The conversation is first looked up by both its id and the caller's session
 * id, so only a conversation matching the current session can be deleted.
 *
 * @throws a 404 error when no conversation matches the id and session.
 * @returns an empty response once the document has been deleted.
 */
export async function DELETE({ locals, params }) {
	const ownedConversationFilter = {
		_id: new ObjectId(params.id),
		sessionId: locals.sessionId,
	};

	const existing = await collections.conversations.findOne(ownedConversationFilter);
	if (!existing) {
		throw error(404, "Conversation not found");
	}

	// Delete by the id of the document that was actually found.
	const { _id } = existing;
	await collections.conversations.deleteOne({ _id });

	return new Response();
}
|
|
|
/**
 * Consumes a streamed text-generation response and returns the generated text.
 *
 * While reading, the function checks after every chunk whether an abort was
 * recorded for this conversation after `promptedAt`. If so, it aborts the
 * upstream request and returns the concatenation of the token texts received
 * so far. Otherwise it reads the stream to the end and returns the
 * `generated_text` field of the last `data:` line.
 *
 * @param stream - Stream of byte chunks containing `data:`-prefixed JSON lines.
 * @param conversationId - Conversation whose abort timestamp is looked up.
 * @param promptedAt - Time the generation was requested; only later aborts apply.
 * @param abortController - Controller used to cancel the upstream request on abort.
 * @returns The text generated so far (on abort) or the final generated text.
 * @throws Error when no `data` line is found or `generated_text` is not a string;
 *   a SyntaxError from `JSON.parse` when the last line is not valid JSON.
 */
async function parseGeneratedText(
	stream: ReadableStream,
	conversationId: ObjectId,
	promptedAt: Date,
	abortController: AbortController
): Promise<string> {
	const inputs: Uint8Array[] = [];
	for await (const input of streamToAsyncIterable(stream)) {
		inputs.push(input);

		const date = abortedGenerations.get(conversationId.toString());

		// An abort recorded before this prompt was sent belongs to an earlier generation.
		if (date && date > promptedAt) {
			abortController.abort("Cancelled by user");
			// Decode everything received so far at once, so characters split
			// across chunk boundaries are decoded correctly.
			const completeInput = concatUint8Arrays(inputs);

			const lines = new TextDecoder()
				.decode(completeInput)
				.split("\n")
				.filter((line) => line.startsWith("data:"));

			const tokens = lines.map((line) => {
				try {
					const json: TextGenerationStreamOutput = JSON.parse(line.slice("data:".length));
					return json.token.text;
				} catch {
					// The last line may be truncated by the abort; skip anything unparsable.
					return "";
				}
			});
			return tokens.join("");
		}
	}

	const completeInput = concatUint8Arrays(inputs);

	const message = new TextDecoder().decode(completeInput);

	// Prefer the last `data:` line; fall back to the first "data" occurrence
	// when the payload holds a single line without a preceding newline.
	let lastIndex = message.lastIndexOf("\ndata:");
	if (lastIndex === -1) {
		lastIndex = message.indexOf("data");
	}

	// Without a marker there is nothing to parse. Fail here with a descriptive
	// error rather than slicing from index -1 and hitting an unrelated
	// JSON.parse SyntaxError further down.
	if (lastIndex === -1) {
		throw new Error("Could not parse in last message");
	}

	let lastMessage = message.slice(lastIndex).trim().slice("data:".length);
	// Keep only the first line of the remainder.
	if (lastMessage.includes("\n")) {
		lastMessage = lastMessage.slice(0, lastMessage.indexOf("\n"));
	}

	const res = JSON.parse(lastMessage).generated_text;

	if (typeof res !== "string") {
		throw new Error("Could not parse generated text");
	}

	return res;
}
|
|