Commit 2f7798c
Parent(s): a5a608f

try to improve robustness of LLM responses

Changed files:
- src/app/queries/getStory.ts          +37 -23
- src/lib/dirtyCaptionCleaner.ts        +3 -0
- src/lib/dirtyLLMJsonParser.ts        +15 -0
- src/lib/dirtyLLMResponseCleaner.ts    +8 -0
- src/types.ts                          +2 -0
src/app/queries/getStory.ts  CHANGED

@@ -1,10 +1,11 @@
 import { createLlamaPrompt } from "@/lib/createLlamaPrompt"
+import { dirtyLLMResponseCleaner } from "@/lib/dirtyLLMResponseCleaner"
+import { dirtyLLMJsonParser } from "@/lib/dirtyLLMJsonParser"
+import { dirtyCaptionCleaner } from "@/lib/dirtyCaptionCleaner"
 
 import { predict } from "./predict"
 import { Preset } from "../engine/presets"
 
-type LLMResponse = Array<{panel: number; caption: string }>
-
 export const getStory = async ({
   preset,
   prompt = "",
@@ -32,6 +33,7 @@ export const getStory = async ({
 
 
   let result = ""
+
   try {
     result = await predict(query)
     if (!result.trim().length) {
@@ -51,33 +53,45 @@ export const getStory = async ({
   }
 
   console.log("Raw response from LLM:", result)
-
-  const tmp = `${result || ""}`
-    .replaceAll("}}", "}")
-    .replaceAll("]]", "]")
-    .replaceAll(",,", ",")
+  const tmp = dirtyLLMResponseCleaner(result)
+
+  let captions: string[] = []
 
   try {
-    // we only keep what's after the first [
-    let jsonOrNot = `[${tmp.split("[").pop() || ""}`
-
-    // and before the first ]
-    jsonOrNot = `${jsonOrNot.split("]").shift() || ""}]`
-
-    const jsonData = JSON.parse(jsonOrNot) as LLMResponse
-    const captions = jsonData.map(item => item.caption.trim())
-    return captions.map(caption => caption.split(":").pop()?.trim() || "")
+    captions = dirtyLLMJsonParser(tmp)
   } catch (err) {
     console.log(`failed to read LLM response: ${err}`)
 
-    //
-
+    // it is possible that the LLM has generated multiple JSON files like this:
+
+    /*
+    [ {
+      "panel": 1,
+      "caption": "A samurai stands at the edge of a bustling street in San Francisco, looking out of place among the hippies and beatniks."
+    } ]
 
-
-
-
-
+    [ {
+      "panel": 2,
+      "caption": "The samurai spots a group of young people playing music on the sidewalk. He approaches them, intrigued."
+    } ]
+    */
+    try {
+      // in that case, we can try to repair it like so:
+      let strategy2 = `[${tmp.split("[").pop() || ""}`
+      strategy2.replaceAll("[", ",")
 
-
+      captions = dirtyLLMJsonParser(strategy2)
+    } catch (err2) {
+
+      // in case of failure here, it might be because the LLM hallucinated a completely different response,
+      // such as markdown. There is no real solution.. but we can try a fallback:
+
+      captions = (
+        tmp.split("*")
+        .map(item => item.replaceAll("[", "[").replaceAll("]", "]").trim())
+      )
+    }
   }
+
+  return captions.map(caption => dirtyCaptionCleaner(caption))
 }
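Note on the new control flow: getStory now degrades through three parsing strategies (clean-and-parse, repair of concatenated arrays, markdown-ish split) instead of bailing out on the first JSON.parse failure. A minimal sketch of the same cascade as a standalone helper; parseCaptions is hypothetical and not part of this commit:

import { dirtyLLMResponseCleaner } from "@/lib/dirtyLLMResponseCleaner"
import { dirtyLLMJsonParser } from "@/lib/dirtyLLMJsonParser"
import { dirtyCaptionCleaner } from "@/lib/dirtyCaptionCleaner"

// Hypothetical wrapper mirroring the cascade in getStory.ts,
// handy for unit-testing the repair strategies in isolation.
function parseCaptions(raw: string): string[] {
  const tmp = dirtyLLMResponseCleaner(raw)
  try {
    // strategy 1: treat the response as one (slightly dirty) JSON array
    return dirtyLLMJsonParser(tmp).map(dirtyCaptionCleaner)
  } catch {
    // strategies 2 and 3 would follow here, as in the diff above
    return tmp.split("*").map(item => dirtyCaptionCleaner(item.trim()))
  }
}

One caveat worth flagging: strategy2.replaceAll("[", ",") discards its return value (JavaScript strings are immutable), so strategy 2 as committed appears to feed the parser only the text after the last "[" rather than a merged array.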
src/lib/dirtyCaptionCleaner.ts  ADDED

@@ -0,0 +1,3 @@
+export function dirtyCaptionCleaner(input: string) {
+  return input.split(":").pop()?.trim() || ""
+}
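The helper keeps only what follows the last colon, which strips the "Panel 1:" style prefixes chat models tend to prepend. Expected behavior (my examples, not from the repo):

dirtyCaptionCleaner("Panel 1: A samurai walks into town")  // "A samurai walks into town"
dirtyCaptionCleaner("A quiet morning")                     // unchanged: no colon to split on
dirtyCaptionCleaner("")                                    // "" via the || "" fallback

The trade-off: a caption that legitimately contains a colon loses everything before it.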
src/lib/dirtyLLMJsonParser.ts  ADDED

@@ -0,0 +1,15 @@
+import { LLMResponse } from "@/types"
+
+export function dirtyLLMJsonParser(input: string): string[] {
+  // we only keep what's after the first [
+  let jsonOrNot = `[${input.split("[").pop() || ""}`
+
+  // and before the first ]
+  jsonOrNot = `${jsonOrNot.split("]").shift() || ""}]`
+
+  const jsonData = JSON.parse(jsonOrNot) as LLMResponse
+
+  const captions = jsonData.map(item => item.caption.trim())
+
+  return captions
+}
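The parser assumes a single JSON array buried in surrounding chatter: it keeps the text after the opening "[" (despite the comment, split("[").pop() takes what follows the last "["), cuts at the first "]" of that remainder, then parses. A quick illustration (assumed input/output, not from the commit):

const raw = `Here you go!
[ { "panel": 1, "caption": "Scene 1: A samurai at dawn" } ]
Hope this helps.`

dirtyLLMJsonParser(raw)  // ["Scene 1: A samurai at dawn"]

A caption that itself contains "[" or "]" will still defeat it; that failure mode is what the strategy-2 repair in getStory.ts tries to catch.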
src/lib/dirtyLLMResponseCleaner.ts  ADDED

@@ -0,0 +1,8 @@
+export function dirtyLLMResponseCleaner(input: string) {
+  return (
+    `${input || ""}`
+    .replaceAll("}}", "}")
+    .replaceAll("]]", "]")
+    .replaceAll(",,", ",")
+  )
+}
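The cleaner targets one specific failure mode: models that double their closing tokens. A sanity check (my example):

dirtyLLMResponseCleaner('[{"panel": 1, "caption": "A samurai"}},, {"panel": 2, "caption": "A crowd"}]]')
// '[{"panel": 1, "caption": "A samurai"}, {"panel": 2, "caption": "A crowd"}]'

It is deliberately "dirty": a legitimately nested structure ending in }} would be mangled too, which is acceptable here because the expected payload is a flat array of {panel, caption} objects that never ends in doubled braces.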
src/types.ts  CHANGED

@@ -78,3 +78,5 @@ export interface ImageAnalysisResponse {
   result: string
   error?: string
 }
+
+export type LLMResponse = Array<{panel: number; caption: string }>