taesiri committed
Commit 3192fb4
1 Parent(s): 0c17050
Files changed (1):
  1. app.py +7 -22
app.py CHANGED
@@ -29,7 +29,7 @@ login(token=os.environ["HF_TOKEN"])
 
 # Load model and processor (do this outside the inference function to avoid reloading)
 base_model_path = "meta-llama/Llama-3.2-11B-Vision-Instruct"
-lora_weights_path = "taesiri/BungsBunny-LLama-3.2-11B-Vision-Instruct-Medium"
+lora_weights_path = "taesiri/BugsBunny-LLama-3.2-11B-Vision-Instruct-Medium"
 
 processor = AutoProcessor.from_pretrained(base_model_path)
 model = MllamaForConditionalGeneration.from_pretrained(
@@ -48,10 +48,7 @@ def parse_json_response(json_str):
 
     try:
         # Debug original input
-        print(
-            "DEBUG: Raw JSON input:",
-            json_str[:200] + "..." if len(json_str) > 200 else json_str,
-        )
+        print("DEBUG: Raw JSON input:", json_str)
 
         # Handle potential JSON string escaping
         json_str = json_str.strip()
@@ -59,17 +56,11 @@ def parse_json_response(json_str):
             print("DEBUG: Removing outer quotes")
             json_str = json_str[1:-1]
 
+        # First parse - handles the outer JSON encoding
         first_parse = json.loads(json_str)
         print("DEBUG: First parse result type:", type(first_parse))
-        print(
-            "DEBUG: First parse content:",
-            (
-                str(first_parse)[:200] + "..."
-                if len(str(first_parse)) > 200
-                else str(first_parse)
-            ),
-        )
 
+        # Second parse - if the result is still a string, parse again
         json_object = (
             json.loads(first_parse) if isinstance(first_parse, str) else first_parse
         )
@@ -178,17 +169,11 @@ def inference(image):
 
     # Decode output
     result = processor.decode(output[0], skip_special_tokens=True)
-    print(
-        "DEBUG: Full decoded output:",
-        result[:200] + "..." if len(result) > 200 else result,
-    )
+    print("DEBUG: Full decoded output:", result)
 
     try:
         json_str = result.strip().split("assistant\n")[1].strip()
-        print(
-            "DEBUG: Extracted JSON string after split:",
-            json_str[:200] + "..." if len(json_str) > 200 else json_str,
-        )
+        print("DEBUG: Extracted JSON string after split:", json_str)
     except Exception as e:
         print("DEBUG: Error splitting response:", e)
         return ["Error extracting JSON from response"] * 8 + [
@@ -224,7 +209,7 @@ def inference(image):
 
 # Update Gradio interface
 with gr.Blocks() as demo:
-    gr.Markdown("# BungsBunny-LLama-3.2-11B-Base-Medium Demo")
+    gr.Markdown("# BugsBunny-LLama-3.2-11B-Base-Medium Demo")
 
     with gr.Row():
         with gr.Column(scale=1):
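Note: the comments added in parse_json_response describe a double-parse pattern for model output that can arrive JSON-encoded twice. A minimal standalone sketch of that pattern (the helper name is illustrative, not part of app.py):

import json

def parse_possibly_double_encoded(payload):
    # First parse - handles the outer JSON encoding.
    first_parse = json.loads(payload.strip())
    # Second parse - a double-encoded payload decodes to a string of JSON,
    # so parse once more in that case; otherwise return the object as-is.
    return json.loads(first_parse) if isinstance(first_parse, str) else first_parse

# Single- and double-encoded payloads decode to the same object:
assert parse_possibly_double_encoded('{"a": 1}') == {"a": 1}
assert parse_possibly_double_encoded(json.dumps('{"a": 1}')) == {"a": 1}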