Spaces:

banao-tech
/

omniapi

Sleeping

gauthambalraj07@gmail.com committed on Feb 4

Commit

3dc870c

1 Parent(s): 707dfbd

fix yolo call

Files changed (4) hide show

main.py CHANGED Viewed

@@ -36,6 +36,9 @@ try:
 except:
     yolo_model = torch.load("weights/icon_detect/best.pt", map_location="cpu", weights_only=False)["model"]
 from transformers import AutoProcessor, AutoModelForCausalLM
 import torch

 except:
     yolo_model = torch.load("weights/icon_detect/best.pt", map_location="cpu", weights_only=False)["model"]
+print(f"YOLO model type: {type(yolo_model)}")
 from transformers import AutoProcessor, AutoModelForCausalLM
 import torch

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
-torch==2.0.1
 easyocr
 torchvision
 supervision==0.18.0

+torch==2.2.2
 easyocr
 torchvision
 supervision==0.18.0

test.ipynb CHANGED Viewed

@@ -2,7 +2,7 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 3,
    "metadata": {},
    "outputs": [
     {
@@ -11,8 +11,8 @@
      "text": [
       "Processing imscdr_ac_in___8.png...\n",
       "Status Code: 500\n",
-      "Response Text: {\"detail\":\"BaseModel.predict() got an unexpected keyword argument 'source'\"}\n",
-      "Finished processing imscdr_ac_in___8.png in 43.56 seconds\n",
       "Processing imscdr_ac_in___9.png...\n",
       "Status Code: 500\n",
       "Response Text: <!DOCTYPE html>\n",
@@ -124,7 +124,7 @@
       "</body>\n",
       "</html>\n",
       "\n",
-      "Finished processing imscdr_ac_in___9.png in 9.98 seconds\n",
       "{}\n"
      ]
     }

  "cells": [
   {
    "cell_type": "code",
+   "execution_count": 4,
    "metadata": {},
    "outputs": [
     {
      "text": [
       "Processing imscdr_ac_in___8.png...\n",
       "Status Code: 500\n",
+      "Response Text: {\"detail\":\"BaseModel.predict() got an unexpected keyword argument 'conf'\"}\n",
+      "Finished processing imscdr_ac_in___8.png in 10.38 seconds\n",
       "Processing imscdr_ac_in___9.png...\n",
       "Status Code: 500\n",
       "Response Text: <!DOCTYPE html>\n",
       "</body>\n",
       "</html>\n",
       "\n",
+      "Finished processing imscdr_ac_in___9.png in 10.32 seconds\n",
       "{}\n"
      ]
     }

utils.py CHANGED Viewed

@@ -378,19 +378,14 @@ def predict_yolo(model, image_path, box_threshold, imgsz, scale_img, iou_thresho
     """ Use huggingface model to replace the original model
     """
     # model = model['model']
     if scale_img:
-        result = model(
-        image_path,
-        conf=box_threshold,
-        imgsz=imgsz,
-        iou=iou_threshold, # default 0.7
-        )
-    else:
-        result = model(
-        image_path,
-        conf=box_threshold,
-        iou=iou_threshold, # default 0.7
-        )
     boxes = result[0].boxes.xyxy#.tolist() # in pixel space
     conf = result[0].boxes.conf
     phrases = [str(i) for i in range(len(boxes))]

     """ Use huggingface model to replace the original model
     """
     # model = model['model']
+    kwargs = {
+        'conf': box_threshold,
+        'iou': iou_threshold,
+    }
     if scale_img:
+        kwargs['imgsz'] = imgsz
+    result = model(image_path, **kwargs)
     boxes = result[0].boxes.xyxy#.tolist() # in pixel space
     conf = result[0].boxes.conf
     phrases = [str(i) for i in range(len(boxes))]