import gradio as gr
import matplotlib.pyplot as plt
from PIL import Image
from ultralyticsplus import YOLO
import cv2
import numpy as np
from transformers import pipeline
import requests
from io import BytesIO
import os

model = YOLO('best (1).pt')
name = ['grenade','knife','pistol','rifle']
image_directory = "/home/user/app/image"
video_directory = "/home/user/app/video"

# url_example="https://drive.google.com/file/d/1bBq0bNmJ5X83tDWCzdzHSYCdg-aUL4xO/view?usp=drive_link"
# url_example='https://drive.google.com/uc?id=' + url_example.split('/')[-2]
# r = requests.get(url_example)
# im1 = Image.open(BytesIO(r.content))

# url_example="https://drive.google.com/file/d/16Z7QzvZ99fbEPj1sls_jOCJBsC0h_dYZ/view?usp=drive_link"
# url_example='https://drive.google.com/uc?id=' + url_example.split('/')[-2]
# r = requests.get(url_example)
# im2 = Image.open(BytesIO(r.content))

# url_example="https://drive.google.com/file/d/13mjTMS3eR0AKYSbV-Fpb3fTBno_T42JN/view?usp=drive_link"
# url_example='https://drive.google.com/uc?id=' + url_example.split('/')[-2]
# r = requests.get(url_example)
# im3 = Image.open(BytesIO(r.content))

# url_example="https://drive.google.com/file/d/1-XpFsa_nz506Ul6grKElVJDu_Jl3KZIF/view?usp=drive_link"
# url_example='https://drive.google.com/uc?id=' + url_example.split('/')[-2]
# r = requests.get(url_example)
# im4 = Image.open(BytesIO(r.content))
 # for i, r in enumerate(results):
      
 #    # Plot results image
 #      im_bgr = r.plot()  
 #      im_rgb = im_bgr[..., ::-1]  # Convert BGR to RGB

def response(image):
  print(image)
  results = model(image)
  text = ""
  name_weap = ""
    
  for r in results:
    conf = np.array(r.boxes.conf)
    cls = np.array(r.boxes.cls)
    cls = cls.astype(int)
    xywh = np.array(r.boxes.xywh)
    xywh = xywh.astype(int)  
      
    for con, cl, xy in zip(conf, cls, xywh):
        cone = con.astype(float)
        conef = round(cone,3)
        conef = conef * 100
        text += (f"Detected {name[cl]} with confidence {round(conef,1)}% at ({xy[0]},{xy[1]})\n")
        
        if cl == 0:
            name_weap += name[cl] + '\n'
        elif cl == 1:
            name_weap += name[cl] + '\n'
        elif cl == 2:
            out = model2(image)
            name_weap += out[0]["label"] + '\n'
        elif cl == 3:
            out = model2(image)
            name_weap += out[0]["label"] + '\n'

        
    # im_rgb = Image.fromarray(im_rgb)
    
      
    return name_weap, text


def response2(image: gr.Image = None,image_size: gr.Slider = 640, conf_threshold: gr.Slider = 0.3, iou_threshold: gr.Slider = 0.6):

    results = model.predict(image, conf=conf_threshold, iou=iou_threshold, imgsz=image_size)
    
    box = results[0].boxes

    for r in results:
        im_array = r.plot()
        im = Image.fromarray(im_array[..., ::-1])

   
    model2 = pipeline('image-classification','Kaludi/csgo-weapon-classification')
    weapon_name, text_detection = response(image)
   
    
    # xywh = int(results.boxes.xywh)
    # x = xywh[0]
    # y = xywh[1]
           
    return im, text_detection, weapon_name


inputs = [
    gr.Image(type="pil",  label="Input Image"),
    gr.Slider(minimum=320, maximum=1280, value=640,
                     step=32, label="Image Size"),
    gr.Slider(minimum=0.0, maximum=1.0, value=0.3,
                     step=0.05, label="Confidence Threshold"),
    gr.Slider(minimum=0.0, maximum=1.0, value=0.6,
                     step=0.05, label="IOU Threshold"),
]

outputs = [gr.Image( type="pil", label="Output Image"),
           gr.Textbox(label="Result"),
           gr.Textbox(label="Weapon Name")
          ]

examples = [[os.path.join(image_directory, "th (5).jpg"),640, 0.3, 0.6],
            [os.path.join(image_directory, "th (8).jpg"),640, 0.3, 0.6],
            [os.path.join(image_directory, "th (11).jpg"),640, 0.3, 0.6],
            [os.path.join(image_directory, "th (3).jpg"),640, 0.3, 0.6]
           ]
title = 'Weapon Detection Finetuned YOLOv8'
description = 'Image Size: Defines the image size for inference.\nConfidence Treshold: Sets the minimum confidence threshold for detections.\nIOU Treshold: Intersection Over Union (IoU) threshold for Non-Maximum Suppression (NMS). Useful for reducing duplicates.'


def pil_to_cv2(pil_image):
    open_cv_image = cv2.cvtColor(np.array(pil_image), cv2.COLOR_RGB2BGR)
    return open_cv_image


def process_video(video_path):
    cap = cv2.VideoCapture(video_path)
    
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            breakformat
        
        pil_img = Image.fromarray(frame[..., ::-1])  
        result = model.predict(source=pil_img)
        for r in result:
            im_array = r.plot()
            processed_frame = Image.fromarray(im_array[..., ::-1])  
        yield processed_frame
    cap.release()


video_iface = gr.Interface(
    fn=process_video,
    inputs=[
        gr.Video(label="Upload Video", interactive=True)
    ],
    outputs=gr.Image(type="pil",label="Result"),
    title=title,
    description="Upload video for inference.",
    examples=[[os.path.join(video_directory, "ExampleRifle.mp4")],
        [os.path.join(video_directory, "Knife.mp4")],
    ]
)


image_iface = gr.Interface(fn=response2, inputs=inputs, outputs=outputs, examples=examples, title=title, description=description)

demo = gr.TabbedInterface([image_iface, video_iface], ["Image Inference", "Video Inference"])

if __name__ == '__main__':
    demo.launch()