Spaces:

oliverlevn
/

ocean_faster_RCNN

Build error

App Files Files Community

ocean_faster_RCNN / app.py

oliverlevn

remove resize

bb029d9 over 1 year ago

raw

history blame contribute delete

4.04 kB

	import gradio
	import torch
	import torchvision.transforms as T
	import numpy as np
	import matplotlib.pyplot as plt
	import os
	import random
	import PIL.Image as Image
	import time
	from model import create_fasterrcnn_model

	# Category table for the detector. `predict` indexes this list directly with
	# the integer labels returned by the model, so each entry's position must
	# equal its "id". Entry 0 is the root "creatures" category; every other
	# entry is a concrete class whose supercategory is "creatures".
	categories = [{"id": 0, "name": "creatures", "supercategory": "none"}] + [
	    {"id": class_id, "name": class_name, "supercategory": "creatures"}
	    for class_id, class_name in enumerate(
	        (
	            "fish",
	            "jellyfish",
	            "penguin",
	            "puffin",
	            "shark",
	            "starfish",
	            "stingray",
	        ),
	        start=1,
	    )
	]



	# Heading and blurb passed to the Gradio interface
	title = "Ocean creatures detection Faster-R-CNN"
	description = "A Faster-RCNN-ResNet-50 backbone feature extractor computer vision model to classify images of fish, penguin, shark, etc"

	# Instantiate the detector with 8 output classes (one per `categories` entry)
	faster_rcnn = create_fasterrcnn_model(num_classes=8)

	# Restore the trained parameters, mapping every tensor onto the CPU
	faster_rcnn.load_state_dict(
	    torch.load("./third_train.pth", map_location=torch.device("cpu"))
	)
	import random
	# Create predict function
	def predict(img):
	    """Run the detector on one image and save a rendering of its detections.

	    The image is converted to a tensor, passed through the module-level
	    ``faster_rcnn`` model on CPU, and every detection whose score is above
	    0.5 is drawn as a red rectangle with a ``name: score`` caption on top of
	    the input image. The annotated figure is written to a PNG file.

	    Args:
	        img: The input image as delivered by the Gradio image input; it must
	            be accepted by both ``T.ToPILImage`` and ``Axes.imshow``.

	    Returns:
	        A ``(img_path, pred_time)`` tuple: the path of the saved PNG and the
	        elapsed wall-clock time in seconds (rounded to 5 decimals) as a
	        string.
	    """
	    # Local import: only this function needs it, and it keeps the edit
	    # self-contained.
	    import tempfile

	    # Start the timer
	    start_time = time.time()
	    device = 'cpu'

	    # Round-trip through PIL so ToTensor yields a CHW float tensor, then add
	    # the batch dimension the model expects.
	    transform = T.Compose([T.ToPILImage(), T.ToTensor()])
	    image_tensor = transform(img).to(device).unsqueeze(0)

	    faster_rcnn.eval()
	    with torch.no_grad():
	        predictions = faster_rcnn(image_tensor)

	    detections = predictions[0]
	    pred_boxes = detections['boxes'].cpu().numpy()
	    pred_scores = detections['scores'].cpu().numpy()
	    pred_labels = detections['labels'].cpu().numpy()
	    # Labels are used as positions in the module-level `categories` list.
	    label_names = [categories[label]['name'] for label in pred_labels]

	    fig, ax = plt.subplots(1)
	    try:
	        ax.imshow(img)
	        for box, score, label_name in zip(pred_boxes, pred_scores, label_names):
	            if score <= 0.5:
	                continue  # keep only confident detections
	            x1, y1, x2, y2 = box
	            rect = plt.Rectangle(
	                (x1, y1), x2 - x1, y2 - y1,
	                fill=False, edgecolor='red', linewidth=2,
	            )
	            ax.add_patch(rect)
	            ax.text(
	                x1, y1, f'{label_name}: {score:.2f}',
	                fontsize=5, color='white',
	                bbox=dict(facecolor='red', alpha=0.2),
	            )

	        # Reserve a unique file name; a random name out of only 100
	        # possibilities let separate requests overwrite each other's output.
	        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
	            img_path = tmp.name
	        fig.savefig(img_path)
	    finally:
	        # pyplot keeps every figure alive until it is closed explicitly;
	        # without this each request leaks one figure.
	        plt.close(fig)

	    # Calculate the prediction time
	    pred_time = round(time.time() - start_time, 5)

	    # Return the path to the saved image and the prediction time
	    return img_path, str(pred_time)


	### 4. Gradio app ###

	# One single-input example per file in "examples/". Sorted so the order is
	# stable across runs (os.listdir returns entries in arbitrary order); a
	# missing directory yields no examples instead of crashing at import time.
	example_list = (
	    [["examples/" + example] for example in sorted(os.listdir("examples"))]
	    if os.path.isdir("examples")
	    else []
	)

	# Create the Gradio demo. The output components use the top-level
	# `gradio.Image` / `gradio.Label` classes, matching the input component;
	# the legacy `gradio.outputs.*` namespace is deprecated and absent from
	# newer Gradio releases.
	demo = gradio.Interface(
	    fn=predict,  # maps the input image to (annotated image path, time)
	    inputs=gradio.Image(type="numpy"),
	    outputs=[
	        gradio.Image(type="filepath", label="Image with Bounding Boxes"),
	        gradio.Label(label="Prediction Time"),
	    ],  # predict returns two values, one per output component
	    examples=example_list or None,  # None when there are no examples
	    title=title,
	    description=description,
	)

	# Launch the demo!
	demo.launch(debug=True)