Spaces:

sabaridsnfuji
/

Symbol_SpottingonDigital_Architectural_FloorPlans_Using_objectdetection

Running

App Files Files Community

Symbol_SpottingonDigital_Architectural_FloorPlans_Using_objectdetection / app.py

sabaridsnfuji

Update app.py

e00ea77 verified 2 months ago

raw

history blame

4.06 kB

	# -- coding: utf-8 --
	"""
	Created on Wed Nov 13 18:37:31 2024
	@author: sabar
	"""

	import gradio as gr
	import cv2
	import numpy as np
	import os
	import json
	from openvino.runtime import Core # Assuming you're using OpenVINO
	from tf_post_processing import non_max_suppression # Assuming this is defined elsewhere
	from PIL import Image

	# Load the OpenVINO model
	classification_model_xml = "./model/best.xml"
	core = Core()
	config = {
	"INFERENCE_NUM_THREADS": 2,
	"ENABLE_CPU_PINNING": True
	}
	model = core.read_model(model=classification_model_xml)
	compiled_model = core.compile_model(model=model, device_name="CPU", config=config)

	label_to_class_text = {
	0: 'range',
	1: 'entry door',
	2: 'kitchen sink',
	3: 'bathroom sink',
	4: 'toilet',
	5: 'double folding door',
	6: 'window',
	7: 'shower',
	8: 'bathtub',
	9: 'single folding door',
	10: 'dishwasher',
	11: 'refrigerator'
	}

	# Function to perform inference
	def predict_image(image):
	# Convert the Pillow image to a NumPy array and BGR format for OpenCV
	image = np.array(image.convert("RGB"))
	image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

	# Resize, preprocess, and reshape the input image
	img_size = 960
	resized_image = cv2.resize(image, (img_size, img_size)) / 255.0
	resized_image = resized_image.transpose(2, 0, 1)
	reshaped_image = np.expand_dims(resized_image, axis=0).astype(np.float32)

	im_height, im_width, _ = image.shape
	output_numpy = compiled_model(reshaped_image)[0]
	results = non_max_suppression(output_numpy, conf_thres=0.2, iou_thres=0.6, max_wh=15000)[0]

	# Prepare output paths
	output_path = "./output_file_train/"
	output_image_folder = os.path.join(output_path, "images_alienware_openvino/")
	os.makedirs(output_image_folder, exist_ok=True)

	output_json_folder = os.path.join(output_path, "json_output/")
	os.makedirs(output_json_folder, exist_ok=True)

	predictions = []

	# Draw boxes and collect prediction data
	for result in results:
	boxes = result[:4]
	prob = result[4]
	classes = int(result[5])

	x1, y1, x2, y2 = np.uint16([
	boxes[0] * im_width,
	boxes[1] * im_height,
	boxes[2] * im_width,
	boxes[3] * im_height
	])

	if prob > 0.2:
	cv2.rectangle(image, (x1, y1), (x2, y2), (255, 255, 0), 2)
	label_text = f"{classes} {round(prob, 2)}"
	cv2.putText(image, label_text, (x1, y1), 0, 0.5, (0, 255, 0), 2)

	# Store prediction info in a JSON-compatible format
	predictions.append({
	"class": label_to_class_text[classes],
	"probability": round(float(prob), 2),
	"coordinates": {
	"xmin": int(x1),
	"ymin": int(y1),
	"xmax": int(x2),
	"ymax": int(y2)
	}
	})

	# Save the processed image
	output_image_path = os.path.join(output_image_folder, "result_image.jpg")
	cv2.imwrite(output_image_path, image)

	# Convert predictions to a formatted string
	predictions_str = json.dumps(predictions, indent=4)

	return image, predictions_str

	# Define sample images for user convenience
	sample_images = [
	"./sample/10_2.jpg",
	"./sample/10_10.jpg",
	"./sample/10_12.jpg"
	]

	# Set up Gradio interface
	def gradio_interface(image):
	output_image, predictions_str = predict_image(image)
	return output_image, predictions_str

	# Create the Gradio Interface
	gr_interface = gr.Interface(
	fn=gradio_interface,
	inputs=gr.Image(label="Upload or Select an Image", type="pil", examples=sample_images),
	outputs=[gr.Image(label="Result Image"), gr.Textbox(label="Predictions JSON")],
	title="House CAD Design Object Detection",
	description="Upload a CAD design image of a house to detect objects with bounding boxes and probabilities."
	)

	# Launch the Gradio interface if run as main
	if __name__ == "__main__":
	gr_interface.launch()