Spaces:

SeoJunn
/

segmentation3

Sleeping

App Files Files Community

segmentation3 / app.py

SeoJunn

Refactor : detection 코드 주석

bb78b14 10 months ago

raw

history blame

No virus

5.95 kB

	import gradio as gr
	from PIL import Image
	from matplotlib import gridspec
	import matplotlib.pyplot as plt
	import numpy as np
	from transformers import SegformerFeatureExtractor, TFSegformerForSemanticSegmentation
	from transformers import DetrImageProcessor, DetrForObjectDetection
	import torch
	import tensorflow as tf
	from PIL import ImageDraw

	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

	# image segmentation 모델
	feature_extractor = SegformerFeatureExtractor.from_pretrained(
	"nvidia/segformer-b1-finetuned-cityscapes-1024-1024"
	)
	model_segmentation = TFSegformerForSemanticSegmentation.from_pretrained(
	"nvidia/segformer-b1-finetuned-cityscapes-1024-1024"
	)

	# image detection 모델
	# processor_detection = DetrImageProcessor.from_pretrained(
	# "facebook/detr-resnet-50", revision="no_timm"
	# )
	# model_detection = DetrForObjectDetection.from_pretrained(
	# "facebook/detr-resnet-50", revision="no_timm"
	# )


	def ade_palette():
	"""ADE20K 팔레트: 각 클래스를 RGB 값에 매핑해주는 함수입니다."""

	return [
	[204, 87, 92],
	[112, 185, 212],
	[45, 189, 106],
	[234, 123, 67],
	[78, 56, 123],
	[210, 32, 89],
	[90, 180, 56],
	[155, 102, 200],
	[33, 147, 176],
	[255, 183, 76],
	[67, 123, 89],
	[190, 60, 45],
	[134, 112, 200],
	[56, 45, 189],
	[200, 56, 123],
	[87, 92, 204],
	[120, 56, 123],
	[45, 78, 123],
	[45, 123, 67],
	]


	labels_list = []

	with open(r"labels.txt", "r") as fp:
	for line in fp:
	labels_list.append(line[:-1])

	colormap = np.asarray(ade_palette())


	def label_to_color_image(label):
	"""라벨을 컬러 이미지로 변환해주는 함수입니다."""

	if label.ndim != 2:
	raise ValueError("2차원 입력 라벨을 기대합니다.")

	if np.max(label) >= len(colormap):
	raise ValueError("라벨 값이 너무 큽니다.")
	return colormap[label]


	def draw_plot(pred_img, seg):
	"""이미지와 세그멘테이션 결과를 floating 하는 함수입니다."""

	fig = plt.figure(figsize=(20, 15))
	grid_spec = gridspec.GridSpec(1, 2, width_ratios=[6, 1])

	plt.subplot(grid_spec[0])
	plt.imshow(pred_img)
	plt.axis("off")
	LABEL_NAMES = np.asarray(labels_list)
	FULL_LABEL_MAP = np.arange(len(LABEL_NAMES)).reshape(len(LABEL_NAMES), 1)
	FULL_COLOR_MAP = label_to_color_image(FULL_LABEL_MAP)

	unique_labels = np.unique(seg.numpy().astype("uint8"))
	ax = plt.subplot(grid_spec[1])
	plt.imshow(FULL_COLOR_MAP[unique_labels].astype(np.uint8), interpolation="nearest")
	ax.yaxis.tick_right()
	plt.yticks(range(len(unique_labels)), LABEL_NAMES[unique_labels])
	plt.xticks([], [])
	ax.tick_params(width=0.0, labelsize=25)

	return fig


	def sepia(inputs, button_text):
	"""객체 검출 또는 세그멘테이션을 수행하고 결과를 반환하는 함수입니다."""

	input_img = Image.fromarray(inputs)
	# if button_text == "detection":
	# inputs_detection = processor_detection(images=input_img, return_tensors="pt")
	# outputs_detection = model_detection(**inputs_detection)

	# target_sizes = torch.tensor([input_img.size[::-1]])
	# results_detection = processor_detection.post_process_object_detection(
	# outputs_detection, target_sizes=target_sizes, threshold=0.9
	# )[0]

	# draw = ImageDraw.Draw(input_img)
	# for score, label, box in zip(
	# results_detection["scores"],
	# results_detection["labels"],
	# results_detection["boxes"],
	# ):
	# box = [round(i, 2) for i in box.tolist()]
	# label_name = model_detection.config.id2label[label.item()]
	# print(
	# f"Detected {label_name} with confidence "
	# f"{round(score.item(), 3)} at location {box}"
	# )
	# draw.rectangle(box, outline="red", width=3)
	# draw.text((box[0], box[1]), label_name, fill="red", font=None)

	# fig = plt.figure(figsize=(20, 15))
	# plt.imshow(input_img)
	# plt.axis("off")
	# return fig

	if button_text == "segmentation":
	inputs_segmentation = feature_extractor(images=input_img, return_tensors="tf")
	outputs_segmentation = model_segmentation(**inputs_segmentation)
	logits_segmentation = outputs_segmentation.logits

	logits_segmentation = tf.transpose(logits_segmentation, [0, 2, 3, 1])
	logits_segmentation = tf.image.resize(logits_segmentation, input_img.size[::-1])
	seg = tf.math.argmax(logits_segmentation, axis=-1)[0]

	color_seg = np.zeros((seg.shape[0], seg.shape[1], 3), dtype=np.uint8)
	for label, color in enumerate(colormap):
	color_seg[seg.numpy() == label, :] = color

	pred_img = np.array(input_img) * 0.5 + color_seg * 0.5
	pred_img = pred_img.astype(np.uint8)

	fig = draw_plot(pred_img, seg)
	return fig

	return "Please select 'detection' or 'segmentation'."

	def on_button_click(inputs):
	"""버튼 클릭 이벤트 핸들러"""
	image_path, selected_option = inputs
	if selected_option == "dropout":
	# 'dropout'이면 두 가지 중에 하나를 랜덤으로 선택
	selected_option = np.random.choice(["segmentation"])

	return sepia(image_path, selected_option)

	# Gr.Dropdown을 사용하여 옵션을 선택할 수 있도록 변경
	dropdown = gr.Dropdown(
	["segmentation"], label="Menu", info="Chose Segmentation!"
	)

	demo = gr.Interface(
	fn=sepia,
	inputs=[gr.Image(shape=(400, 600)), dropdown],
	outputs=["plot"],
	examples=[
	["01.jpg", "Click me"],
	["02.jpeg", "Click me"],
	["03.jpeg", "Click me"],
	["04.jpeg", "Click me"],
	],
	allow_flagging="never",
	)

	demo.launch()