Spaces:

MinhNH232331M
/

Neural_painting

Running

App Files Community

Neural_painting / app.py

minhnh

Fix bug import wrong dep

e0b460b 7 months ago

raw

history blame

9.77 kB

	import gradio as gr
	import os
	import cv2
	import torch
	import numpy as np
	import argparse
	import torch.nn as nn
	import torch.nn.functional as F
	import gc
	from baseline.DRL.actor import *
	from baseline.Renderer.stroke_gen import *
	from baseline.Renderer.model import *

	# Run on the GPU when one is available, otherwise fall back to the CPU.
	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
	# Side length, in pixels, of the square canvas the actor and renderer operate on.
	width = 128

	# Checkpoints of the stroke model that is loaded eagerly at start-up.
	actor_path = 'ckpts/actor.pkl'
	renderer_path = 'ckpts/renderer.pkl'

	# The input is split into a divide x divide grid of width x width patches.
	divide = 4
	canvas_cnt = divide * divide

	# Deserialize onto the CPU first and move to `device` afterwards: without
	# map_location a checkpoint saved from CUDA cannot be loaded on a CPU-only
	# host. This matches what load_model_if_needed() does for the other models.
	Decoder = FCN()
	Decoder.load_state_dict(torch.load(renderer_path, map_location="cpu"))
	actor = ResNet(9, 18, 65)  # action_bundle = 5, 65 = 5 * 13
	actor.load_state_dict(torch.load(actor_path, map_location="cpu"))
	actor = actor.to(device).eval()
	Decoder = Decoder.to(device).eval()

	# Registries of loaded models, keyed by the stroke-choice label.
	decoders = {"Default": Decoder}
	actors = {"Default": actor}

	def decode(x, canvas, decoder = Decoder): # b * (10 + 3)
	    """Paint one bundle of five strokes onto ``canvas``.

	    ``x`` is viewed as rows of 13 values: the first 10 are passed to
	    ``decoder`` and the last 3 scale the rendered stroke per colour channel.

	    Returns:
	        ``(canvas, res)`` where ``canvas`` is the canvas after all five
	        strokes and ``res`` lists the canvas after each individual stroke.
	    """
	    params = x.view(-1, 10 + 3)
	    shape_params = params[:, :10]
	    rgb = params[:, -3:]

	    # The decoder output is inverted to obtain the stroke mask.
	    mask = (1 - decoder(shape_params)).view(-1, width, width, 1)
	    tinted = mask * rgb.view(-1, 1, 1, 3)

	    # Channels-last -> channels-first, then group the strokes in fives.
	    mask = mask.permute(0, 3, 1, 2).view(-1, 5, 1, width, width)
	    tinted = tinted.permute(0, 3, 1, 2).view(-1, 5, 3, width, width)

	    res = []
	    for k in range(5):
	        # Clear the area under the stroke, then add the coloured stroke.
	        canvas = canvas * (1 - mask[:, k]) + tinted[:, k]
	        res.append(canvas)

	    # Release intermediate buffers before the next call.
	    gc.collect()
	    if torch.cuda.is_available():
	        torch.cuda.empty_cache()
	    return canvas, res

	def small2large(x):
	    """Stitch ``divide * divide`` patches back into one large image.

	    (d * d, width, width, C) -> (d * width, d * width, C)
	    """
	    side = divide * width
	    grid = x.reshape(divide, divide, width, width, -1)
	    # Interleave patch rows with pixel rows so the final reshape tiles them.
	    return grid.transpose(0, 2, 1, 3, 4).reshape(side, side, -1)

	def large2small(x):
	    """Cut one large 3-channel image into ``divide * divide`` patches.

	    (d * width, d * width, 3) -> (d * d, width, width, 3)
	    """
	    tiles = x.reshape(divide, width, divide, width, 3)
	    # Bring the two patch-index axes to the front before flattening them.
	    return tiles.transpose(0, 2, 1, 3, 4).reshape(canvas_cnt, width, width, 3)

	def smooth(img):
	    """Average the pixels along patch seams with their 3x3 neighbourhood.

	    For every patch, the pixels of its last column and last row, plus the
	    first column/row of the following patch, are replaced by the mean of the
	    pixel and its eight neighbours. ``img`` is modified in place and also
	    returned. Pixels on the outer border of the image are left untouched.
	    """
	    last = divide * width - 1
	    # Neighbour offsets, visited in a fixed order so that the floating-point
	    # sum is accumulated identically on every run.
	    neighbours = (
	        (1, 0), (0, 1), (-1, 0), (0, -1),
	        (1, -1), (-1, 1), (-1, -1), (1, 1),
	    )

	    def blend(row, col):
	        # Border pixels have no complete 3x3 neighbourhood.
	        if row in (0, last) or col in (0, last):
	            return
	        total = img[row, col]
	        for d_row, d_col in neighbours:
	            total = total + img[row + d_row, col + d_col]
	        img[row, col] = total / 9

	    for p in range(divide):
	        top = p * width
	        for q in range(divide):
	            left = q * width
	            # Vertical seam on the right-hand side of this patch.
	            for k in range(width):
	                blend(top + k, left + width - 1)
	                if q != divide - 1:
	                    blend(top + k, left + width)
	            # Horizontal seam at the bottom of this patch.
	            for k in range(width):
	                blend(top + width - 1, left + k)
	                if p != divide - 1:
	                    blend(top + width, left + k)
	    return img

	def save_img(res, imgid, origin_shape, output_name, divide=False):
	    """Write a canvas tensor to ``<output_name>/<imgid>.jpg``.

	    Args:
	        res: canvas tensor, channels-first (d * d, 3, width, width).
	        imgid: value used as the file stem.
	        origin_shape: size passed to ``cv2.resize`` for the saved image.
	        output_name: directory prefix of the output file.
	        divide: when true the batch is stitched into one image and its seams
	            are smoothed; otherwise only the first canvas is saved.
	    """
	    frames = np.transpose(res.detach().cpu().numpy(), (0, 2, 3, 1))
	    picture = smooth(small2large(frames)) if divide else frames[0]
	    picture = cv2.resize((picture * 255).astype('uint8'), origin_shape)
	    target = output_name + "/" + str(imgid) + '.jpg'
	    cv2.imwrite(target, picture)





	def _frame_to_image(batch, origin_shape, tiled):
	    """Turn a channels-first canvas batch into a uint8 image of ``origin_shape``."""
	    frame = np.transpose(batch.detach().cpu().numpy(), (0, 2, 3, 1))
	    # Tiled batches hold one canvas per patch and must be stitched together.
	    frame = smooth(small2large(frame)) if tiled else frame[0]
	    frame = (frame * 255).astype('uint8')
	    return cv2.resize(frame, origin_shape)


	def paint_img(img, max_step = 40, model_choices = "Default"):
	    """Paint ``img`` stroke by stroke, yielding the canvas after every stroke.

	    The image is first painted as a whole on a single ``width`` x ``width``
	    canvas. When ``divide != 1`` the step budget is halved, and the result is
	    then refined on a ``divide`` x ``divide`` grid of patches for the same
	    number of steps.

	    Args:
	        img: H x W x 3 image array (presumably uint8 RGB as delivered by
	            ``gr.Image`` - confirm against the caller).
	        max_step: total number of actor steps; each step draws five strokes.
	        model_choices: key of the stroke model in ``decoders`` / ``actors``.

	    Yields:
	        uint8 images resized to the input's original width and height. The
	        last frame is yielded once more at the end.

	    Raises:
	        gr.Error: if no input image was provided.
	    """
	    if img is None:
	        raise gr.Error("Please provide an input image before painting.")

	    # The dropdown normally loads the model on selection; make sure it is
	    # really there instead of failing with a KeyError.
	    load_model_if_needed(model_choices)
	    Decoder = decoders[model_choices]
	    actor = actors[model_choices]
	    max_step = int(max_step)

	    origin_shape = (img.shape[1], img.shape[0])
	    patch_img = cv2.resize(img, (width * divide, width * divide))
	    patch_img = large2small(patch_img)
	    patch_img = np.transpose(patch_img, (0, 3, 1, 2))
	    patch_img = torch.tensor(patch_img).to(device).float() / 255.

	    img = cv2.resize(img, (width, width))
	    img = img.reshape(1, width, width, 3)
	    img = np.transpose(img, (0, 3, 1, 2))
	    img = torch.tensor(img).to(device).float() / 255.

	    T = torch.ones([1, 1, width, width], dtype=torch.float32).to(device)
	    # Coordconv input: channel 0 holds the normalised row index, channel 1
	    # the normalised column index.
	    axis = torch.arange(width, dtype=torch.float32) / (width - 1.)
	    coord = torch.stack([
	        axis.view(width, 1).expand(width, width),
	        axis.view(1, width).expand(width, width),
	    ]).unsqueeze(0).to(device)
	    canvas = torch.zeros([1, 3, width, width]).to(device)

	    if divide != 1:
	        max_step = max_step // 2

	    output = None
	    for i in range(max_step):
	        # Grad mode is thread-local, so it is disabled only around the model
	        # calls and never held while the generator is suspended.
	        with torch.no_grad():
	            stepnum = T * i / max_step
	            actions = actor(torch.cat([canvas, img, stepnum, coord], 1))
	            canvas, res = decode(actions, canvas, Decoder)
	        for stroke_canvas in res:
	            output = _frame_to_image(stroke_canvas, origin_shape, tiled=False)
	            yield output

	    if divide != 1:
	        # Upscale the coarse painting and continue on every patch in parallel.
	        canvas = canvas[0].detach().cpu().numpy()
	        canvas = np.transpose(canvas, (1, 2, 0))
	        canvas = cv2.resize(canvas, (width * divide, width * divide))
	        canvas = large2small(canvas)
	        canvas = np.transpose(canvas, (0, 3, 1, 2))
	        canvas = torch.tensor(canvas).to(device).float()
	        coord = coord.expand(canvas_cnt, 2, width, width)
	        T = T.expand(canvas_cnt, 1, width, width)
	        for i in range(max_step):
	            with torch.no_grad():
	                stepnum = T * i / max_step
	                actions = actor(torch.cat([canvas, patch_img, stepnum, coord], 1))
	                canvas, res = decode(actions, canvas, Decoder)
	            for stroke_canvas in res:
	                output = _frame_to_image(stroke_canvas, origin_shape, tiled=True)
	                yield output

	    # Repeat the final frame; skipped when no step was executed at all.
	    if output is not None:
	        yield output


	def load_model_if_needed(choice: str):
	    """Load the actor and renderer for ``choice`` unless already registered.

	    Loaded models are stored in the module-level ``actors`` and ``decoders``
	    dictionaries under ``choice``. Any label other than "Default",
	    "Triangle" or "Round" uses the "notrans" checkpoints.
	    """
	    # label -> (actor checkpoint, renderer checkpoint)
	    checkpoints = {
	        "Default": ('ckpts/actor.pkl', 'ckpts/renderer.pkl'),
	        "Triangle": ('ckpts/actor_triangle.pkl', 'ckpts/triangle.pkl'),
	        "Round": ('ckpts/actor_round.pkl', 'ckpts/round.pkl'),
	    }
	    fallback = ('ckpts/actor_notrans.pkl', 'ckpts/bezierwotrans.pkl')
	    actor_ckpt, renderer_ckpt = checkpoints.get(choice, fallback)

	    if choice not in decoders:
	        renderer = FCN()
	        renderer.load_state_dict(torch.load(renderer_ckpt, map_location= "cpu"))
	        decoders[choice] = renderer.to(device).eval()

	    if choice not in actors:
	        policy = ResNet(9, 18, 65) # action_bundle = 5, 65 = 5 * 13
	        policy.load_state_dict(torch.load(actor_ckpt, map_location= "cpu"))
	        actors[choice] = policy.to(device).eval()




	from typing import Generator, Optional


	def wrapper(func):
	    """Wrap the generator function ``func`` so a button label can start or stop it.

	    The returned generator function takes the button label as its first
	    positional argument, followed by the arguments for ``func``:

	    * label ``"Cancel"`` (the button was just switched from "Paint" to
	      "Cancel"): start ``func`` with the remaining arguments and re-yield
	      everything it produces.
	    * any other label: close the most recently started run and yield a
	      single ``None``. Nothing is yielded when there is no run to close or
	      when closing fails.

	    The handle of the last run is shared by every call of the returned
	    function.
	    """
	    event: Optional[Generator] = None

	    def inner(*args, **kwargs):
	        nonlocal event
	        val = args[0]
	        if val == "Cancel":
	            event = func(*args[1:], **kwargs)
	            yield from event
	            return

	        if event is None:
	            return
	        try:
	            event.close()
	        except Exception:
	            # Best effort: close() raises ValueError while the run is being
	            # executed by another thread, and re-raises whatever the run's
	            # own clean-up raises. Neither should surface to the caller.
	            return
	        yield

	    return inner


	# Sample inputs offered below the interface.
	examples = [
	    ["image/chaoyue.png"],
	    ["image/degang.png"],
	    ["image/JayChou.png"],
	    ["image/Leslie.png"],
	    ["image/mayun.png"],
	]

	# Created up front so the clear button can reference it; it is rendered
	# inside the layout further down.
	output = gr.Image(label="Painting Result")

	with gr.Blocks() as demo:
	    with gr.Row():
	        # Left column: input image and controls.
	        with gr.Column():
	            input_image = gr.Image(label="Input image")
	            with gr.Row():
	                step = gr.Slider(
	                    minimum=20,
	                    maximum=100,
	                    value=40,
	                    step=1,
	                    label='Painting step',
	                )
	            with gr.Row():
	                dropdown = gr.Dropdown(
	                    choices=['Default', 'Round', 'Triangle', 'Bezier wo trans'],
	                    value='Default',
	                    label='Stroke choice',
	                )
	            with gr.Row():
	                with gr.Column():
	                    clr_btn = gr.ClearButton(
	                        components=[input_image, output],
	                        variant="stop",
	                    )
	                with gr.Column():
	                    translate_btn = gr.Button(value="Paint", variant="primary")

	        # Right column: the painting as it progresses.
	        with gr.Column():
	            output.render()

	    # Load the selected stroke model as soon as it is picked.
	    dropdown.select(fn=load_model_if_needed, inputs=dropdown)

	    # A click first flips the button label, then runs (or cancels) the
	    # painting depending on the new label, and finally resets the button.
	    click_event = (
	        translate_btn.click(
	            lambda x: gr.Button(value="Cancel", variant="stop") if x == "Paint" else gr.Button(value="Paint", variant="primary"),
	            translate_btn,
	            translate_btn,
	        )
	        .then(
	            wrapper(paint_img),
	            inputs=[translate_btn, input_image, step, dropdown],
	            outputs=output,
	            trigger_mode='multiple',
	        )
	        .then(
	            lambda x: gr.Button(value="Paint", variant="primary"),
	            translate_btn,
	            translate_btn,
	        )
	    )
	    clr_btn.click(fn=None, inputs=None, cancels=[click_event])
	    examples = gr.Examples(
	        examples=examples,
	        inputs=[input_image],
	        cache_examples=False,
	    )

	# demo = gr.Interface(fn=paint_img, inputs=gr.Image(), outputs="image", examples = examples)
	demo.queue(default_concurrency_limit=4)
	demo.launch(server_name="0.0.0.0")