SadTalker

Paused

SadTalker / src /utils /paste_pic.py

tts

416263d over 1 year ago

1.58 kB

	import cv2, os
	import numpy as np
	from tqdm import tqdm
	import uuid

	def paste_pic(video_path, pic_path, crop_info, new_audio_path, full_video_path):

	full_img = cv2.imread(pic_path)
	print(full_img.dtype)
	frame_h = full_img.shape[0]
	frame_w = full_img.shape[1]

	video_stream = cv2.VideoCapture(video_path)
	fps = video_stream.get(cv2.CAP_PROP_FPS)
	crop_frames = []
	while 1:
	still_reading, frame = video_stream.read()
	if not still_reading:
	video_stream.release()
	break
	crop_frames.append(frame)

	if len(crop_info) != 3:
	print("you didn't crop the image")
	return
	else:
	r_w, r_h = crop_info[0]
	clx, cly, crx, cry = crop_info[1]
	lx, ly, rx, ry = crop_info[2]
	lx, ly, rx, ry = int(lx), int(ly), int(rx), int(ry)
	oy1, oy2, ox1, ox2 = cly+ly, cly+ry, clx+lx, clx+rx

	tmp_path = str(uuid.uuid4())+'.mp4'
	out_tmp = cv2.VideoWriter(tmp_path, cv2.VideoWriter_fourcc(*'MP4V'), fps, (frame_w, frame_h))
	for crop_frame in tqdm(crop_frames, 'seamlessClone:'):
	p = cv2.resize(crop_frame.astype(np.uint8), (r_w, r_h))

	mask = 255*np.ones(p.shape, p.dtype)
	location = ((ox1+ox2) // 2, (oy1+oy2) // 2)
	gen_img = cv2.seamlessClone(p, full_img, mask, location, cv2.NORMAL_CLONE)

	#full_img[oy1:oy2, ox1:ox2] = p
	out_tmp.write(gen_img)
	out_tmp.release()
	cmd = r'ffmpeg -y -i "%s" -i "%s" "%s"' % (tmp_path, new_audio_path, full_video_path)
	os.system(cmd)
	os.remove(tmp_path)