Spaces:

fffiloni
/

EchoMimic

Running on L40S

App Files Files Community

EchoMimic / src /utils /img_utils.py

fffiloni

Upload 184 files

03a856a verified 4 months ago

raw

history blame contribute delete

2.73 kB

	from PIL import Image
	import cv2
	import numpy as np
	from imageio_ffmpeg import get_ffmpeg_exe
	import pathlib
	import os
	from IPython import embed

	def pil_to_cv2(pil):
	return cv2.cvtColor(np.array(pil).astype(np.uint8), cv2.COLOR_RGB2BGR)

	def cv2_to_pil(cv2_img):
	return Image.fromarray(cv2.cvtColor(cv2_img, cv2.COLOR_BGR2RGB).astype(np.uint8))

	def center_crop_cv2(cv2_pic):
	h, w = cv2_pic.shape[0], cv2_pic.shape[1]
	if h > w:
	return cv2_pic[(h - w) // 2 : (h - w) // 2 + w, :]
	else:
	return cv2_pic[:, (w - h) // 2 : (w - h) // 2 + h]

	def pils_from_video(video_path):
	cap = cv2.VideoCapture(video_path)
	pils = []
	while True:
	ret, frame = cap.read()
	if not ret:
	break

	frame = cv2.resize(center_crop_cv2(frame), (512, 512))
	pils.append(cv2_to_pil(frame))

	return pils

	def save_videos_from_pils(pils, path, fps=24):
	width, height = pils[0].size
	print(width, height)
	fourcc = cv2.VideoWriter_fourcc(*'mp4v')

	pathlib.Path(path).parent.mkdir(exist_ok=True, parents=True)

	output_name = pathlib.Path(path).stem
	temp_output_path = path.replace(output_name, output_name + '-temp')
	videowrite = cv2.VideoWriter(temp_output_path, fourcc, fps, (height, width))
	for pil in pils:
	frame = pil_to_cv2(pil)
	print(frame.shape, frame.min(), frame.max())
	videowrite.write(frame)

	videowrite.release()
	"""
	embed()

	cmd = (f'{get_ffmpeg_exe()} -i "{temp_output_path}"'
	f'-map 0:v -map 1:a -c:v h264 -shortest -y "{path}" -loglevel quiet')
	os.system(cmd)
	os.remove(temp_output_path)
	"""
	def save_video_from_cv2_list(pic_cv2_list, output_path, fps=30.0):
	pathlib.Path(output_path).parent.mkdir(exist_ok=True, parents=True)

	num_frames = len(pic_cv2_list)
	height, width = pic_cv2_list[0].shape[:2]

	#video_tensor = video_tensor[0, ...]
	#_, num_frames, height, width = video_tensor.shape

	output_name = pathlib.Path(output_path).stem
	temp_output_path = output_path.replace(output_name, output_name)
	video_writer = cv2.VideoWriter(temp_output_path, cv2.VideoWriter_fourcc(*'mp4v'), fps, (width, height))

	for i in range(num_frames):
	#frame_tensor = video_tensor[:, i, ...] # [c, h, w]
	#frame_tensor = frame_tensor.permute(1, 2, 0) # [h, w, c]

	#frame_image = (frame_tensor * 255).numpy().astype(np.uint8)
	#frame_image = cv2.cvtColor(frame_image, cv2.COLOR_RGB2BGR)
	frame_image = pic_cv2_list[i].astype(np.uint8)
	video_writer.write(frame_image)

	video_writer.release()


	#ffmpeg -i input_file -c:v libx264 -crf 20 -c:a aac -strict experimental -b:a 192k output_file