mirror of
https://github.com/KwaiVGI/LivePortrait.git
synced 2024-12-24 21:49:08 +00:00
140 lines
4.9 KiB
Python
140 lines
4.9 KiB
Python
|
# coding: utf-8
|
||
|
|
||
|
"""
|
||
|
functions for processing video
|
||
|
"""
|
||
|
|
||
|
import os.path as osp
|
||
|
import numpy as np
|
||
|
import subprocess
|
||
|
import imageio
|
||
|
import cv2
|
||
|
|
||
|
from rich.progress import track
|
||
|
from .helper import prefix
|
||
|
from .rprint import rprint as print
|
||
|
|
||
|
|
||
|
def exec_cmd(cmd):
    """Run an external command and raise if it exits with a non-zero status.

    Args:
        cmd: Either a single command string, which is interpreted by the
            system shell (the historical behaviour), or a sequence of
            arguments, which is executed directly without a shell so that
            arguments containing spaces or shell metacharacters need no
            quoting.

    Returns:
        The ``subprocess.CompletedProcess`` of the finished command. Its
        ``stdout`` attribute holds the captured output as bytes, with stderr
        merged into it.

    Raises:
        subprocess.CalledProcessError: If the command exits with a non-zero
            status; the captured output is attached to the exception.
    """
    # Only strings go through the shell: with shell=True on POSIX a list is
    # not treated as an argv (only its first item is run as the command).
    return subprocess.run(
        cmd,
        shell=isinstance(cmd, str),
        check=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.STDOUT,
    )
|
||
|
|
||
|
|
||
|
def images2video(images, wfp, **kwargs):
    """Encode a sequence of frames into a video file with imageio.

    Args:
        images: Sized iterable of frames (it must support ``len()``). Each
            frame is indexed with ``[..., ::-1]`` when ``image_mode`` is
            'bgr', so array-like frames with the channel on the last axis
            are expected.
        wfp: Path of the video file to write.
        **kwargs: Optional encoding settings:
            fps (default 30), format (default 'mp4'), codec (default
            'libx264'), quality (default None), pixelformat (default
            'yuv420p'), macro_block_size (default 2) are forwarded to
            ``imageio.get_writer``;
            crf (default 18) is passed to ffmpeg as ``-crf <value>``;
            image_mode (default 'rgb'): 'bgr' (case-insensitive) reverses
            the last axis of every frame before it is written.

    The writer is closed even if appending a frame raises, so the output
    handle is never leaked.
    """
    fps = kwargs.get('fps', 30)
    video_format = kwargs.get('format', 'mp4')  # default is mp4 format
    codec = kwargs.get('codec', 'libx264')  # default is libx264 encoding
    quality = kwargs.get('quality')  # video quality
    pixelformat = kwargs.get('pixelformat', 'yuv420p')  # video pixel format
    # The colour order is the same for every frame, so decide once up front.
    is_bgr = kwargs.get('image_mode', 'rgb').lower() == 'bgr'
    macro_block_size = kwargs.get('macro_block_size', 2)
    ffmpeg_params = ['-crf', str(kwargs.get('crf', 18))]

    writer = imageio.get_writer(
        wfp, fps=fps, format=video_format,
        codec=codec, quality=quality, ffmpeg_params=ffmpeg_params,
        pixelformat=pixelformat, macro_block_size=macro_block_size,
    )

    try:
        for frame in track(images, total=len(images), description='writing', transient=True):
            # Reverse the channel axis for BGR input before writing.
            writer.append_data(frame[..., ::-1] if is_bgr else frame)
    finally:
        writer.close()

    print(f'Dump to {wfp}\n')
|
||
|
|
||
|
|
||
|
def video2gif(video_fp, fps=30, size=256):
    """Convert a video into an animated GIF using ffmpeg's two-pass palette flow.

    The GIF is written into the directory of ``video_fp`` as
    ``<prefix(basename)>.gif`` (``prefix`` is a project helper; presumably it
    strips the file extension - confirm in ``.helper``). The intermediate
    palette is written to ``palette.png`` in that same directory and is left
    in place afterwards.

    Args:
        video_fp: Path of the input video. If it does not exist a message is
            printed and nothing else happens.
        fps: Frame rate used for the ``fps`` filter of both ffmpeg passes.
        size: Output width in pixels; the height follows the aspect ratio
            (``scale=<size>:-1``).

    Raises:
        subprocess.CalledProcessError: If either ffmpeg invocation fails.
    """
    if not osp.exists(video_fp):
        print(f'video_fp: {video_fp} not exists!')
        return

    d = osp.split(video_fp)[0]
    fn = prefix(osp.basename(video_fp))
    palette_wfp = osp.join(d, 'palette.png')
    gif_wfp = osp.join(d, f'{fn}.gif')

    resample = f'fps={fps},scale={size}:-1:flags=lanczos'
    # The commands are passed as argv lists (no shell), so paths containing
    # spaces or shell metacharacters are handed to ffmpeg verbatim.
    run_opts = dict(check=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT)

    # generate the palette
    subprocess.run(
        ['ffmpeg', '-i', video_fp, '-vf', f'{resample},palettegen', palette_wfp, '-y'],
        **run_opts,
    )
    # use the palette to generate the gif
    subprocess.run(
        ['ffmpeg', '-i', video_fp, '-i', palette_wfp,
         '-filter_complex', f'{resample}[x];[x][1:v]paletteuse', gif_wfp, '-y'],
        **run_opts,
    )
|
||
|
|
||
|
|
||
|
def merge_audio_video(video_fp, audio_fp, wfp):
    """Mux an audio file into a video with ffmpeg.

    The video stream is copied as-is (``-c:v copy``) and the audio is encoded
    as AAC (``-c:a aac``); an existing output file is overwritten (``-y``).

    Args:
        video_fp: Path of the input video.
        audio_fp: Path of the input audio.
        wfp: Path of the merged output file.

    If either input path does not exist, a message is printed and ffmpeg is
    not run.

    Raises:
        subprocess.CalledProcessError: If ffmpeg exits with an error.
    """
    if not (osp.exists(video_fp) and osp.exists(audio_fp)):
        print(f'video_fp: {video_fp} or audio_fp: {audio_fp} not exists!')
        return

    # Passed as an argv list (no shell), so paths containing spaces or shell
    # metacharacters reach ffmpeg unmodified.
    subprocess.run(
        ['ffmpeg', '-i', video_fp, '-i', audio_fp, '-c:v', 'copy', '-c:a', 'aac', wfp, '-y'],
        check=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
    )
    print(f'merge {video_fp} and {audio_fp} to {wfp}')
|
||
|
|
||
|
|
||
|
def blend(img: np.ndarray, mask: np.ndarray, background_color=(255, 255, 255)):
    """Composite an image over a solid background colour using a mask.

    Args:
        img: Image array with 3 channels on its last axis (the background is
            reshaped to ``(1, 1, 3)``, so an ``(H, W, 3)`` layout is assumed).
        mask: Opacity mask on a 0-255 scale: 255 keeps the image pixel, 0
            shows the background, values in between mix the two. It may
            already broadcast against ``img`` (e.g. ``(H, W, 1)`` or
            ``(H, W, 3)``) or be a plain ``(H, W)`` map.
        background_color: Three channel values of the background colour.

    Returns:
        The blended image as ``np.uint8``, clipped to ``[0, 255]``.
    """
    mask_float = mask.astype(np.float32) / 255.
    # A single-channel mask without a channel axis cannot broadcast against
    # the image, so give it a trailing axis of length 1.
    if mask_float.ndim == img.ndim - 1:
        mask_float = mask_float[..., np.newaxis]
    background_color = np.array(background_color).reshape([1, 1, 3])
    bg = np.ones_like(img) * background_color
    img = np.clip(mask_float * img + (1 - mask_float) * bg, 0, 255).astype(np.uint8)
    return img
|
||
|
|
||
|
|
||
|
def concat_frames(I_p_lst, driving_rgb_lst, img_rgb):
    """Build side-by-side comparison frames: driving | source | result.

    Args:
        I_p_lst: Sequence of result frames. Each must be a 3-D array; its
            height and width set the size of the corresponding output tiles.
        driving_rgb_lst: Sequence of driving frames, indexed in step with
            ``I_p_lst``.
        img_rgb: The single source image, repeated in every output frame.

    Returns:
        A list with one array per entry of ``I_p_lst``, formed by
        concatenating the resized driving frame, the resized source image
        and the result frame along the width axis.
    """
    # TODO: add more concat style, e.g., left-down corner driving

    def _tile(position, result_frame):
        # Look up the driving frame paired with this result frame.
        driving_frame = driving_rgb_lst[position]
        # Everything is resized to the result frame's height and width.
        height, width, _ = result_frame.shape
        target_size = (width, height)  # cv2.resize takes (width, height)
        driving_tile = cv2.resize(driving_frame, target_size)
        source_tile = cv2.resize(img_rgb, target_size)
        # Lay the three tiles out horizontally.
        return np.concatenate((driving_tile, source_tile, result_frame), axis=1)

    progress = track(
        enumerate(I_p_lst),
        total=len(I_p_lst),
        description='Concatenating result...',
    )
    return [_tile(position, result_frame) for position, result_frame in progress]
|
||
|
|
||
|
|
||
|
class VideoWriter:
    """Frame-by-frame video writer built on ``imageio.get_writer``.

    The underlying writer is opened in the constructor. Frames are appended
    with :meth:`write` and the file is finalised with :meth:`close`. The
    object can also be used as a context manager, which closes the writer on
    exit even if an exception was raised inside the block.

    Keyword Args:
        fps: Frames per second (default 30).
        wfp: Output file path (default 'video.mp4').
        format: Container format (default 'mp4').
        codec: Video codec (default 'libx264').
        quality: Forwarded to imageio (default None).
        pixelformat: Pixel format (default 'yuv420p').
        image_mode: 'bgr' (case-insensitive) reverses the last axis of each
            frame before writing; anything else writes frames unchanged
            (default 'rgb').
        ffmpeg_params: Extra ffmpeg arguments forwarded to imageio
            (default None).
        macro_block_size: Forwarded to imageio only when explicitly given,
            so imageio's own default applies otherwise.
    """

    def __init__(self, **kwargs):
        self.fps = kwargs.get('fps', 30)
        self.wfp = kwargs.get('wfp', 'video.mp4')
        self.video_format = kwargs.get('format', 'mp4')
        self.codec = kwargs.get('codec', 'libx264')
        self.quality = kwargs.get('quality')
        self.pixelformat = kwargs.get('pixelformat', 'yuv420p')
        self.image_mode = kwargs.get('image_mode', 'rgb')
        self.ffmpeg_params = kwargs.get('ffmpeg_params')
        self.macro_block_size = kwargs.get('macro_block_size')

        writer_kwargs = dict(
            fps=self.fps, format=self.video_format,
            codec=self.codec, quality=self.quality,
            ffmpeg_params=self.ffmpeg_params, pixelformat=self.pixelformat,
        )
        # Only forward macro_block_size when the caller supplied it, so the
        # behaviour of existing callers is unchanged.
        if 'macro_block_size' in kwargs:
            writer_kwargs['macro_block_size'] = self.macro_block_size

        self.writer = imageio.get_writer(self.wfp, **writer_kwargs)

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        # Always finalise the file; returning None lets exceptions propagate.
        self.close()

    def write(self, image):
        """Append one frame, reversing its last axis first in 'bgr' mode.

        Raises:
            RuntimeError: If the writer has already been closed.
        """
        if self.writer is None:
            raise RuntimeError('VideoWriter is closed')
        if self.image_mode.lower() == 'bgr':
            self.writer.append_data(image[..., ::-1])
        else:
            self.writer.append_data(image)

    def close(self):
        """Close the underlying writer; calling this again is a no-op."""
        if self.writer is not None:
            # Drop the reference first so a repeated close() cannot re-close.
            writer, self.writer = self.writer, None
            writer.close()
|
||
|
|
||
|
|
||
|
def change_video_fps(input_file, output_file, fps=20, codec='libx264', crf=5):
    """Re-encode a video at a different frame rate with ffmpeg.

    Args:
        input_file: Path of the source video.
        output_file: Path of the re-encoded video; overwritten if it exists
            (``-y``).
        fps: Output frame rate (ffmpeg ``-r``).
        codec: Video codec (ffmpeg ``-c:v``).
        crf: Constant rate factor passed as ``-crf``.

    Raises:
        subprocess.CalledProcessError: If ffmpeg exits with an error.
    """
    # Passed as an argv list (no shell), so paths containing spaces or shell
    # metacharacters reach ffmpeg unmodified.
    subprocess.run(
        ['ffmpeg', '-i', input_file, '-c:v', str(codec), '-crf', str(crf),
         '-r', str(fps), output_file, '-y'],
        check=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
    )
|
||
|
|
||
|
|
||
|
def get_fps(filepath):
    """Return the average frame rate of the first video stream of a file.

    The value is read from the ``avg_frame_rate`` field reported by
    ``ffmpeg.probe``, which is a string such as ``"30000/1001"`` or ``"25"``.

    Args:
        filepath: Path of the media file to probe.

    Returns:
        The frame rate as a float.

    Raises:
        ValueError: If the file has no video stream, or the reported rate is
            not a number or a ``numerator/denominator`` pair.
        ZeroDivisionError: If the reported denominator is zero (e.g. "0/0").
    """
    # Kept function-local so importing this module does not require the
    # ffmpeg package.
    import ffmpeg

    probe = ffmpeg.probe(filepath)
    video_stream = next((stream for stream in probe['streams'] if stream['codec_type'] == 'video'), None)
    if video_stream is None:
        raise ValueError(f'no video stream found in {filepath}')

    # Parse the rational string by hand instead of eval(): the text comes
    # from probing an external file and must not be executed as code.
    numerator, _, denominator = str(video_stream['avg_frame_rate']).partition('/')
    if denominator:
        return float(numerator) / float(denominator)
    return float(numerator)
|