# Thin-Plate Spline Motion Model for Image Animation


<img src="https://github.com/yoyo-nb/Thin-Plate-Spline-Motion-Model/raw/main/assets/vox.gif" width="600px" />

<img src="https://github.com/yoyo-nb/Thin-Plate-Spline-Motion-Model/raw/main/assets/ted.gif" width="600px" />

- 코딩없이 사용하기: https://replicate.com/yoyo-nb/thin-plate-spline-motion-model
- 원본 소스코드: https://github.com/yoyo-nb/Thin-Plate-Spline-Motion-Model

## 소스코드/모델 다운로드

In [None]:
!pip install -q face_alignment imageio_ffmpeg
!git clone https://github.com/yoyo-nb/Thin-Plate-Spline-Motion-Model.git
%cd Thin-Plate-Spline-Motion-Model
!mkdir checkpoints
!wget -q -c https://cloud.tsinghua.edu.cn/f/da8d61d012014b12a9e4/?dl=1 -O checkpoints/vox.pth.tar

In [None]:
%cd Thin-Plate-Spline-Motion-Model

In [None]:
!pip install pyyaml

## 설정

<img src="https://user-images.githubusercontent.com/48593306/197152487-45d5198a-1e7d-4e73-8709-cf7621827d60.png" width="600px" />

In [8]:
import torch

device = 'cuda' if torch.cuda.is_available() else 'cpu'
dataset_name = 'vox' # ['vox', 'taichi', 'ted', 'mgif'] 얼굴, 몸전체, 상반신, 말?
config_path = 'config/vox-256.yaml' # vox 모델은 256x256으로 합성됨
checkpoint_path = 'checkpoints/vox.pth.tar'
predict_mode = 'relative' # ['standard', 'relative', 'avd']
find_best_frame = True # when use the relative mode to animate a face, use 'find_best_frame=True' can get better quality result

pixel = 256 # for vox, taichi and mgif, the resolution is 256*256
if(dataset_name == 'ted'): # for ted, the resolution is 384*384
    pixel = 384

  from .autonotebook import tqdm as notebook_tqdm


## 패키지/모델 로드

In [10]:
import imageio
import imageio_ffmpeg
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.animation as animation
from skimage.transform import resize
from IPython.display import HTML
import warnings
from skimage import img_as_ubyte

from demo import load_checkpoints
from demo import make_animation
from demo import find_best_frame as _find

warnings.filterwarnings("ignore")

inpainting, kp_detector, dense_motion_network, avd_network = load_checkpoints(config_path = config_path, checkpoint_path = checkpoint_path, device = device)

## [옵션] 내 얼굴 녹화하기

driving video

In [3]:
#@title
from IPython.display import display, Javascript,HTML
from google.colab.output import eval_js
from base64 import b64decode
 
def record_video(filename):
  js=Javascript("""
    async function recordVideo() {
      const options = { mimeType: "video/webm; codecs=vp9" };
      const div = document.createElement('div');
      const capture = document.createElement('button');
      const stopCapture = document.createElement("button");
       
      capture.textContent = "Start Recording";
      capture.style.background = "orange";
      capture.style.color = "white";
 
      stopCapture.textContent = "Stop Recording";
      stopCapture.style.background = "red";
      stopCapture.style.color = "white";
      div.appendChild(capture);
 
      const video = document.createElement('video');
      const recordingVid = document.createElement("video");
      video.style.display = 'block';
 
      const stream = await navigator.mediaDevices.getUserMedia({audio:true, video: {
        facingMode: "environment",
        aspectRatio: { exact: 1 }
      }});
     
      let recorder = new MediaRecorder(stream, options);
      document.body.appendChild(div);
      div.appendChild(video);
 
      video.srcObject = stream;
      video.muted = true;
 
      await video.play();
 
      google.colab.output.setIframeHeight(document.documentElement.scrollHeight, true);
 
      await new Promise((resolve) => {
        capture.onclick = resolve;
      });
      recorder.start();
      capture.replaceWith(stopCapture);
 
      await new Promise((resolve) => stopCapture.onclick = resolve);
      recorder.stop();
      let recData = await new Promise((resolve) => recorder.ondataavailable = resolve);
      let arrBuff = await recData.data.arrayBuffer();
       
      // stop the stream and remove the video element
      stream.getVideoTracks()[0].stop();
      div.remove();
 
      let binaryString = "";
      let bytes = new Uint8Array(arrBuff);
      bytes.forEach((byte) => {
        binaryString += String.fromCharCode(byte);
      })
    return btoa(binaryString);
    }
  """)
  display(js)
#   try:
#     display(js)
#     data=eval_js('recordVideo({})')
#     binary=b64decode(data)
#     with open(filename,"wb") as video_file:
#       video_file.write(binary)
#     print(f"Finished recording video at:{filename}")
#   except Exception as err:
#     print(str(err))

record_video('assets/capture.mp4')

<IPython.core.display.Javascript object>

## [옵션] DALL-E 2로 얼굴 생성하기

source image

https://labs.openai.com

번역: https://papago.naver.com

```
A portrait of a black man with frontal face
```

## 전처리

In [11]:
source_image_path = 'assets/result.jpg'
driving_video_path = 'assets/driving.mp4'

source_image = imageio.imread(source_image_path) # 합성할 이미지
reader = imageio.get_reader(driving_video_path)  # 원본 비디오

source_image = resize(source_image, (pixel, pixel))[..., :3] # 소스이미지 리사이즈 256x256

fps = reader.get_meta_data()['fps'] # 프레임 단위로 분리
driving_video = []
try:
    for im in reader:
        driving_video.append(im)
except RuntimeError:
    pass
########
# print(reader)
# print(len(driving_video))
# for i in reader:
#     print(i.shape)
#     print(type(i))
#     break
########
reader.close()

driving_video = [resize(frame, (pixel, pixel))[..., :3] for frame in driving_video] # driving_video 리사이즈

def display(source, driving, generated=None):
    fig = plt.figure(figsize=(8 + 4 * (generated is not None), 4))
    fig.subplots_adjust(bottom=0, top=1, left=0, right=1)

    ims = []
    for i in range(len(driving)): # 원본 비디오에서 하나의 프레임씩
        cols = [source]
        cols.append(driving[i])
        if generated is not None:
            cols.append(generated[i])
        im = plt.imshow(np.concatenate(cols, axis=1), animated=True)
        plt.axis('off')
        ims.append([im])

    ani = animation.ArtistAnimation(fig, ims, interval=50, repeat_delay=1000)
    plt.close()
    return ani
    

HTML(display(source_image, driving_video).to_html5_video())

RuntimeError: Requested MovieWriter (ffmpeg) not available

## 추론/결과보기

In [None]:
output_video_path = 'assets/toonification_result.mp4'

if predict_mode=='relative' and find_best_frame:
    i = _find(source_image, driving_video, device=='cpu')
    print ("Best frame: " + str(i))
    driving_forward = driving_video[i:]
    driving_backward = driving_video[:(i+1)][::-1]
    predictions_forward = make_animation(source_image, driving_forward, inpainting, kp_detector, dense_motion_network, avd_network, device = device, mode = predict_mode)
    predictions_backward = make_animation(source_image, driving_backward, inpainting, kp_detector, dense_motion_network, avd_network, device = device, mode = predict_mode)
    predictions = predictions_backward[::-1] + predictions_forward[1:]
else:
    predictions = make_animation(source_image, driving_video, inpainting, kp_detector, dense_motion_network, avd_network, device = device, mode = predict_mode)

# save result video
imageio.mimsave(output_video_path, [img_as_ubyte(frame) for frame in predictions], fps=fps)

HTML(display(source_image, driving_video, predictions).to_html5_video())

Downloading: "https://www.adrianbulat.com/downloads/python-fan/s3fd-619a316812.pth" to /root/.cache/torch/hub/checkpoints/s3fd-619a316812.pth


  0%|          | 0.00/85.7M [00:00<?, ?B/s]

Downloading: "https://www.adrianbulat.com/downloads/python-fan/2DFAN4-cd938726ad.zip" to /root/.cache/torch/hub/checkpoints/2DFAN4-cd938726ad.zip


  0%|          | 0.00/91.9M [00:00<?, ?B/s]

115it [04:26,  1.79s/it]