In [1]:
import torch
import os
import psutil
from diffusers import AnimateDiffPipeline, MotionAdapter, EulerDiscreteScheduler
from diffusers.utils import export_to_gif
from huggingface_hub import hf_hub_download
from safetensors.torch import load_file

# --- Checkpoint selection ---------------------------------------------------
# `step` is embedded in the Lightning checkpoint filename and is also reused as
# the number of inference steps when the pipeline is called.
step = 8
repo = "ByteDance/AnimateDiff-Lightning"
base = "emilianJR/epiCRealism"
ckpt = f"animatediff_lightning_{step}step_diffusers.safetensors"

# --- Runtime target ---------------------------------------------------------
# Half precision on the GPU; both values are handed to the adapter/pipeline.
device, dtype = "cuda", torch.float16

# --- Prompt for the first clip ----------------------------------------------
prompt = (
    "Donald Trump stands at the podium and talks a lot.The camera remains stationary, focused on the man. The lighting is warm and natural. The scene appears to be real-life footage."
)

# Default-construct the motion adapter on the target device/precision, then
# overwrite its parameters with the Lightning checkpoint pulled from the Hub.
adapter = MotionAdapter().to(device, dtype)
lightning_weights = load_file(hf_hub_download(repo, ckpt), device=device)
adapter.load_state_dict(lightning_weights)

# Build the AnimateDiff pipeline around the base checkpoint with the adapter
# plugged in, and move the whole pipeline to the device.
pipe = AnimateDiffPipeline.from_pretrained(
    base,
    motion_adapter=adapter,
    torch_dtype=dtype,
)
pipe = pipe.to(device)

# Replace the scheduler with an Euler scheduler derived from the pipeline's own
# scheduler config, overriding only the timestep spacing and beta schedule.
scheduler_overrides = {"timestep_spacing": "trailing", "beta_schedule": "linear"}
pipe.scheduler = EulerDiscreteScheduler.from_config(
    pipe.scheduler.config,
    **scheduler_overrides,
)

# Sampling settings for the first clip. The inference step count reuses `step`,
# the same value the checkpoint filename was built from.
# NOTE(review): num_frames=160 is a long clip — confirm the loaded motion
# adapter supports sequences of this length.
generation_args = dict(
    prompt=prompt,
    guidance_scale=1.0,
    num_inference_steps=step,
    width=768,
    height=480,
    num_frames=160,
)
output = pipe(**generation_args)

# Write the first entry of `output.frames` as a GIF. Kept as the cell's last
# expression so the notebook echoes the value returned by export_to_gif.
export_to_gif(output.frames[0], "trump.gif", fps=24)

  from .autonotebook import tqdm as notebook_tqdm
Loading pipeline components...: 100%|██████████| 6/6 [00:02<00:00,  2.96it/s]
100%|██████████| 8/8 [00:04<00:00,  1.67it/s]


'trump.gif'

In [2]:
# Prompt for the street-market clip.
# NOTE: the recorded run of this cell reported 91 tokens against CLIP's
# 77-token limit, and the tail starting at "warm and authentic, ..." was
# truncated, i.e. it did not reach the text encoder.
prompt = (
    "A young woman walks through a lively street market, surrounded by the hum of conversation and the clatter of vendors’ stalls. The camera follows her from a handheld medium shot, capturing the gentle sway of her movement as she weaves between crowds. Sunlight filters through vibrant umbrellas and patchwork tents above, casting shifting patterns of light and shadow on the pavement. The atmosphere feels warm and authentic, rich with the colors and textures of everyday life."
)

# Same sampling settings as the first clip; `pipe` and `step` come from the
# setup cell.
# NOTE(review): num_frames=160 is a long clip — confirm the loaded motion
# adapter supports sequences of this length.
market_args = {
    "prompt": prompt,
    "guidance_scale": 1.0,
    "num_inference_steps": step,
    "width": 768,
    "height": 480,
    "num_frames": 160,
}
output = pipe(**market_args)

# Export the first entry of `output.frames`; left as the final expression so
# the returned value is shown as the cell result.
export_to_gif(output.frames[0], "market.gif", fps=24)


Token indices sequence length is longer than the specified maximum sequence length for this model (91 > 77). Running this sequence through the model will result in indexing errors
The following part of your input was truncated because CLIP can only handle sequences up to 77 tokens: ['warm and authentic, rich with the colors and textures of everyday life.']
100%|██████████| 8/8 [00:04<00:00,  1.61it/s]


'market.gif'

In [None]:
# Prompt for the canyon/river clip.
# NOTE: the recorded run of this cell reported that CLIP truncated the prompt
# at 77 tokens; the tail starting at "contrasting with the brown and gray
# rocks ..." was dropped.
prompt = (
    "A clear, turquoise river flows through a rocky canyon, cascading over a small waterfall and forming a pool of water at the bottom.The river is the main focus of the scene, with its clear water reflecting the surrounding trees and rocks. The canyon walls are steep and rocky, with some vegetation growing on them. The trees are mostly pine trees, with their green needles contrasting with the brown and gray rocks. The overall tone of the scene is one of peace and tranquility."
)

# `num_frames` is deliberately not passed here, so whatever default the
# pipeline uses applies (the other generation cells pass num_frames=160).
landscape_args = dict(
    prompt=prompt,
    guidance_scale=1.0,
    num_inference_steps=step,
    width=768,
    height=480,
)
output = pipe(**landscape_args)

# Export the first entry of `output.frames` as a GIF.
export_to_gif(output.frames[0], "landscape.gif", fps=24)

# Force-kill every other process whose name contains "python".
#
# WARNING: the match is by process name only; it does not look at what the
# process is doing or who started it.
# NOTE(review): this can plausibly include the Jupyter server hosting this
# kernel and unrelated Python jobs — confirm this is intended before running
# on a shared machine.
current_pid = os.getpid()
for proc in psutil.process_iter(attrs=['pid', 'name']):
    # psutil substitutes None for attributes it is not allowed to read, so
    # normalise the name before calling .lower() on it.
    proc_name = proc.info['name'] or ""
    if "python" not in proc_name.lower() or proc.info['pid'] == current_pid:
        continue
    try:
        # Process.kill() reports failures as psutil.NoSuchProcess /
        # psutil.AccessDenied, which is what the handler below catches. A raw
        # os.kill() raises ProcessLookupError / PermissionError instead, which
        # would escape the handler and abort the loop on the first process
        # that has already exited or belongs to someone else.
        proc.kill()
    except (psutil.NoSuchProcess, psutil.AccessDenied):
        # Best effort: the process is already gone or not ours to kill.
        continue

The following part of your input was truncated because CLIP can only handle sequences up to 77 tokens: ['contrasting with the brown and gray rocks. the overall tone of the scene is one of peace and tranquility.']
100%|██████████| 8/8 [00:05<00:00,  1.59it/s]
