latentblending/example2_multitrans.py

78 lines
3.2 KiB
Python
Raw Normal View History

2023-02-18 07:19:40 +00:00
# Copyright 2022 Lunar Ring. All rights reserved.
# Written by Johannes Stelzer, email stelzer@lunar-ring.ai twitter @j_stelzer
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import torch

# Global torch switches for this inference-only script:
# turn off the cuDNN benchmark mode and disable gradient tracking.
torch.backends.cudnn.benchmark = False
torch.set_grad_enabled(False)

# Silence warnings *before* the project modules are imported, so that
# warnings raised while importing them are suppressed as well.
import warnings
warnings.filterwarnings('ignore')

from latent_blending import LatentBlending
from stable_diffusion_holder import StableDiffusionHolder
from movie_util import concatenate_movies
from huggingface_hub import hf_hub_download

# %% First let us spawn a stable diffusion holder. Uncomment your version of choice.
# The checkpoint is fetched via hf_hub_download and the value it returns is
# handed straight to StableDiffusionHolder.
# fp_ckpt = hf_hub_download(repo_id="stabilityai/stable-diffusion-2-1-base", filename="v2-1_512-ema-pruned.ckpt")
fp_ckpt = hf_hub_download(repo_id="stabilityai/stable-diffusion-2-1", filename="v2-1_768-ema-pruned.ckpt")
sdh = StableDiffusionHolder(fp_ckpt)

# %% Let's setup the multi transition
fps = 30
# Passed to write_movie_transition for every segment
# (presumably the segment length in seconds -- TODO confirm).
duration_single_trans = 6
depth_strength = 0.55  # Specifies how deep (in terms of diffusion iterations) the first branching happens

# Specify a list of prompts below. Consecutive prompts form one transition,
# so N prompts yield N - 1 movie segments.
list_prompts = [
    "surrealistic statue made of glitter and dirt, standing in a lake, atmospheric light, strange glow",
    "statue of a mix between a tree and human, made of marble, incredibly detailed",
    "weird statue of a frog monkey, many colors, standing next to the ruins of an ancient city",
    "statue of a spider that looked like a human",
    "statue of a bird that looked like a scorpion",
    "statue of an ancient cybernetic messenger annoucing good news, golden, futuristic",
]

# You can optionally specify the seeds (one per prompt; each transition
# uses the seeds of its two neighbouring prompts).
list_seeds = [954375479, 332539350, 956051013, 408831845, 250009012, 675588737]

t_compute_max_allowed = 12  # per segment

# Output path of the final, concatenated movie.
fp_movie = 'movie_example2.mp4'
lb = LatentBlending(sdh)

# Render one movie segment per pair of consecutive prompts and remember the
# file name of each segment so they can be joined afterwards.
list_movie_parts = []
for i, prompt_next in enumerate(list_prompts[1:]):
    # For a multi transition we can save some computation time and recycle the latents
    if i == 0:
        # First segment: both endpoints have to be set explicitly.
        lb.set_prompt1(list_prompts[0])
        lb.set_prompt2(prompt_next)
        recycle_img1 = False
    else:
        # Later segments: move the blender forward, then only the new
        # end prompt needs to be supplied.
        lb.swap_forward()
        lb.set_prompt2(prompt_next)
        recycle_img1 = True
    # NOTE(review): recycle_img1 is assigned but never used in this script
    # (it is not passed to run_transition) -- confirm whether it is still needed.

    fp_movie_part = f"tmp_part_{i:03d}.mp4"
    # Seeds belonging to the start and end prompt of this segment.
    fixed_seeds = list_seeds[i:i + 2]

    # Run latent blending
    lb.run_transition(
        depth_strength=depth_strength,
        t_compute_max_allowed=t_compute_max_allowed,
        fixed_seeds=fixed_seeds)

    # Save movie
    lb.write_movie_transition(fp_movie_part, duration_single_trans)
    list_movie_parts.append(fp_movie_part)

# Finally, concatenate the result
concatenate_movies(fp_movie, list_movie_parts)