### Setup

In [None]:
# %cd ~

In [None]:
# ~/.cache/huggingface

In [None]:
import wandb
import os
import time

wandb.login()

In [None]:
import torch

torch.cuda.empty_cache()
print(torch.cuda.memory_allocated() / (1024 ** 3))
print(torch.cuda.memory_reserved() / (1024 ** 3))

In [None]:
from diffusers import StableDiffusionPipeline
import torch
import random
from PIL import Image

device = "cuda" if torch.cuda.is_available() else "cpu"


def image_grid(imgs, rows, cols, size=None):
    assert len(imgs) == rows*cols

    w, h = imgs[0].size
    grid = Image.new('RGB', size=(cols*w, rows*h))
    grid_w, grid_h = grid.size
    
    for i, img in enumerate(imgs):
        grid.paste(img, box=(i%cols*w, i//cols*h))

    if size:
        return grid.resize((cols * size, rows * size))
    else:   
        return grid

import os
import math

# define function to get size of directory in bytes
def get_dir_size(path):
    total_size = os.path.getsize(path)
    if os.path.isdir(path):
        for item in os.listdir(path):
            item_path = os.path.join(path, item)
            if os.path.isfile(item_path):
                total_size += os.path.getsize(item_path)
            elif os.path.isdir(item_path):
                total_size += get_dir_size(item_path)
    return total_size

In [None]:
import diffusers
from diffusers import StableDiffusionPipeline, PNDMScheduler, EulerDiscreteScheduler, DDIMScheduler
import torch

schedulers = {
    "pndm": PNDMScheduler,
    "euler": EulerDiscreteScheduler,
    "ddim": DDIMScheduler
}

### Deliberate

In [None]:
import diffusers
from diffusers import StableDiffusionPipeline, EulerDiscreteScheduler
from transformers import CLIPImageProcessor
import torch

PROJECT_NAME = "sd-profiler"

model_id = "XpucT/Deliberate"
scheduler = schedulers["pndm"].from_pretrained(model_id, subfolder="scheduler")
pipe = StableDiffusionPipeline.from_pretrained(model_id, scheduler=scheduler, torch_dtype=torch.float16)
pipe = pipe.to(device)

print(f"Scheduler: {pipe.scheduler.config['_class_name']}")

torch.cuda.empty_cache()
print(torch.cuda.memory_allocated() / (1024 ** 3))
print(torch.cuda.memory_reserved() / (1024 ** 3))

# model_path = "./.cache/huggingface/hub/models--" + model_id.replace("/", "--")

# # get size of directory in bytes
# dir_size = get_dir_size(model_path)

# # convert to GB
# dir_size_gb = dir_size / (1024**3)

# print(f"Directory size {math.ceil(dir_size_gb)} GB")

In [None]:
prompts = [
    "The most beautiful cat nowadays can be described as a Bengal cat",
    "The most beautiful cat nowadays can be described as a Bengal cat. They have short, smooth and shiny fur with various colors, from orange, brown to gray and black",
    "The most beautiful cat nowadays can be described as a Bengal cat. They have short, smooth and shiny fur with various colors, from orange, brown to gray and black. The highlight of their appearance is the bold black stripes on their fur, creating a wild and charming look. They have big, bright eyes with green or yellow color"
]

In [9]:
n = 1
for inference_step in [20, 40, 60]:
    for sched in ["pndm", "ddim"]:
        for prompt in prompts:
            model_id = "XpucT/Deliberate"
            scheduler = schedulers[sched].from_pretrained(model_id, subfolder="scheduler")
            pipe = StableDiffusionPipeline.from_pretrained(model_id, scheduler=scheduler, torch_dtype=torch.float16)
            pipe = pipe.to(device)
            
            config = {}
            
            config["prompt"] = prompt
            config["word_count"] = len(config["prompt"].split())
            config["token_count"] = len(pipe.tokenizer(config["prompt"])["input_ids"])
            
            config["num_inference_steps"] = inference_step
            config["guidance_scale"] = 7.5
            config["num_images_per_prompt"] = 1
            
            config["cpu_count"] = os.cpu_count()
            config["gpu_count"] = torch.cuda.device_count()
            config["gpu_type"] = torch.cuda.get_device_name(0)
            config["cuda_memory_allocated (GB)"] = round(torch.cuda.memory_allocated() / (1024 ** 3), 2)
            
            for k, v in pipe.config.items():
                if k == "_name_or_path":
                    k = "model_id"
                
                if isinstance(v, tuple):
                    config[k] = v[1]
                else:
                    config[k] = v
            
            
            samples = 3
            seeds = []
            images = []
            
            for i in range(samples):
                wandb.init(project=PROJECT_NAME, config=config)
                
                seed = random.randint(0, 1e6)
                generator = torch.Generator(device).manual_seed(seed)
                
                torch.cuda.empty_cache()
                start_cuda_malloc = torch.cuda.memory_allocated()
                start_cuda_mres = torch.cuda.memory_reserved()
                start_time = time.time()
                
                image = pipe(
                    prompt = config["prompt"],
                    num_inference_steps = config["num_inference_steps"],
                    guidance_scale = config["guidance_scale"],
                    num_images_per_prompt = config["num_images_per_prompt"],
                    generator=generator
                ).images[0]
                
                end_time = time.time()
                end_cuda_malloc = torch.cuda.memory_allocated()
                end_cuda_mres = torch.cuda.memory_reserved()
                elapsed_time = end_time - start_time
                cuda_malloc_usage = (end_cuda_malloc - start_cuda_malloc) / (1024 **3)
                cuda_mres_usage = (end_cuda_mres - start_cuda_mres) / (1024 ** 3)
                
                wandb.config.update({
                    "seed": seed,
                    "elapsed_time (seconds)": round(elapsed_time, 2),
                    "cuda_inference_usage (GB)": round(cuda_mres_usage, 2)    
                })
                
                wandb.finish()
                
                print(f"iteration: #{n}")
                print(f"Word count: {len(config['prompt'].split())}")
                print(f"Token count: {len(pipe.tokenizer(config['prompt'])['input_ids'])}")
                print(f"Inference Steps: {inference_step}")
                print(f"Scheduler: {scheduler}")
                
                print(f"Elapsed time: {round(elapsed_time, 2)} seconds")
                print(f"CUDA Model size: {round(start_cuda_malloc / (1024 ** 3), 2)} GB")
                print(f"CUDA Memory Allocated: {round(cuda_malloc_usage, 2)} GB")
                print(f"CUDA Memory Inference: {round(cuda_mres_usage, 2)} GB")

                n += 1
    
    #     images.append(image)
    #     seeds.append(seed)
    
    # print(seeds)
    # image_grid(images, 1, samples, 256)

text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.
[34m[1mwandb[0m: Currently logged in as: [33mmatt24[0m. Use [1m`wandb login --relogin`[0m to force relogin


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.732065…

iteration: #1
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.53 seconds
CUDA Model size: 2.58 GB
CUDA Memory Allocated: 0.01 GB
CUDA Memory Inference: 0.62 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667051240801811, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #2
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.62 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667097806930542, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #3
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.69 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #4
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.65 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667995030681292, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.716478…

iteration: #5
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.67 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01666877105211218, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #6
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.67 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.699792…

iteration: #7
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.64 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670652106404303, max=1.0…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #8
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.66 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016671140988667805, max=1.0…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #9
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.66 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #10
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.52 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670470498502253, max=1.0…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #11
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.58 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667049378156662, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #12
Word count: 12
Token count: 14
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.54 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #13
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.53 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670354114224514, max=1.0…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #14
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.54 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670493812610706, max=1.0…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #15
Word count: 29
Token count: 35
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.71 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.699792…

iteration: #16
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.67 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01666981866583228, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #17
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.58 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01666939960171779, max=1.0)…

  0%|          | 0/20 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #18
Word count: 58
Token count: 68
Inference Steps: 20
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 1.57 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #19
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.12 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667174631729722, max=1.0)…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #20
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.16 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670847684144972, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #21
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.17 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #22
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.06 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670586944868167, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #23
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.98 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670666076242922, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #24
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.05 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #25
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.08 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670405336966117, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #26
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.05 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670503125836452, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #27
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.16 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.009 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.491705…

iteration: #28
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.93 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01667039602374037, max=1.0)…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #29
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.98 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670475217203298, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #30
Word count: 12
Token count: 14
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.01 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #31
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.93 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670354145268598, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #32
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.93 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016669455512116352, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #33
Word count: 29
Token count: 35
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.0 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #34
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.94 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016669157519936563, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.699792…

iteration: #35
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 2.99 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016668612758318584, max=1.0…

  0%|          | 0/40 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #36
Word count: 58
Token count: 68
Inference Steps: 40
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 3.0 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #37
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.39 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016669711594780288, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #38
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.57 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670456466575462, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #39
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.46 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #40
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.41 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670759146412212, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #41
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.4 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016669753411163887, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #42
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.46 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.699792…

iteration: #43
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.43 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016671676343927782, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #44
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.49 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670526284724475, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #45
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: PNDMScheduler {
  "_class_name": "PNDMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.49 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #46
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.42 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670540254563094, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #47
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.42 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670563506583372, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.006 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.728979…

iteration: #48
Word count: 12
Token count: 14
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.41 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #49
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.31 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016669041011482477, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #50
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.35 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670456466575462, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #51
Word count: 29
Token count: 35
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.5 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


text_encoder/model.safetensors not found


Loading pipeline components...:   0%|          | 0/7 [00:00<?, ?it/s]

`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["id2label"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["bos_token_id"]` will be overriden.
`text_config_dict` is provided which will be used to initialize `CLIPTextConfig`. The value `text_config["eos_token_id"]` will be overriden.


  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #52
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.34 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670754458755255, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #53
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.39 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.016670950036495925, max=1.0…

  0%|          | 0/60 [00:00<?, ?it/s]

VBox(children=(Label(value='0.004 MB of 0.004 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

iteration: #54
Word count: 58
Token count: 68
Inference Steps: 60
Scheduler: DDIMScheduler {
  "_class_name": "DDIMScheduler",
  "_diffusers_version": "0.19.3",
  "beta_end": 0.012,
  "beta_schedule": "scaled_linear",
  "beta_start": 0.00085,
  "clip_sample": false,
  "clip_sample_range": 1.0,
  "dynamic_thresholding_ratio": 0.995,
  "num_train_timesteps": 1000,
  "prediction_type": "epsilon",
  "rescale_betas_zero_snr": false,
  "sample_max_value": 1.0,
  "set_alpha_to_one": false,
  "skip_prk_steps": true,
  "steps_offset": 1,
  "thresholding": false,
  "timestep_spacing": "leading",
  "trained_betas": null
}

Elapsed time: 4.47 seconds
CUDA Model size: 2.59 GB
CUDA Memory Allocated: 0.0 GB
CUDA Memory Inference: 0.6 GB


In [None]:
image_grid(images, 1, samples, 256)

In [None]:
# %%time

import time
 

samples = 4
seeds = []
images = []

for i in range(samples):
    wandb.init(project=PROJECT_NAME, config=config) 
    seed = random.randint(0, 1e6)
    generator = torch.Generator(device).manual_seed(seed)
    torch.cuda.empty_cache()
    start_cuda_malloc = torch.cuda.memory_allocated()
    start_cuda_mres = torch.cuda.memory_reserved()
    start_time = time.time()
    image = pipe(
        prompt = config["prompt"],
        num_inference_steps = config["num_inference_steps"],
        guidance_scale = config["guidance_scale"],
        num_images_per_prompt = config["num_images_per_prompt"],
        generator=generator
    ).images[0]
    end_time = time.time()
    end_cuda_malloc = torch.cuda.memory_allocated()
    end_cuda_mres = torch.cuda.memory_reserved()
    elapsed_time = end_time - start_time
    cuda_malloc_usage = (end_cuda_malloc - start_cuda_malloc) / (1024 **3)
    cuda_mres_usage = (end_cuda_mres - start_cuda_mres) / (1024 ** 3)
    
    wandb.config.update({
        "seed": seed,
        "elapsed_time (seconds)": round(elapsed_time, 2),
        "cuda_inference_usage (GB)": round(cuda_mres_usage, 2)    
    })
    
    wandb.finish()

    print(f"Word count: {len(config['prompt'].split())}")
    print(f"Token count: {len(pipe.tokenizer(config['prompt'])['input_ids'])}")
    print(f"Elapsed time: {round(elapsed_time, 2)} seconds")
    print(f"CUDA Model size: {round(start_cuda_malloc / (1024 ** 3), 2)} GB")
    print(f"CUDA Memory Allocated: {round(cuda_malloc_usage, 2)} GB")
    print(f"CUDA Memory Inference: {round(cuda_mres_usage, 2)} GB")

#     images.append(image)
#     seeds.append(seed)

# print(seeds)
# image_grid(images, 1, samples, 512)