### Text-Input Processing and Tokenization

In [1]:
from transformers import CLIPTokenizer

# Load the tokenizer that ships with the Stable Diffusion 2 checkpoint so the
# token ids come from the same vocabulary/special tokens as the rest of the
# diffusion stack used further down in this notebook.
tokenizer = CLIPTokenizer.from_pretrained(
    "stabilityai/stable-diffusion-2", subfolder="tokenizer"
)
prompt = "A sunset over the mountains"

# `padding=True` only pads to the longest sequence in the batch, which for a
# single prompt means no padding at all. Stable Diffusion conditions on a
# fixed-length sequence, so pad/truncate to the tokenizer's context length.
text_inputs = tokenizer(
    prompt,
    padding="max_length",
    max_length=tokenizer.model_max_length,
    truncation=True,
    return_tensors="pt",
)

  from .autonotebook import tqdm as notebook_tqdm
To support symlinks on Windows, you either need to activate Developer Mode or to run Python as an administrator. In order to see activate developer mode, see this article: https://docs.microsoft.com/en-us/windows/apps/get-started/enable-your-device-for-development


### Text Encoding

In [2]:
import torch
from transformers import CLIPTextModel

# Use the text encoder bundled with the Stable Diffusion 2 checkpoint: its
# hidden size is what that checkpoint's UNet cross-attention expects, which is
# not the case for the standalone "openai/clip-vit-base-patch32" encoder.
text_encoder = CLIPTextModel.from_pretrained(
    "stabilityai/stable-diffusion-2", subfolder="text_encoder"
)

# Inference only: skip autograd bookkeeping.
with torch.no_grad():
    # The UNet attends over per-token embeddings, so keep the full
    # (batch, sequence, hidden) `last_hidden_state` rather than the pooled
    # (batch, hidden) vector.
    # NOTE(review): only `input_ids` is passed, mirroring how the diffusers
    # Stable Diffusion pipeline encodes prompts when the encoder config does
    # not request an attention mask — confirm for other checkpoints.
    text_embeddings = text_encoder(text_inputs.input_ids).last_hidden_state



ChunkedEncodingError: ("Connection broken: ConnectionResetError(10054, 'An existing connection was forcibly closed by the remote host', None, 10054, None)", ConnectionResetError(10054, 'An existing connection was forcibly closed by the remote host', None, 10054, None))

### Latent Space Initialization

In [None]:
import torch

# Fixed seed so "Restart Kernel -> Run All" reproduces the same starting noise.
SEED = 0
noise_generator = torch.Generator().manual_seed(SEED)

# Example latent space: one sample of standard-normal noise with shape
# (1, 4, 64, 64).
latent_vector = torch.randn(1, 4, 64, 64, generator=noise_generator)

### Diffusion Model (UNet)

In [None]:
import torch
from diffusers import UNet2DConditionModel

# The repository root holds the pipeline index; the UNet weights and config
# live in the "unet" subfolder.
unet_model = UNet2DConditionModel.from_pretrained(
    "stabilityai/stable-diffusion-2", subfolder="unet"
)

# The UNet forward pass requires the diffusion timestep in addition to the
# noisy sample and the text conditioning.
# NOTE(review): 999 assumes a 1000-step training schedule, i.e. the noisiest
# timestep for pure-noise latents — confirm against the scheduler config.
INITIAL_TIMESTEP = 999

# Inference only: skip autograd bookkeeping.
with torch.no_grad():
    # `encoder_hidden_states` must be per-token embeddings of shape
    # (batch, sequence, hidden). The call returns an output object; the
    # predicted tensor is its `.sample` field.
    refined_latent = unet_model(
        latent_vector,
        INITIAL_TIMESTEP,
        encoder_hidden_states=text_embeddings,
    ).sample

### Scheduler for Denoising

In [None]:
import torch
from diffusers import PNDMScheduler

# The scheduler config lives in the "scheduler" subfolder of the checkpoint.
scheduler = PNDMScheduler.from_pretrained(
    "stabilityai/stable-diffusion-2", subfolder="scheduler"
)

# Number of denoising iterations; more steps trade speed for quality.
num_steps = 50
scheduler.set_timesteps(num_steps)

# Scale the starting noise to the magnitude the scheduler expects.
# NOTE: this cell rebinds `latent_vector`; re-run the latent initialization
# cell before re-running this one.
latent_vector = latent_vector * scheduler.init_noise_sigma

# Inference only: skip autograd bookkeeping.
with torch.no_grad():
    for timestep in scheduler.timesteps:
        # The model prediction depends on the current latents and timestep,
        # so it has to be recomputed on every iteration.
        model_input = scheduler.scale_model_input(latent_vector, timestep)
        refined_latent = unet_model(
            model_input,
            timestep,
            encoder_hidden_states=text_embeddings,
        ).sample
        # step(model_output, timestep, sample) returns an output object; the
        # latents for the next iteration are its `.prev_sample` field.
        latent_vector = scheduler.step(
            refined_latent, timestep, latent_vector
        ).prev_sample

### Image Decoding (VAE)

In [None]:
import torch
from diffusers import AutoencoderKL

# The autoencoder weights and config live in the "vae" subfolder.
vae = AutoencoderKL.from_pretrained(
    "stabilityai/stable-diffusion-2", subfolder="vae"
)

# Inference only: skip autograd bookkeeping.
with torch.no_grad():
    # The diffusion process operates on latents multiplied by the VAE's
    # scaling factor; undo that scaling before decoding back to pixel space.
    generated_image = vae.decode(
        latent_vector / vae.config.scaling_factor
    ).sample

### Post-processing

In [None]:
from PIL import Image
import numpy as np

# Detach from autograd and move to host memory so `.numpy()` is legal.
# NOTE(review): assumes the decoder output is in [-1, 1], as in the diffusers
# Stable Diffusion pipeline; map it to [0, 1] and clamp stray values so the
# uint8 cast cannot wrap around.
image_tensor = (generated_image[0].detach().cpu().float() / 2 + 0.5).clamp(0, 1)

# Channels-first (C, H, W) -> channels-last (H, W, C), as PIL expects.
image_array = (image_tensor.permute(1, 2, 0).numpy() * 255).round().astype(np.uint8)

final_image = Image.fromarray(image_array)
final_image.save("output_image.png")

### Pipeline Integration

In [None]:
import torch
from diffusers import StableDiffusionPipeline

# Fall back to the CPU when no CUDA device is present instead of crashing.
device = "cuda" if torch.cuda.is_available() else "cpu"

pipeline = StableDiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-2"
).to(device)

# `.images` is a list of PIL images, one per prompt.
generated_image = pipeline("A sunset over the mountains").images[0]

# Leave the image as the cell's last expression so the notebook renders it
# inline rather than launching an external viewer.
generated_image