In [None]:
from diffusers import BitsAndBytesConfig, SD3Transformer2DModel,FluxPipeline,FluxTransformer2DModel
from diffusers import StableDiffusion3Pipeline
import torch

model_id = "black-forest-labs/FLUX.1-dev"

# Using torch.float16 for better compatibility
nf4_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_quant_type="nf4",
    bnb_4bit_compute_dtype=torch.bfloat16  # Use float16 for consistency
)
model_nf4 = FluxTransformer2DModel.from_pretrained(
    model_id,
    subfolder="transformer",
    quantization_config=nf4_config,
    torch_dtype=torch.bfloat16  # Ensure float16 here as well
)

pipeline = FluxPipeline.from_pretrained(
    model_id, 
    transformer=model_nf4,
    torch_dtype=torch.bfloat16  # Ensure consistency with the model
)
pipeline.enable_model_cpu_offload()  # Make sure this is necessary for your setup

prompt = "Fernando Alonso winning the F1 championship with Ferrari"

# Adjusting max_sequence_length for performance (e.g., 128)
image = pipeline(
    prompt=prompt,
    num_inference_steps=50,
    guidance_scale=3.5,
    max_sequence_length=128  # You can try lowering this for better performance

).images[0]

image.save("generated_images/flux/ferrari.png")


Fetching 3 files: 100%|██████████| 3/3 [00:00<00:00, 27594.11it/s]
Loading checkpoint shards: 100%|██████████| 2/2 [00:00<00:00,  3.09it/s]
Loading pipeline components...: 100%|██████████| 7/7 [00:00<00:00,  7.19it/s]
100%|██████████| 50/50 [01:27<00:00,  1.75s/it]


In [None]:
from diffusers import BitsAndBytesConfig, SD3Transformer2DModel
from diffusers import StableDiffusion3Pipeline
import torch
from huggingface_hub import login

login(token="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")

model_id = "stabilityai/stable-diffusion-3.5-large"



nf4_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_quant_type="nf4",
    bnb_4bit_compute_dtype=torch.bfloat16
    
)
model_nf4 = SD3Transformer2DModel.from_pretrained(
    model_id,
    subfolder="transformer",
    quantization_config=nf4_config,
    torch_dtype=torch.bfloat16,
)



pipeline = StableDiffusion3Pipeline.from_pretrained(
    model_id, 
    transformer=model_nf4,
    torch_dtype=torch.bfloat16
)
pipeline.vae.to(torch.bfloat16)
pipeline.text_encoder.to(torch.bfloat16)

pipeline.text_encoder_2.to(torch.bfloat16)

pipeline.text_encoder_3.to(torch.bfloat16)

pipeline.enable_model_cpu_offload()

prompt='Fernando Alonso winning the F1 championship with Ferrari'
image = pipeline(
    prompt,
    height=1024,
    width=1024,
    guidance_scale=3.5,
    num_inference_steps=50,
    max_sequence_length=76,
    generator=torch.Generator("cpu").manual_seed(0)
    
).images[0]
image.save("generated_images/stable_diffusion/ferrari.png")


Fetching 2 files: 100%|██████████| 2/2 [00:00<00:00, 16352.06it/s]
Loading checkpoint shards: 100%|██████████| 2/2 [00:02<00:00,  1.03s/it]it/s]
Loading pipeline components...: 100%|██████████| 9/9 [00:03<00:00,  2.36it/s]
100%|██████████| 50/50 [01:18<00:00,  1.57s/it]


In [None]:

import torch
from diffusers import SanaPipeline,SanaTransformer2DModel,BitsAndBytesConfig

model_id="Efficient-Large-Model/Sana_600M_1024px_diffusers"
nf4_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_quant_type="nf4",
    bnb_4bit_compute_dtype=torch.bfloat16
    
)
model_nf4 = SanaTransformer2DModel.from_pretrained(
    model_id,
    subfolder="transformer",
    quantization_config=nf4_config,
    torch_dtype=torch.bfloat16,
)

pipe = SanaPipeline.from_pretrained(
    "Efficient-Large-Model/Sana_600M_1024px_diffusers",
    transformer=model_nf4,
    

    torch_dtype=torch.bfloat16,
    
)
pipe.to("cuda")

pipe.vae.to(torch.bfloat16)
pipe.text_encoder.to(torch.bfloat16)

prompt='Fernando Alonso winning the F1 championship with Ferrari'
image = pipe(
    prompt=prompt,
    height=1024,
    width=1024,
    guidance_scale=4.5,
    num_inference_steps=50,
    generator=torch.Generator(device="cuda").manual_seed(42),
)[0]

image[0].save("generated_images/sana/ferrari.png")


Loading checkpoint shards: 100%|██████████| 2/2 [00:00<00:00, 12.55it/s]
Loading pipeline components...: 100%|██████████| 5/5 [00:00<00:00,  5.92it/s]

Setting `clean_caption=True` requires the ftfy library but it was not found in your environment. Checkout the instructions on the
installation section: https://github.com/rspeer/python-ftfy/tree/master#installing and follow the ones
that match your environment. Please note that you may need to restart your runtime after installation.

Setting `clean_caption` to False...

Setting `clean_caption=True` requires the ftfy library but it was not found in your environment. Checkout the instructions on the
installation section: https://github.com/rspeer/python-ftfy/tree/master#installing and follow the ones
that match your environment. Please note that you may need to restart your runtime after installation.

Setting `clean_caption` to False...
100%|██████████| 50/50 [00:04<00:00, 12.12it/s]


In [6]:
import torch
from diffusers import DiffusionPipeline
from huggingface_hub import login

login(token="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")

model_id="dalle-mini/dalle-mega"


pipe = DiffusionPipeline.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16
)
pipe.text_encoder.to(torch.bfloat16)
pipe.vae.to(torch.bfloat16)
pipe.transformer.to(torch.bfloat16)
pipeline.enable_model_cpu_offload()




prompt='Fernando Alonso winning the F1 championship with Ferrari'
image = pipe(
    prompt=prompt,
    height=1024,
    width=1024,
    guidance_scale=4.5,
    num_inference_steps=50,
    generator=torch.Generator(device="cuda").manual_seed(42),
)[0]

image[0].save("sana/ferrari.png")


EntryNotFoundError: 404 Client Error. (Request ID: Root=1-67b88167-3e2f5c032dc46a485b42972f;08eaf198-c495-4ac8-9c3c-2154ddef17b0)

Entry Not Found for url: https://huggingface.co/dalle-mini/dalle-mega/resolve/main/model_index.json.