
Example of the idea... we start with a picture of a 'mountain', then we 'outpaint' by 126 pixels around the edge and resize back to the original image size. We then outpaint again by another 126 pixels... and repeat. You can see this for 8 frames using the stable diffusion 1.0 model.


Zooming with Outpainting


In this little article, we'll have fun with the 'stable diffusion' (sd) library for creating an infinite zoom effect - from nothing more than a single starting image (and a description)!

If you've not heard of 'stable diffusion' - it's one of those AI libraries that allow you to replace or modify images using a trained neural network (when I say 'trained' ... I mean trained on millions of images). In this article, we're going to use this feature to 'extend' an image repeatedly.

The feature of 'extending' (or uncropping) a picture is known as 'outpainting' - it's termed this because the model is 'painting' (or repainting) parts of the image. It's a really cool tool - and very customizable - you can tell the model which areas to fill in and which areas to leave unchanged. For our zooming example, we want the model to paint the edges of the image (not the middle)... we define this using an image mask.

Take a look at the following example: we start with a small picture of a 'head' - we then create a mask for the outer edge (the area to be painted) - this is what we want our model to fill in - and we get the final image on the right. To prevent the generated images from being crazy, we also add a 'prompt' to help guide the model - in the example image below we specify an office-like scene.


Outpainting an image - taking an image and a mask - mask helps the stable diffusion model know what to replace and what to leave alone.
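As a minimal sketch of that idea (PIL only, with hypothetical file names and border size) - the mask is simply a greyscale image where white marks the area the model is allowed to paint and black marks the pixels to keep:

from PIL import Image, ImageDraw

border = 64                                    # hypothetical: how much to outpaint on each side
src = Image.open("head.jpg").convert("RGB")    # hypothetical input image
w, h = src.size

# Larger canvas with the original pasted in the middle
canvas = Image.new("RGB", (w + 2 * border, h + 2 * border), (255, 255, 255))
canvas.paste(src, (border, border))

# Mask: white (255) = repaint, black (0) = keep
mask = Image.new("L", canvas.size, 255)        # start fully white (paint everywhere)
ImageDraw.Draw(mask).rectangle(
    [border, border, border + w, border + h], fill=0)  # protect the original centre

canvas.save("canvas.png")
mask.save("mask.png")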


You might be thinking - this is old news - stable diffusion has been around for ages... what does this have to do with zooming?

Well, we can take this concept further - and keep applying the 'outpainting' effect repeatedly .... outpainting more and more and more - to create the illusion that we're moving outwards - away from the target.


Setting up (Sandpit)


This isn't a theory article - it's a hands-on, 'how-to' approach. First thing, let's set up a sandpit so we can install any Python libraries or tools. I'd recommend using Anaconda - so you can have multiple projects and library versions and they won't interfere with one another.

For this implementation, we're going to create the outpainting images repeatedly in a loop - which will be used to create a 'video' - so you can see the zoom effect over multiple frames.

The different outpainting (or inpainting) models perform differently as you'll see - the quality and 'smoothness' of the generated images vary.

To set up a working sandpit in Anaconda with all the libraries, we'll define an environment.yml below. I've done a 'cpu' version by default - and commented out at the bottom are a few extra lines... so you can try this out even if you don't have a high-spec GPU.

You can test the zooming out effect on your local computer - even if you don't have CUDA support.

# conda env create -f environment.yml
# conda activate sd-zoomoutpaint
# conda deactivate
# conda env remove --name sd-zoomoutpaint

name: sd-zoomoutpaint
channels:
  - pytorch
  - conda-forge
  - defaults
dependencies:
  - python=3.10
  - pytorch=2.3.0
  - torchvision
  - torchaudio
  - pip
  - pip:
    - diffusers==0.27.2
    - transformers==4.41.0
    - accelerate==0.30.1
    - safetensors==0.4.3
    - pillow>=10.0.0
    - matplotlib>=3.7.0
    - opencv-python>=4.8.0
    - huggingface-hub==0.25.2
    - imageio[ffmpeg]  # so we can create videos

# GPU ADDITIONS
# Check cuda/gpu details using 'nvidia-smi'
# pip uninstall torch torchvision torchaudio -y
# pip install torch==2.3.0 torchvision==0.18.0 torchaudio==2.3.0 --index-url https://download.pytorch.org/whl/cu121 --force-reinstall
# pip uninstall numpy
# pip install numpy==1.23.5


If you do have an appropriate GPU - it just means you can generate a video in a few minutes instead of a few hours ;)

The environment will work for the following models:

• "runwayml/stable-diffusion-inpainting"
• "kandinsky-community/kandinsky-2-2-decoder-inpaint"
• "stabilityai/stable-diffusion-xl-inpainting-1.0"


Basic 'Outpainting' Implementation Example


Just to give you an idea of how easy it is to set up and run an outpainting algorithm - here's a minimal working example - it can be used as a test to make sure everything is set up and working. It just 'outpaints' a single image and saves it to a file.

# Taken from 101 Generative AI Projects
# https://xbdev.net/ai/101generativeaiprojects/

import torch
from PIL import Image

print(torch.__version__)          # Should show '2.3.0+cu121'
print(torch.cuda.is_available())  # Should return True
print(torch.version.cuda)         # Should show '12.1'

# One-line device detection **GPU** or **CPU**
device = "cuda" if all([
    torch.cuda.is_available(),                                              # GPU exists
    f"cu{(torch.version.cuda or '').replace('.','')}" in torch.__version__  # Version matches (e.g., cu121)
]) else "cpu"

print(f"Using device: {device}")

from diffusers import StableDiffusionInpaintPipeline

# Load image
image = Image.open("input.jpg").convert("RGB")
width, height = image.size

# Expand canvas (extra space on the right) and create mask
new_width  = width + 512
new_height = height
canvas = Image.new("RGB", (new_width, height), (255, 255, 255))
canvas.paste(image, (0, 0))

# Mask: white (255) marks the new area to be outpainted
mask = Image.new("L", (new_width, height), 0)
for x in range(width, new_width):
    for y in range(height):
        mask.putpixel((x, y), 255)

# Load pipeline
pipe = StableDiffusionInpaintPipeline.from_pretrained(
    "runwayml/stable-diffusion-inpainting",
    torch_dtype=torch.float16 if device == "cuda" else torch.float32,
    variant="fp16" if device == "cuda" else None,
    safety_checker=None,  # Optional: disable safety checker for faster inference
).to(device)

# Generate
# prompt = "a mountain landscape continuing to the right"
prompt = "trees"

result = pipe(prompt=prompt,
              image=canvas,
              mask_image=mask,
              width=new_width,         # Explicitly set output dimensions
              height=new_height,
              num_inference_steps=50,  # Try 50-100 if needed
              # strength=0.999,        # Force full replacement
              guidance_scale=9.0,      # Stronger prompt adherence
              ).images[0]
result.save("outpainted_result.png")


Next, we'll modify this so instead of creating a single image, we'll create multiple images in a loop - and construct a 'video'.


Zooming (Multiple Outpainting) - Feedback Loop


This is where we get into the zooming! We take the concept of outpainting above - but we now feed the generated (outpainted) image back in as the input (a feedback loop).

To prevent the images from growing and growing .... until they get too big and our system crashes - we do a bit of resizing so the image getting passed back as the new input has the same size as the original starting image.

A few things about the implementation - we specify the number of frames (how many images to generate), how 'thick' the mask should be around the edge (how much the image should grow)... we also add in a 'blur' on the edge of the mask to make the 'transition' smoother - to try and avoid any 'harsh' edges.


An overview of the algorithm - how we use outpainting to generate a set of images which can be combined to create a zoom out video.


The complete implementation is given below.

import os
from PIL import Image
import torch
import imageio  # pip install imageio[ffmpeg]

# Device setup
device = "cuda" if all([
    torch.cuda.is_available(),
    f"cu{(torch.version.cuda or '').replace('.','')}" in torch.__version__
]) else "cpu"
print(f"Using device: {device}")

# Pipelines - Pick one
if False:
    from diffusers import StableDiffusionInpaintPipeline
    pipe = StableDiffusionInpaintPipeline.from_pretrained(
        "runwayml/stable-diffusion-inpainting",
        torch_dtype=torch.float16 if device == "cuda" else torch.float32,
        variant="fp16" if device == "cuda" else None,
        safety_checker=None,
    ).to(device)

if False:
    from diffusers import StableDiffusionXLInpaintPipeline
    pipe = StableDiffusionXLInpaintPipeline.from_pretrained(
        "stabilityai/stable-diffusion-xl-inpainting-1.0",
        torch_dtype=torch.float16 if device == "cuda" else torch.float32,
        # variant="fp16" if device == "cuda" else None,
        safety_checker=None,
    ).to(device)

if True:
    from diffusers import AutoPipelineForInpainting
    pipe = AutoPipelineForInpainting.from_pretrained(
        "kandinsky-community/kandinsky-2-2-decoder-inpaint",
        torch_dtype=torch.float16 if device == "cuda" else torch.float32,
        # variant="fp16" if device == "cuda" else None,
        safety_checker=None,
    ).to(device)

# Parameters
# prompt = "outdoor landscape surrounding the scene"
prompt = "mountains, trees, grass, clouds, fields, hills, rocks, plants"
image_path = "input.jpg"
num_frames = 128
expand_size = 64

frames = []

# Load initial image
base_image = Image.open(image_path).convert("RGB")

# Resize so that after outpainting the expanded canvas is 512x512
base_image = base_image.resize((512 - expand_size * 2, 512 - expand_size * 2))
output_size = base_image.size

output_folder = "frames3"
os.makedirs(output_folder, exist_ok=True)

for i in range(num_frames):
    # Expand canvas
    new_width  = base_image.width + expand_size * 2
    new_height = base_image.height + expand_size * 2
    canvas = Image.new("RGB", (new_width, new_height), (255, 255, 255))
    canvas.paste(base_image, (expand_size, expand_size))

    # Mask surrounding edges
    if True:
        from PIL import ImageDraw, ImageFilter

        # Create mask with feathered edges
        mask = Image.new("L", (new_width, new_height), 0)
        draw = ImageDraw.Draw(mask)

        # Draw white rectangles around the edges to define the outpaint region
        draw.rectangle([0, 0, new_width, expand_size], fill=255)                                # Top
        draw.rectangle([0, new_height - expand_size - 2, new_width, new_height + 4], fill=255)  # Bottom
        draw.rectangle([0, 0, expand_size, new_height], fill=255)                               # Left
        draw.rectangle([new_width - expand_size, 0, new_width, new_height], fill=255)           # Right

        # Apply Gaussian blur to feather the transition
        mask = mask.filter(ImageFilter.GaussianBlur(radius=20))

    print('i:', i, 'new_width:', new_width, 'new_height:', new_height)

    # Outpaint
    result = pipe(
        prompt=prompt,
        negative_prompt='frame, pictures, edge, border, caption, text, white border, solid border, solid color',
        image=canvas,
        mask_image=mask,
        width=new_width,
        height=new_height,
        num_inference_steps=50,
        guidance_scale=9.0,
    ).images[0]

    # Scale back down to the original output size
    scaled = result.resize(output_size, resample=Image.LANCZOS)

    # Save the full-size outpainted frame
    frame_path = os.path.join(output_folder, f"frame_{i:03}.png")
    result.save(frame_path)
    frames.append(frame_path)

    # Use the (rescaled) outpainted image as the next base
    base_image = scaled

# Save frames as video
video_output = "zoom_out3.mp4"
with imageio.get_writer(video_output, fps=4) as writer:
    for frame_file in frames:
        writer.append_data(imageio.imread(frame_file))

print(f"Zoom-out animation saved to {video_output}")



Stable Diffusion 1.0


We start with the simple SD 1.0 model (i.e., "runwayml/stable-diffusion-inpainting") - it's fast and a good starting point. For our zooming test, we'll use the following criteria:

• SD 1.0
• 128 frames (4 frames per second video)
• Mask border size: 128
• Input image size: 512x512
• Generated image size: 512x512
• Prompt: "outdoor landscape surrounding the scene"
• No negative prompt

This is the result from the first run:


Preview of the generated video (few of the frames) for the SD.1.0 model (v1).


On a second run, we get something else:


Preview of the generated video (few of the frames) for the SD.1.0 model (v2).
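Incidentally, the run-to-run variation comes from the random noise the diffusion process starts from. If you want repeatable results, you can pass a seeded generator into the pipeline call - a minimal sketch (the generator argument is standard across the diffusers pipelines; the other variables come from the loop above):

import torch

# Fix the starting noise so repeated runs produce the same frames
generator = torch.Generator(device=device).manual_seed(1234)

result = pipe(
    prompt=prompt,
    image=canvas,
    mask_image=mask,
    width=new_width,
    height=new_height,
    generator=generator,   # seeded noise -> reproducible output
).images[0]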



kandinsky-2-2 Model


The kandinsky-2-2 is a good test model and produces very different results.

• kandinsky-2-2 ("kandinsky-community/kandinsky-2-2-decoder-inpaint")
• 128 frames
• Mask border size: 64
• Input image size: 512x512
• Generated image size: 512x512
• Prompt: "mountains, trees, grass, clouds, fields, hills, rocks, plants"
• Negative prompt: 'frame, pictures, edge, border, caption, text, white border, solid border, solid color'


Preview of the generated video (few of the frames) for the kandinsky model.



SDXL Model


The SDXL model allows you to create larger, better-quality images - however, I found it a bit more temperamental than the previous two models.

• SDXL ("stabilityai/stable-diffusion-xl-inpainting-1.0")
• 128 frames
• Mask border size: 64
• Input image size: 512x512
• Generated image size: 768x768
• Prompt: "mountains, trees, grass, clouds, fields, hills, rocks, plants"
• Negative prompt: none


Preview of the generated video (few of the frames) for the SDXL model.


Stable Diffusion XL Outpainting + Noise


The outpainting algorithm works fine with a mask and the original image (with the masked areas set to 'black' or 'white')... however, the SDXL model is a bit more sensitive - and needs a little kick to help it converge on a pattern.

We need to insert 'noise' into the masked areas of the image that are going to be painted - otherwise you'll find that the masked region converges to solid colors (e.g., a white or solid-colored edge) instead of outpainting new image content all the way to the edge of the image (or mask).


Insert Noise to help the SDXL outpainting algorithm.


Adding noise isn't too difficult - it only takes an extra line or two - however, without it you might find SDXL behaving a bit strangely.

Fill the new canvas with random RGB values (instead of a solid color):

import numpy as np
random_array = np.random.randint(0, 256, (new_height, new_width, 3), dtype=np.uint8)
canvas = Image.fromarray(random_array, "RGB")
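In context, the only change to the frame loop is how the canvas is initialised before the previous frame is pasted back into the centre - a small sketch using the variables from the loop above (numpy is already pulled into the environment as a dependency of opencv-python):

import numpy as np
from PIL import Image

# Noise-filled canvas instead of a flat white one
random_array = np.random.randint(0, 256, (new_height, new_width, 3), dtype=np.uint8)
canvas = Image.fromarray(random_array, "RGB")

# Paste the previous frame back into the centre - the masked border stays as noise,
# giving SDXL something to latch onto instead of converging to a solid colour
canvas.paste(base_image, (expand_size, expand_size))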



"white-border" Issue


Sometimes the outpainted image didn't seem right - it kept adding 'picture' frames and white bars - or the image didn't transition smoothly and looked fragmented or scattered. This was because the image had a small single white line of pixels at the bottom... and the mask was only going up to the edge of the image (with a bit of blur). The blur reduced the effect - but every now and then it produced a poor result! Eventually this was tracked down to the test image (it didn't go right up to the edge on all sides).

There are two ways of fixing this - edit and resize the image, or have the 'mask' overlap the image borders by something like 5% of the image size. That way, even if the image is a bit rough or abrupt around the edges, it will still produce a smooth transition.
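As a sketch of the second fix - growing the mask rectangles so they overlap the pasted image by roughly 5% of its size (variable names follow the loop code above; the exact overlap is a judgement call):

# Let the mask eat slightly into the pasted image, so a stray line of pixels
# on the image border gets repainted rather than copied outwards
overlap = int(0.05 * base_image.width)   # ~5% of the image size

draw.rectangle([0, 0, new_width, expand_size + overlap], fill=255)                        # Top
draw.rectangle([0, new_height - expand_size - overlap, new_width, new_height], fill=255)  # Bottom
draw.rectangle([0, 0, expand_size + overlap, new_height], fill=255)                       # Left
draw.rectangle([new_width - expand_size - overlap, 0, new_width, new_height], fill=255)   # Right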


Resources


YouTube SD1 Model Version 1
YouTube SD1 Model Version 2
YouTube K Model
YouTube SDXL Model


Things to Try


This is only scratching the surface - and if you have a powerful GPU, you can really take this to new heights - and create complex videos with multiple prompts - instead of just the 'outdoors' you could be traveling through a city. Some examples you can try:

• Try zooming out from a 'planet' into the galaxy
• Try other models - I've only used 3 popular models that are free and easy to access on HuggingFace without any key or restrictions - but there are lots of other models you can try out to get other effects/results
• Mix multiple prompts so the prompt changes as you zoom out (see the sketch after this list)
• Try different resolutions
• Try adding a 'blur' effect to the edge of the transition (so it looks like you're moving very fast)
• Create a 'Quicksilver' type effect - put a 'dog' or another animated picture of a face in the middle of the screen - so you see the world flashing past.
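For the multi-prompt idea, one simple approach is to pick the prompt from the frame index - a hypothetical sketch (the schedule values are made up) that drops straight into the frame loop above:

# Hypothetical prompt schedule: (first frame it applies to, prompt text)
prompt_schedule = [
    (0,  "office desk, computer, books, coffee mug"),
    (32, "city street, buildings, cars, people"),
    (64, "mountains, trees, grass, clouds, fields"),
    (96, "planet seen from space, stars, galaxy"),
]

def prompt_for_frame(i):
    """Return the last scheduled prompt whose start frame is <= i."""
    current = prompt_schedule[0][1]
    for start, text in prompt_schedule:
        if i >= start:
            current = text
    return current

# Inside the loop:  prompt = prompt_for_frame(i)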



I'm not sure why, but the zooming out effect reminds me of the Quicksilver scene from X-Men - a classic moment is when he grabs the dog and you see the world rush past in the background while he's carrying the dog.










