File size: 882 Bytes
a63d2a4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
#from src.diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion_ldm3d_inpaint import StableDiffusionLDM3DInpaintPipeline

#pipeline = StableDiffusionLDM3DInpaintPipeline()
from src.diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion_ldm3d import StableDiffusionLDM3DPipeline
import numpy as np
from PIL import Image

# Load the pretrained LDM3D pipeline (downloads are cached in the local
# "cache" directory) and move it to the CUDA device.
pipe = StableDiffusionLDM3DPipeline.from_pretrained("Intel/ldm3d-4c", cache_dir="cache")
pipe = pipe.to("cuda")

# Run one text-to-image generation; the pipeline output exposes the RGB
# images and the matching depth maps as parallel sequences.
prompt = "a photo of an astronaut riding a horse on mars"
output = pipe(prompt, num_inference_steps=15)
rgb_image, depth_image = output.rgb, output.depth
rgb_image[0].save("output_rgb.jpg")
depth_image[0].save("output_depth.png")

# Derive a binary mask from the first depth map: pixels whose depth value is
# below the threshold become white (255), everything else black (0).
# NOTE(review): the threshold is a placeholder, and it presumably assumes a
# 16-bit depth map (values up to 65535) -- confirm against the pipeline.
DEPTH_THRESHOLD = 10000
depth_array = np.array(depth_image[0])  # convert once, reuse below
# Build the mask directly as 8-bit 0/255 so the result does not depend on how
# Pillow narrows 16-bit data when converting to mode "L".
mask_array = (depth_array < DEPTH_THRESHOLD).astype(np.uint8) * 255
# Keep the image object itself in `mask_image`; `Image.save()` returns None,
# so chaining it into the assignment would discard the mask.
mask_image = Image.fromarray(mask_array).convert("L")
mask_image.save("output_mask.png")