pytorch diffusers text-to-image

Chinese Latent Diffusion Model

我们开源了适配 alibaba-pai/pai-diffusion-general-large-zh 模型的 ControlNet:以输入图像的深度(Depth)特征作为控制条件,实现可控的图像生成。

from diffusers import StableDiffusionControlNetPipeline, ControlNetModel
from diffusers.utils import load_image


# Load the depth ControlNet and attach it to the Chinese base diffusion model.
controlnet_id = "alibaba-pai/pai-diffusion-general-large-zh-controlnet-depth"
controlnet = ControlNetModel.from_pretrained(controlnet_id)
model_id = "alibaba-pai/pai-diffusion-general-large-zh"
pipe = StableDiffusionControlNetPipeline.from_pretrained(model_id, controlnet=controlnet)
# Inference runs on the GPU; a CUDA device must be available.
pipe = pipe.to("cuda")

# The original called `Image.open` without ever importing `Image` (NameError).
# `load_image` ships with diffusers and returns a PIL image ready for the pipeline.
depth_image = load_image("depth_image.png")
prompt = "雪地上的帐篷"
# Keep the conditioning input and the generated output under separate names.
result = pipe(prompt, image=depth_image).images[0]
result.save("result.png")