HunyuanImage2.1
Collection
HunyuanImage-2.1: An Efficient Diffusion Model for High-Resolution (2K) Text-to-Image Generation — https://github.com/Tencent-Hunyuan/HunyuanImage-2.1
•
3 items
•
Updated
from diffusers import HunyuanImagePipeline
import torch
# Basic usage: load the pipeline, generate a single 2048x2048 image from a
# text prompt with a fixed seed, and write it to disk.
device = "cuda:0"
dtype = torch.bfloat16
repo = "hunyuanvideo-community/HunyuanImage-2.1-Diffusers"

# Load the weights in bfloat16 and place the pipeline on the target device.
pipe = HunyuanImagePipeline.from_pretrained(repo, torch_dtype=dtype).to(device)

prompt = (
    "A cute, cartoon-style anthropomorphic penguin plush toy with fluffy fur, "
    "standing in a painting studio, wearing a red knitted scarf and a red beret "
    "with the word “Tencent” on it, holding a paintbrush with a focused "
    "expression as it paints an oil painting of the Mona Lisa, rendered in a "
    "photorealistic photographic style."
)

# Generator created on the same device as the pipeline, seeded with a fixed value.
generator = torch.Generator(device=device)
generator.manual_seed(649151)

result = pipe(
    prompt,
    num_inference_steps=50,
    height=2048,
    width=2048,
    generator=generator,
)

# Keep only the first image of the returned batch.
out = result.images[0]
out.save("test_hyimage_output.png")
To use a different guidance_scale, replace the pipeline's guider before calling it:
# Variant run: same prompt, seed and resolution as before, but with the
# pipeline's guider replaced by one created via guider.new(guidance_scale=5.0).
pipe.guider = pipe.guider.new(guidance_scale=5.0)

prompt = (
    "A cute, cartoon-style anthropomorphic penguin plush toy with fluffy fur, "
    "standing in a painting studio, wearing a red knitted scarf and a red beret "
    "with the word “Tencent” on it, holding a paintbrush with a focused "
    "expression as it paints an oil painting of the Mona Lisa, rendered in a "
    "photorealistic photographic style."
)

# Fresh generator with the same fixed seed as the first run.
generator = torch.Generator(device=device)
generator.manual_seed(649151)

# Sampling arguments collected in one place, then forwarded to the pipeline.
sampling_kwargs = {
    "num_inference_steps": 50,
    "height": 2048,
    "width": 2048,
    "generator": generator,
}
result = pipe(prompt, **sampling_kwargs)

# Keep only the first image of the returned batch.
out = result.images[0]
out.save("test_hyimage_output_guidnce_scale_5.0.png")