Spaces:
Running
on
A100
default shift
Browse files
app.py
CHANGED
@@ -264,6 +264,7 @@ class HunyuanImageApp:
|
|
264 |
num_inference_steps=num_inference_steps,
|
265 |
guidance_scale=guidance_scale,
|
266 |
seed=seed,
|
|
|
267 |
use_reprompt=use_reprompt,
|
268 |
use_refiner=use_refiner
|
269 |
)
|
|
|
264 |
num_inference_steps=num_inference_steps,
|
265 |
guidance_scale=guidance_scale,
|
266 |
seed=seed,
|
267 |
+
shift=5,
|
268 |
use_reprompt=use_reprompt,
|
269 |
use_refiner=use_refiner
|
270 |
)
|
hyimage/diffusion/pipelines/hunyuanimage_pipeline.py
CHANGED
@@ -49,7 +49,7 @@ class HunyuanImagePipelineConfig:
|
|
49 |
# Default guidance scale, will be overridden by the guidance_scale parameter in __call__
|
50 |
default_guidance_scale: float = 3.5
|
51 |
# Inference shift
|
52 |
-
shift: int =
|
53 |
torch_dtype: str = "bf16"
|
54 |
device: str = "cuda"
|
55 |
version: str = ""
|
@@ -77,6 +77,9 @@ class HunyuanImagePipelineConfig:
|
|
77 |
vae_config=HUNYUANIMAGE_V2_1_VAE_32x(),
|
78 |
text_encoder_config=HUNYUANIMAGE_V2_1_TEXT_ENCODER(),
|
79 |
reprompt_config=HUNYUANIMAGE_REPROMPT(),
|
|
|
|
|
|
|
80 |
version=version,
|
81 |
**kwargs
|
82 |
)
|
@@ -587,8 +590,6 @@ class HunyuanImagePipeline:
|
|
587 |
guidance_rescale=self.guidance_rescale,
|
588 |
)
|
589 |
|
590 |
-
|
591 |
-
noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond)
|
592 |
return noise_pred
|
593 |
|
594 |
def _decode_latents(self, latents, reorg_tokens=False):
|
@@ -699,7 +700,7 @@ class HunyuanImagePipeline:
|
|
699 |
print(f"Guidance Scale: {guidance_scale}")
|
700 |
print(f"CFG Mode: {self.cfg_mode}")
|
701 |
print(f"Guidance Rescale: {self.guidance_rescale}")
|
702 |
-
print(f"Shift: {
|
703 |
print(f"Seed: {seed}")
|
704 |
print(f"Use MeanFlow: {self.use_meanflow}")
|
705 |
print(f"Use byT5: {self.use_byt5}")
|
|
|
49 |
# Default guidance scale, will be overridden by the guidance_scale parameter in __call__
|
50 |
default_guidance_scale: float = 3.5
|
51 |
# Inference shift
|
52 |
+
shift: int = 5
|
53 |
torch_dtype: str = "bf16"
|
54 |
device: str = "cuda"
|
55 |
version: str = ""
|
|
|
77 |
vae_config=HUNYUANIMAGE_V2_1_VAE_32x(),
|
78 |
text_encoder_config=HUNYUANIMAGE_V2_1_TEXT_ENCODER(),
|
79 |
reprompt_config=HUNYUANIMAGE_REPROMPT(),
|
80 |
+
shift=4 if use_distilled else 5,
|
81 |
+
default_guidance_scale=3.25 if use_distilled else 3.5,
|
82 |
+
default_sampling_steps=8 if use_distilled else 50,
|
83 |
version=version,
|
84 |
**kwargs
|
85 |
)
|
|
|
590 |
guidance_rescale=self.guidance_rescale,
|
591 |
)
|
592 |
|
|
|
|
|
593 |
return noise_pred
|
594 |
|
595 |
def _decode_latents(self, latents, reorg_tokens=False):
|
|
|
700 |
print(f"Guidance Scale: {guidance_scale}")
|
701 |
print(f"CFG Mode: {self.cfg_mode}")
|
702 |
print(f"Guidance Rescale: {self.guidance_rescale}")
|
703 |
+
print(f"Shift: {shift}")
|
704 |
print(f"Seed: {seed}")
|
705 |
print(f"Use MeanFlow: {self.use_meanflow}")
|
706 |
print(f"Use byT5: {self.use_byt5}")
|