KevinNg99 committed on
Commit
23c68ff
·
1 Parent(s): b9ad1cd

default shift

Browse files
app.py CHANGED
@@ -264,6 +264,7 @@ class HunyuanImageApp:
264
  num_inference_steps=num_inference_steps,
265
  guidance_scale=guidance_scale,
266
  seed=seed,
 
267
  use_reprompt=use_reprompt,
268
  use_refiner=use_refiner
269
  )
 
264
  num_inference_steps=num_inference_steps,
265
  guidance_scale=guidance_scale,
266
  seed=seed,
267
+ shift=5,
268
  use_reprompt=use_reprompt,
269
  use_refiner=use_refiner
270
  )
hyimage/diffusion/pipelines/hunyuanimage_pipeline.py CHANGED
@@ -49,7 +49,7 @@ class HunyuanImagePipelineConfig:
49
  # Default guidance scale, will be overridden by the guidance_scale parameter in __call__
50
  default_guidance_scale: float = 3.5
51
  # Inference shift
52
- shift: int = 4
53
  torch_dtype: str = "bf16"
54
  device: str = "cuda"
55
  version: str = ""
@@ -77,6 +77,9 @@ class HunyuanImagePipelineConfig:
77
  vae_config=HUNYUANIMAGE_V2_1_VAE_32x(),
78
  text_encoder_config=HUNYUANIMAGE_V2_1_TEXT_ENCODER(),
79
  reprompt_config=HUNYUANIMAGE_REPROMPT(),
 
 
 
80
  version=version,
81
  **kwargs
82
  )
@@ -587,8 +590,6 @@ class HunyuanImagePipeline:
587
  guidance_rescale=self.guidance_rescale,
588
  )
589
 
590
-
591
- noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond)
592
  return noise_pred
593
 
594
  def _decode_latents(self, latents, reorg_tokens=False):
@@ -699,7 +700,7 @@ class HunyuanImagePipeline:
699
  print(f"Guidance Scale: {guidance_scale}")
700
  print(f"CFG Mode: {self.cfg_mode}")
701
  print(f"Guidance Rescale: {self.guidance_rescale}")
702
- print(f"Shift: {self.shift}")
703
  print(f"Seed: {seed}")
704
  print(f"Use MeanFlow: {self.use_meanflow}")
705
  print(f"Use byT5: {self.use_byt5}")
 
49
  # Default guidance scale, will be overridden by the guidance_scale parameter in __call__
50
  default_guidance_scale: float = 3.5
51
  # Inference shift
52
+ shift: int = 5
53
  torch_dtype: str = "bf16"
54
  device: str = "cuda"
55
  version: str = ""
 
77
  vae_config=HUNYUANIMAGE_V2_1_VAE_32x(),
78
  text_encoder_config=HUNYUANIMAGE_V2_1_TEXT_ENCODER(),
79
  reprompt_config=HUNYUANIMAGE_REPROMPT(),
80
+ shift=4 if use_distilled else 5,
81
+ default_guidance_scale=3.25 if use_distilled else 3.5,
82
+ default_sampling_steps=8 if use_distilled else 50,
83
  version=version,
84
  **kwargs
85
  )
 
590
  guidance_rescale=self.guidance_rescale,
591
  )
592
 
 
 
593
  return noise_pred
594
 
595
  def _decode_latents(self, latents, reorg_tokens=False):
 
700
  print(f"Guidance Scale: {guidance_scale}")
701
  print(f"CFG Mode: {self.cfg_mode}")
702
  print(f"Guidance Rescale: {self.guidance_rescale}")
703
+ print(f"Shift: {shift}")
704
  print(f"Seed: {seed}")
705
  print(f"Use MeanFlow: {self.use_meanflow}")
706
  print(f"Use byT5: {self.use_byt5}")