mirror of
https://github.com/huggingface/diffusers.git
synced 2026-01-29 07:22:12 +03:00
use dn6 attn mask + fix true_cfg_scale
This commit is contained in:
@@ -232,9 +232,14 @@ class ChromaPipeline(
|
||||
prompt_embeds = self.text_encoder(
|
||||
text_input_ids.to(device),
|
||||
output_hidden_states=False,
|
||||
#attention_mask=(text_inputs.attention_mask.to(device),),
|
||||
attention_mask=text_inputs.attention_mask.to(device),
|
||||
)[0]
|
||||
|
||||
max_len = min(text_inputs.attention_mask.sum() + 1, max_sequence_length)
|
||||
prompt_embeds = prompt_embeds[
|
||||
:, :max_len
|
||||
]
|
||||
|
||||
dtype = self.text_encoder.dtype
|
||||
prompt_embeds = prompt_embeds.to(dtype=dtype, device=device)
|
||||
|
||||
@@ -554,7 +559,7 @@ class ChromaPipeline(
|
||||
instead.
|
||||
negative_prompt (`str` or `List[str]`, *optional*):
|
||||
The prompt or prompts not to guide the image generation. If not defined, one has to pass
|
||||
`negative_prompt_embeds` instead. Ignored when not using guidance (i.e., ignored if `true_cfg_scale` is
|
||||
`negative_prompt_embeds` instead. Ignored when not using guidance (i.e., ignored if `guidance_scale` is
|
||||
not greater than `1`).
|
||||
height (`int`, *optional*, defaults to self.unet.config.sample_size * self.vae_scale_factor):
|
||||
The height in pixels of the generated image. This is set to 1024 by default for the best results.
|
||||
@@ -794,7 +799,7 @@ class ChromaPipeline(
|
||||
joint_attention_kwargs=self.joint_attention_kwargs,
|
||||
return_dict=False,
|
||||
)[0]
|
||||
noise_pred = neg_noise_pred + true_cfg_scale * (noise_pred - neg_noise_pred)
|
||||
noise_pred = neg_noise_pred + guidance_scale * (noise_pred - neg_noise_pred)
|
||||
|
||||
# compute the previous noisy sample x_t -> x_t-1
|
||||
latents_dtype = latents.dtype
|
||||
|
||||
Reference in New Issue
Block a user