Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion docs/source/ko/tutorials/basic_training.md
Original file line number Diff line number Diff line change
Expand Up @@ -329,7 +329,7 @@ TensorBoard에 로깅, 그래디언트 누적 및 혼합 정밀도 학습을 쉽
... )

... # 각 타임스텝의 노이즈 크기에 따라 깨끗한 이미지에 노이즈를 추가합니다.
... # (이는 foward diffusion 과정입니다.)
... # (이는 forward diffusion 과정입니다.)
... noisy_images = noise_scheduler.add_noise(clean_images, noise, timesteps)

... with accelerator.accumulate(model):
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -703,7 +703,7 @@ def prepare_mask_latents(
)
masked_image_latents = masked_image_latents.repeat(batch_size // masked_image_latents.shape[0], 1, 1, 1)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
masked_image_latents = self._pack_latents(
masked_image_latents,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -350,7 +350,7 @@ def prepare_mask_latents(
torch.cat([masked_image_latents] * 2) if do_classifier_free_guidance else masked_image_latents
)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
return mask, masked_image_latents

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1068,7 +1068,7 @@ def forward(
Returns:
`tuple`: Returns relevant parts of the model's noise prediction: the first element of the tuple is tbe VAE
`tuple`: Returns relevant parts of the model's noise prediction: the first element of the tuple is the VAE
image embedding, the second element is the CLIP image embedding, and the third element is the CLIP text
embedding.
"""
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -681,7 +681,7 @@ def prepare_mask_latents(
masked_image_latents = torch.cat(new_mask_pixel_values, dim=0)
masked_image_latents = masked_image_latents * self.vae.config.scaling_factor

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
else:
masked_image_latents = None
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -766,7 +766,7 @@ def prepare_mask_latents(
)
masked_image_latents = masked_image_latents.repeat(batch_size // masked_image_latents.shape[0], 1, 1, 1)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
masked_image_latents = self._pack_latents(
masked_image_latents,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -666,7 +666,7 @@ def prepare_mask_latents(
)
masked_image_latents = masked_image_latents.repeat(batch_size // masked_image_latents.shape[0], 1, 1, 1)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
masked_image_latents = self._pack_latents(
masked_image_latents,
Expand Down
2 changes: 1 addition & 1 deletion src/diffusers/pipelines/flux/pipeline_flux_inpaint.py
Original file line number Diff line number Diff line change
Expand Up @@ -737,7 +737,7 @@ def prepare_mask_latents(
)
masked_image_latents = masked_image_latents.repeat(batch_size // masked_image_latents.shape[0], 1, 1, 1)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
masked_image_latents = self._pack_latents(
masked_image_latents,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -898,7 +898,7 @@ def prepare_mask_latents(
)
masked_image_latents = masked_image_latents.repeat(batch_size // masked_image_latents.shape[0], 1, 1, 1)

# aligning device to prevent device errors when concating it with the latent model input
# aligning device to prevent device errors when concatenating it with the latent model input
masked_image_latents = masked_image_latents.to(device=device, dtype=dtype)
masked_image_latents = self._pack_latents(
masked_image_latents,
Expand Down
2 changes: 1 addition & 1 deletion src/diffusers/pipelines/ltx2/pipeline_ltx2.py
Original file line number Diff line number Diff line change
Expand Up @@ -244,7 +244,7 @@ def __init__(
self.vae_temporal_compression_ratio = (
self.vae.temporal_compression_ratio if getattr(self, "vae", None) is not None else 8
)
# TODO: check whether the MEL compression ratio logic here is corrct
# TODO: check whether the MEL compression ratio logic here is correct
self.audio_vae_mel_compression_ratio = (
self.audio_vae.mel_compression_ratio if getattr(self, "audio_vae", None) is not None else 4
)
Expand Down
2 changes: 1 addition & 1 deletion src/diffusers/pipelines/ltx2/pipeline_ltx2_condition.py
Original file line number Diff line number Diff line change
Expand Up @@ -235,7 +235,7 @@ def rescale_noise_cfg(noise_cfg, noise_pred_text, guidance_rescale=0.0):

class LTX2ConditionPipeline(DiffusionPipeline, FromSingleFileMixin, LTX2LoraLoaderMixin):
r"""
Pipeline for video generation which allows image conditions to be inserted at arbitary parts of the video.
Pipeline for video generation which allows image conditions to be inserted at arbitrary parts of the video.
Reference: https://github.com/Lightricks/LTX-Video
Expand Down
2 changes: 1 addition & 1 deletion src/diffusers/pipelines/ltx2/pipeline_ltx2_image2video.py
Original file line number Diff line number Diff line change
Expand Up @@ -247,7 +247,7 @@ def __init__(
self.vae_temporal_compression_ratio = (
self.vae.temporal_compression_ratio if getattr(self, "vae", None) is not None else 8
)
# TODO: check whether the MEL compression ratio logic here is corrct
# TODO: check whether the MEL compression ratio logic here is correct
self.audio_vae_mel_compression_ratio = (
self.audio_vae.mel_compression_ratio if getattr(self, "audio_vae", None) is not None else 4
)
Expand Down
2 changes: 1 addition & 1 deletion src/diffusers/pipelines/pipeline_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -759,7 +759,7 @@ def from_pretrained(cls, pretrained_model_name_or_path: str | os.PathLike, **kwa
>>> pipeline.scheduler = scheduler
```
"""
# Copy the kwargs to re-use during loading connected pipeline.
# Copy the kwargs to reuse during loading connected pipeline.
kwargs_copied = kwargs.copy()

cache_dir = kwargs.pop("cache_dir", None)
Expand Down
Loading