extra insurance in case eos id is not there

address https://github.com/lucidrains/DALLE2-pytorch/issues/266
bug fix cosine annealing optimizer in prior trainer (#262)
2026-02-23 18:14:21 +01:00 · 2022-12-15 10:54:21 -08:00 · 2022-11-23 08:41:25 -08:00 · 2022-11-11 12:15:13 -08:00 · 2022-11-07 16:19:08 -08:00 · 2022-11-07 15:44:36 -08:00
5 changed files with 13 additions and 4 deletions
--- a/dalle2_pytorch/dalle2_pytorch.py
+++ b/dalle2_pytorch/dalle2_pytorch.py
@@ -360,6 +360,7 @@ class OpenAIClipAdapter(BaseClipAdapter):
        is_eos_id = (text == self.eos_id)
        text_mask_excluding_eos = is_eos_id.cumsum(dim = -1) == 0
        text_mask = F.pad(text_mask_excluding_eos, (1, -1), value = True)
        text_mask = text_mask & (text != 0)
        assert not self.cleared
        text_embed = self.clip.encode_text(text)
@@ -434,6 +435,7 @@ class OpenClipAdapter(BaseClipAdapter):
        is_eos_id = (text == self.eos_id)
        text_mask_excluding_eos = is_eos_id.cumsum(dim = -1) == 0
        text_mask = F.pad(text_mask_excluding_eos, (1, -1), value = True)
        text_mask = text_mask & (text != 0)
        assert not self.cleared
        text_embed = self.clip.encode_text(text)
@@ -629,7 +631,7 @@ class NoiseScheduler(nn.Module):
    def calculate_v(self, x_start, t, noise = None):
        return (
-            extract(self.sqrt_alphas_cumprod, t, x_start.shape) * noise +
+            extract(self.sqrt_alphas_cumprod, t, x_start.shape) * noise -
            extract(self.sqrt_one_minus_alphas_cumprod, t, x_start.shape) * x_start
        )
@@ -1320,7 +1322,7 @@ class DiffusionPrior(nn.Module):
            elif self.predict_x_start:
                x_start = pred
            else:
-                x_start = self.noise_scheduler.predict_start_from_noise(image_embed, t = time_cond, noise = pred_noise)
+                x_start = self.noise_scheduler.predict_start_from_noise(image_embed, t = time_cond, noise = pred)
            # clip x0 before maybe predicting noise
--- a/dalle2_pytorch/train_configs.py
+++ b/dalle2_pytorch/train_configs.py
@@ -4,11 +4,13 @@ from pydantic import BaseModel, validator, root_validator
 from typing import List, Optional, Union, Tuple, Dict, Any, TypeVar
 from x_clip import CLIP as XCLIP
 from open_clip import list_pretrained
 from coca_pytorch import CoCa
 from dalle2_pytorch.dalle2_pytorch import (
    CoCaAdapter,
    OpenAIClipAdapter,
    OpenClipAdapter,
    Unet,
    Decoder,
    DiffusionPrior,
@@ -117,6 +119,10 @@ class AdapterConfig(BaseModel):
    def create(self):
        if self.make == "openai":
            return OpenAIClipAdapter(self.model)
        elif self.make == "open_clip":
            pretrained = dict(list_pretrained())
            checkpoint = pretrained[self.model]
            return OpenClipAdapter(name=self.model, pretrained=checkpoint)
        elif self.make == "x-clip":
            return XClipAdapter(XCLIP(**self.base_model_kwargs))
        elif self.make == "coca":
--- a/dalle2_pytorch/trainer.py
+++ b/dalle2_pytorch/trainer.py
@@ -236,7 +236,7 @@ class DiffusionPriorTrainer(nn.Module):
        )
        if exists(cosine_decay_max_steps):
-            self.scheduler = CosineAnnealingLR(optimizer, T_max = cosine_decay_max_steps)
+            self.scheduler = CosineAnnealingLR(self.optimizer, T_max = cosine_decay_max_steps)
        else:
            self.scheduler = LambdaLR(self.optimizer, lr_lambda = lambda _: 1.0)
--- a/dalle2_pytorch/version.py
+++ b/dalle2_pytorch/version.py
@@ -1 +1 @@
-__version__ = '1.11.0'
+__version__ = '1.11.4'
--- a/setup.py
+++ b/setup.py
@@ -26,6 +26,7 @@ setup(
  install_requires=[
    'accelerate',
    'click',
    'open-clip-torch>=2.0.0,<3.0.0',
    'clip-anytorch>=2.4.0',
    'coca-pytorch>=0.0.5',
    'ema-pytorch>=0.0.7',
Author	SHA1	Message	Date
Phil Wang	683dd98b96	extra insurance in case eos id is not there	2022-12-15 10:54:21 -08:00
Phil Wang	067ac323da	address https://github.com/lucidrains/DALLE2-pytorch/issues/266	2022-11-23 08:41:25 -08:00
zion	91c8d1ca13	bug fix cosine annealing optimizer in prior trainer (#262)	2022-11-11 12:15:13 -08:00
zion	08238a7200	depend on open-clip-torch (#261) — fix the previous commit, which assumes open_clip is installed	2022-11-07 16:19:08 -08:00
zion	7166ad6711	add open clip to train_config (#260) — add the ability to use open_clip in the train configs (useful for the new SOTA h/14 model)	2022-11-07 15:44:36 -08:00
Phil Wang	fbba0f9aaf	bring in prediction of v objective, combining the findings from progressive distillation paper and imagen-video to the eventual extension of dalle2 to make-a-video	2022-10-28 18:21:07 -07:00
`@@ -1 +1 @@`
	`__version__ = '1.11.0'`	`__version__ = '1.11.4'`