mirror of
https://github.com/lucidrains/DALLE2-pytorch.git
synced 2025-12-19 17:54:20 +01:00
Use eval vs. training mode to determine whether the trainer's forward pass calls backward (backprop)
This commit is contained in:
@@ -279,6 +279,8 @@ class DiffusionPriorTrainer(nn.Module):
|
|||||||
loss = loss * chunk_size_frac
|
loss = loss * chunk_size_frac
|
||||||
|
|
||||||
total_loss += loss.item()
|
total_loss += loss.item()
|
||||||
|
|
||||||
|
if self.training:
|
||||||
self.scaler.scale(loss).backward()
|
self.scaler.scale(loss).backward()
|
||||||
|
|
||||||
return total_loss
|
return total_loss
|
||||||
@@ -406,6 +408,8 @@ class DecoderTrainer(nn.Module):
|
|||||||
loss = loss * chunk_size_frac
|
loss = loss * chunk_size_frac
|
||||||
|
|
||||||
total_loss += loss.item()
|
total_loss += loss.item()
|
||||||
|
|
||||||
|
if self.training:
|
||||||
self.scale(loss, unet_number = unet_number).backward()
|
self.scale(loss, unet_number = unet_number).backward()
|
||||||
|
|
||||||
return total_loss
|
return total_loss
|
||||||
|
|||||||
Reference in New Issue
Block a user