Fix gradient accumulation averaging

2025-08-31 11:54:37 +08:00 · 2024-10-10 02:45:26 -07:00 · 2024-10-10 02:45:26 -07:00 · fc88e3b0d0
commit fc88e3b0d0
parent 3c587ed618
1 changed file with 5 additions and 1 deletion
--- a/flux/dreambooth.py
+++ b/flux/dreambooth.py
@@ -274,7 +274,11 @@ if __name__ == "__main__":
        loss, grads = nn.value_and_grad(flux.flow, flux.training_loss)(
            x, t5_feat, clip_feat, guidance
        )
-        grads = tree_map(lambda a, b: a + b, prev_grads, grads)
+        grads = tree_map(
+            lambda a, b: (a + b) / args.grad_accumulate,
+            prev_grads,
+            grads,
+        )
        grads = average_gradients(grads)
        optimizer.update(flux.flow, grads)