Fix gradient accumulation averaging

2025-09-01 12:49:50 +08:00 · 2024-10-10 02:45:26 -07:00
parent 3c587ed618
commit fc88e3b0d0
1 changed file with 5 additions and 1 deletion
--- a/flux/dreambooth.py
+++ b/flux/dreambooth.py
@@ -274,7 +274,11 @@ if __name__ == "__main__":
        loss, grads = nn.value_and_grad(flux.flow, flux.training_loss)(
            x, t5_feat, clip_feat, guidance
        )
-        grads = tree_map(lambda a, b: a + b, prev_grads, grads)
+        grads = tree_map(
+            lambda a, b: (a + b) / args.grad_accumulate,
+            prev_grads,
+            grads,
+        )
        grads = average_gradients(grads)
        optimizer.update(flux.flow, grads)