Skip to content

Commit 71920dd

Browse files
author
Felipe Mello
committed
delete logits before bwd
1 parent 1157b94 commit 71920dd

File tree

4 files changed

+9
-0
lines changed

4 files changed

+9
-0
lines changed

recipes/full_finetune_distributed.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -523,6 +523,8 @@ def train(self) -> None:
523523
logits = logits.transpose(1, 2)
524524
# Compute loss
525525
loss = self._loss_fn(logits, labels)
526+
# free logits here; otherwise they raise peak memory during backward
527+
del logits
526528

527529
loss = loss / self._gradient_accumulation_steps
528530
running_loss += loss

recipes/full_finetune_single_device.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -452,6 +452,8 @@ def train(self) -> None:
452452
logits = logits.transpose(1, 2)
453453
# Compute loss
454454
loss = self._loss_fn(logits, labels)
455+
# free logits here; otherwise they raise peak memory during backward
456+
del logits
455457

456458
loss = loss / self._gradient_accumulation_steps
457459
running_loss += loss

recipes/lora_finetune_single_device.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -573,6 +573,9 @@ def train(self) -> None:
573573
logits = logits.transpose(1, 2)
574574
# Compute loss
575575
loss = self._loss_fn(logits, labels)
576+
# free logits here; otherwise they raise peak memory during backward
577+
del logits
578+
576579
loss = loss / self._gradient_accumulation_steps
577580
running_loss += loss
578581
loss.backward()

recipes/qat_distributed.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -572,6 +572,8 @@ def train(self) -> None:
572572
logits = logits.transpose(1, 2)
573573
# Compute loss
574574
loss = self._loss_fn(logits, labels)
575+
# free logits here; otherwise they raise peak memory during backward
576+
del logits
575577

576578
loss = loss / self._gradient_accumulation_steps
577579
running_loss += loss

0 commit comments

Comments
 (0)