🔨 [FIX] Fixes memory leak (#83)

* Fixes memory leak
* Changed total_loss to accumulate plain Python floats (via `.item()`) instead of tensors, and adjusted how the per-batch loss is collected

---------

Co-authored-by: Martin Cerman <m.cerman@enlite.ai>
WongKinYiu · Oct 2, 2024 · dea5a8a · dea5a8a
1 parent 8228669
commit dea5a8a
Showing 1 changed file with 2 additions and 2 deletions.
diff --git a/yolo/tools/solver.py b/yolo/tools/solver.py
@@ -86,7 +86,7 @@ def train_one_batch(self, images: Tensor, targets: Tensor):
 
     def train_one_epoch(self, dataloader):
         self.model.train()
-        total_loss = defaultdict(lambda: torch.tensor(0.0, device=self.device))
+        total_loss = defaultdict(float)
         total_samples = 0
         self.optimizer.next_epoch(len(dataloader))
         for batch_size, images, targets, *_ in dataloader:
@@ -96,7 +96,7 @@ def train_one_epoch(self, dataloader):
             for loss_name, loss_val in loss_each.items():
                 if self.use_ddp:  # collecting loss for each batch
                     distributed.all_reduce(loss_val, op=distributed.ReduceOp.AVG)
-                total_loss[loss_name] += loss_val * batch_size
+                total_loss[loss_name] += loss_val.item() * batch_size
             total_samples += batch_size
             self.progress.one_batch(loss_each)