update loss components

2018-09-23 22:25:23 +02:00 · 2018-09-23 22:25:23 +02:00 · cf9b4cfa52
parent bd3f617129
commit cf9b4cfa52
3 changed files with 33 additions and 31 deletions
--- a/models.py
+++ b/models.py
@@ -137,10 +137,9 @@ class YOLOLayer(nn.Module):

        # Training
        if targets is not None:
-            BCEWithLogitsLoss1 = nn.BCEWithLogitsLoss(size_average=False)
-            BCEWithLogitsLoss2 = nn.BCEWithLogitsLoss(size_average=True)
-            MSELoss = nn.MSELoss(size_average=False)  # version 0.4.0
-            CrossEntropyLoss = nn.CrossEntropyLoss()
+            MSELoss = nn.MSELoss()
+            BCEWithLogitsLoss = nn.BCEWithLogitsLoss()
+            # CrossEntropyLoss = nn.CrossEntropyLoss()

            if requestPrecision:
                gx = self.grid_x[:, :, :nG, :nG]
@@ -157,33 +156,36 @@ class YOLOLayer(nn.Module):
            if x.is_cuda:
                tx, ty, tw, th, mask, tcls = tx.cuda(), ty.cuda(), tw.cuda(), th.cuda(), mask.cuda(), tcls.cuda()

-                # Mask outputs to ignore non-existing objects (but keep confidence predictions)
-                nT = sum([len(x) for x in targets])  # number of targets
-                nM = mask.sum().float()  # number of anchors (assigned to targets)
-                nB = len(targets)  # batch size
-                if nM > 0:
-                    lx = (5 / nB) * MSELoss(x[mask], tx[mask])
-                    ly = (5 / nB) * MSELoss(y[mask], ty[mask])
-                    lw = (5 / nB) * MSELoss(w[mask], tw[mask])
-                    lh = (5 / nB) * MSELoss(h[mask], th[mask])
-                    lconf = (1 / nB) * BCEWithLogitsLoss1(pred_conf[mask], mask[mask].float())
+            # Mask outputs to ignore non-existing objects (but keep confidence predictions)
+            nT = sum([len(x) for x in targets])  # number of targets
+            nM = mask.sum().float()  # number of anchors (assigned to targets)
+            nB = len(targets)  # batch size
+            k = nM / nB
+            if nM > 0:
+                lx = k * MSELoss(x[mask], tx[mask])
+                ly = k * MSELoss(y[mask], ty[mask])
+                lw = k * MSELoss(w[mask], tw[mask])
+                lh = k * MSELoss(h[mask], th[mask])
+                lconf = k * BCEWithLogitsLoss(pred_conf[mask], mask[mask].float())

-                    lcls = (1 * nM / nB) * CrossEntropyLoss(pred_cls[mask], torch.argmax(tcls, 1))
-                    # lcls = (1 * nM / nB) * BCEWithLogitsLoss2(pred_cls[mask], tcls.float())
-                else:
-                    lx, ly, lw, lh, lcls, lconf = FT([0]), FT([0]), FT([0]), FT([0]), FT([0]), FT([0])
+                # lcls = k * CrossEntropyLoss(pred_cls[mask], torch.argmax(tcls, 1))
+                lcls = k * BCEWithLogitsLoss(pred_cls[mask], tcls.float())
+            else:
+                lx, ly, lw, lh, lcls, lconf = FT([0]), FT([0]), FT([0]), FT([0]), FT([0]), FT([0])

-                lconf += (0.5 * nM / nB) * BCEWithLogitsLoss2(pred_conf[~mask], mask[~mask].float())
+            # Add confidence loss for background anchors (noobj)
+            lconf += k * BCEWithLogitsLoss(pred_conf[~mask], mask[~mask].float())

-                loss = lx + ly + lw + lh + lconf + lcls
+            # Sum loss components
+            loss = lx + ly + lw + lh + lconf + lcls

-            # Sum False Positives from unnasigned anchors
-            i = torch.sigmoid(pred_conf[~mask]) > 0.99
-            FPe = torch.zeros(self.nC)
+            # Sum False Positives from unassigned anchors
+            i = torch.sigmoid(pred_conf[~mask]) > 0.9
            if i.sum() > 0:
                FP_classes = torch.argmax(pred_cls[~mask][i], 1)
-                for c in FP_classes:
-                    FPe[c] += 1
+                FPe = torch.bincount(FP_classes, minlength=self.nC).float().cpu()  # extra FPs
+            else:
+                FPe = torch.zeros(self.nC)

            return loss, loss.item(), lx.item(), ly.item(), lw.item(), lh.item(), lconf.item(), lcls.item(), \
                   nT, TP, FP, FPe, FN, TC
--- a/utils/gcp.sh
+++ b/utils/gcp.sh
@@ -11,7 +11,7 @@ gsutil cp gs://ultralytics/fresh9_5_e201.pt yolov3/checkpoints
 python3 detect.py

 # Test
-python3 test.py -img_size 416 -weights_path checkpoints/yolov3.weights
+python3 test.py -img_size 416 -weights_path checkpoints/latest.pt -conf_thresh 0.5


 # Download and Test
--- a/utils/utils.py
+++ b/utils/utils.py
@@ -282,9 +282,9 @@ def build_targets(pred_boxes, pred_conf, pred_cls, target, anchor_wh, nA, nC, nG
            pconf = torch.sigmoid(pred_conf[b, a, gj, gi]).cpu()
            iou_pred = bbox_iou(tb, pred_boxes[b, a, gj, gi].cpu())

-            TP[b, i] = (pconf > 0.99) & (iou_pred > 0.5) & (pcls == tc)
-            FP[b, i] = (pconf > 0.99) & (TP[b, i] == 0)  # coordinates or class are wrong
-            FN[b, i] = pconf <= 0.99  # confidence score is too low (set to zero)
+            TP[b, i] = (pconf > 0.9) & (iou_pred > 0.5) & (pcls == tc)
+            FP[b, i] = (pconf > 0.9) & (TP[b, i] == 0)  # coordinates or class are wrong
+            FN[b, i] = pconf <= 0.9  # confidence score is too low (set to zero)

    return tx, ty, tw, th, tconf, tcls, TP, FP, FN, TC

@@ -429,8 +429,8 @@ def plotResults():
    import matplotlib.pyplot as plt
    plt.figure(figsize=(16, 8))
    s = ['X', 'Y', 'Width', 'Height', 'Objectness', 'Classification', 'Total Loss', 'Precision', 'Recall']
-    for f in ('/Users/glennjocher/Downloads/results_CE.txt',
-              '/Users/glennjocher/Downloads/results_BCE.txt'):
+    for f in ('results.txt',
+              ):
        results = np.loadtxt(f, usecols=[2, 3, 4, 5, 6, 7, 8, 9, 10]).T
        for i in range(9):
            plt.subplot(2, 5, i + 1)