From cf2caaad4119ee2304a28cb583a0bc17bd2ffd79 Mon Sep 17 00:00:00 2001
From: Glenn Jocher <glenn.jocher@ultralytics.com>
Date: Mon, 22 Apr 2019 14:31:23 +0200
Subject: [PATCH] updates

---
 detect.py         |  2 +-
 models.py         | 14 +++++++-------
 utils/datasets.py |  2 +-
 utils/utils.py    |  6 ++++--
 4 files changed, 13 insertions(+), 11 deletions(-)

diff --git a/detect.py b/detect.py
index 918c87c4..7d696221 100644
--- a/detect.py
+++ b/detect.py
@@ -67,7 +67,7 @@ def detect(
 
         if detections is not None and len(detections) > 0:
             # Rescale boxes from 416 to true image size
-            scale_coords(img_size, detections[:, :4], im0.shape).round()
+            detections[:, :4] = scale_coords(img_size, detections[:, :4], im0.shape).round()
 
             # Print results to screen
             for c in detections[:, -1].unique():
diff --git a/models.py b/models.py
index 87ff3e71..07aa8d47 100755
--- a/models.py
+++ b/models.py
@@ -121,12 +121,12 @@ class YOLOLayer(nn.Module):
         if ONNX_EXPORT:
             bs = 1  # batch size
         else:
-            bs, nx, ny = p.shape[0], p.shape[-2], p.shape[-1]
-            if (self.nx, self.ny) != (nx, ny):
-                create_grids(self, img_size, (nx, ny), p.device)
+            bs, ny, nx = p.shape[0], p.shape[-2], p.shape[-1]
+            if (self.ny, self.nx) != (ny, nx):
+                create_grids(self, img_size, (ny, nx), p.device)
 
         # p.view(bs, 255, 13, 13) -- > (bs, 3, 13, 13, 85)  # (bs, anchors, grid, grid, classes + xywh)
-        p = p.view(bs, self.na, self.nc + 5, self.nx, self.ny).permute(0, 1, 3, 4, 2).contiguous()  # prediction
+        p = p.view(bs, self.na, self.nc + 5, self.ny, self.nx).permute(0, 1, 3, 4, 2).contiguous()  # prediction
 
         if self.training:
             return p
@@ -235,13 +235,13 @@ def get_yolo_layers(model):
 
 
 def create_grids(self, img_size, ng, device='cpu'):
-    nx, ny = ng  # x and y grid size
+    ny, nx = ng  # x and y grid size
     self.img_size = img_size
     self.stride = img_size / max(ng)
 
     # build xy offsets
-    yv, xv = torch.meshgrid([torch.arange(nx), torch.arange(ny)])
-    self.grid_xy = torch.stack((xv, yv), 2).to(device).float().view((1, 1, nx, ny, 2))
+    yv, xv = torch.meshgrid([torch.arange(ny), torch.arange(nx)])
+    self.grid_xy = torch.stack((xv, yv), 2).to(device).float().view((1, 1, ny, nx, 2))
 
     # build wh gains
     self.anchor_vec = self.anchors.to(device) / self.stride
diff --git a/utils/datasets.py b/utils/datasets.py
index 2ebed801..e1f71667 100755
--- a/utils/datasets.py
+++ b/utils/datasets.py
@@ -74,7 +74,7 @@ class LoadImages:  # for inference
             print('image %g/%g %s: ' % (self.count, self.nF, path), end='')
 
         # Padded resize
-        img, _, _, _ = letterbox_rect(img0, height=self.height)
+        img, _, _, _ = letterbox(img0, height=self.height)
         print('%gx%g ' % img.shape[:2], end='')  # print image size
 
         # Normalize RGB
diff --git a/utils/utils.py b/utils/utils.py
index e25f1983..4ce682a2 100755
--- a/utils/utils.py
+++ b/utils/utils.py
@@ -103,8 +103,10 @@ def xywh2xyxy(x):
 def scale_coords(img1_shape, coords, img0_shape):
     # Rescale coords1 (xyxy) from img1_shape to img0_shape
     gain = img1_shape / max(img0_shape[:2])  # gain  = old / new
-    pad_x = np.mod(img1_shape - img0_shape[1] * gain, 32) / 2  # width padding
-    pad_y = np.mod(img1_shape - img0_shape[0] * gain, 32) / 2  # height padding
+    # pad_x = np.mod(img1_shape - img0_shape[1] * gain, 32) / 2  # width padding
+    # pad_y = np.mod(img1_shape - img0_shape[0] * gain, 32) / 2  # height padding
+    pad_x = (img1_shape - img0_shape[1] * gain) / 2  # width padding
+    pad_y = (img1_shape - img0_shape[0] * gain) / 2  # height padding
     coords[:, [0, 2]] -= pad_x
     coords[:, [1, 3]] -= pad_y
     coords[:, :4] /= gain