Adicionei o arquivo para detecção com o modelo ONNX

mtsousa · mtsousa · commit 3066bf68a379 · 2023-02-24T15:28:18.000-03:00
diff --git a/.gitignore b/.gitignore
@@ -9,4 +9,5 @@ __pycache__/
 yolov7-fork-o/
 yolov7-fork-p/
 *.pt
-*.onnx
+*.onnx
+plot_mosaic.py
diff --git a/detect.py b/detect.py
@@ -0,0 +1,123 @@
+"""
+@Author: Matheus Teixeira de Sousa (mtsousa14@gmail.com)
+
+Detect forks from images with trained YOLOv7 ONNX model
+"""
+
+import cv2 as cv
+import numpy as np
+import onnxruntime as ort
+from torch.utils.data import DataLoader
+from utils.dataset import TestDataset
+from utils.utils import plot_one_box, show_predicted_image, adjust_image
+from os.path import exists, isdir
+from os import makedirs
+from random import randint
+import argparse
+
+def predict_bbox(session, images):
+	"""
+	Run the ONNX model over every batch and collect the raw predictions
+
+	Args
+		- session: ONNX Runtime inference session (get_inputs, get_outputs and run are used)
+		- images: Iterable of samples; each sample is a mapping with the keys
+		  'image', 'ratio', 'dwdh' and 'name'
+
+	Returns
+		- Dict keyed by "batch <i>" (i is the position of the sample in `images`) holding
+		  the first model output under "preds" plus the sample's "ratio", "dwdh" and "name"
+	"""
+	output_names = [node.name for node in session.get_outputs()]
+	# Ask the session for its input name instead of assuming the export called it 'images'
+	input_name = session.get_inputs()[0].name
+
+	dict_output = {}
+	for i, samples in enumerate(images):
+		# Divide by 255 (presumably maps 8-bit pixel values to [0, 1] - confirm against
+		# the training pipeline) and hand a contiguous buffer to the runtime
+		im = np.ascontiguousarray(samples['image']/255)
+		# Only the first output of the model is kept
+		preds = session.run(output_names, {input_name: im})[0]
+		dict_output[f"batch {i}"] = {
+			"preds": preds,
+			"ratio": samples['ratio'],
+			"dwdh": samples['dwdh'],
+			"name": samples['name'],
+		}
+
+	return dict_output
+
+if __name__ == '__main__':
+	# Parse command line arguments
+	parser = argparse.ArgumentParser(
+		description='Predict with YOLOv7-fork ONNX model')
+
+	parser.add_argument('--model', required=True,
+						metavar='/path/to/model.onnx',
+						help="Path to ONNX model")
+	parser.add_argument('--input', required=True,
+						help="Path to images (path/to/images) or path to image (path/to/image.jpg)")
+	# type=int: without it argparse hands a command-line value over as a str,
+	# which DataLoader does not accept as batch_size
+	parser.add_argument('--batch', default=1, type=int,
+						help="Batch size")
+	parser.add_argument('--save', default=False, action='store_true',
+						help="Save predicted image")
+	parser.add_argument('--dontshow', default=False, action='store_true',
+						help="Don't show predicted image")
+	parser.add_argument('--cuda', default=False, action='store_true',
+						help="Set execution on GPU")
+
+	args = parser.parse_args()
+	# Echo the effective configuration
+	for key, value in vars(args).items():
+		if value is not None:
+			print(f'{key.capitalize()}: {value}')
+	print()
+
+	# A directory is read through TestDataset; anything else is treated as a single image
+	input_isdir = isdir(args.input)
+
+	# Load the model
+	print('Loading model...', flush=True)
+	providers = ['CUDAExecutionProvider', 'CPUExecutionProvider'] if args.cuda else ['CPUExecutionProvider']
+	session = ort.InferenceSession(args.model, providers=providers)
+
+	# Read the expected height and width from positions 2 and 3 of the input shape
+	input_shape = session.get_inputs()[0].shape
+	h, w = input_shape[2], input_shape[3]
+
+	# Load the images
+	print('Loading images...', flush=True)
+	if input_isdir:
+		dataset = TestDataset(args.input, shape=(h, w))
+		images = DataLoader(dataset, batch_size=args.batch, shuffle=False, num_workers=0)
+	else:
+		images = [adjust_image(args.input, shape=(h, w))]
+
+	# Predict from images
+	print('Making predictions...', flush=True)
+	dict_output = predict_bbox(session, images)
+
+	names = ['fork']
+	colors = {name: [randint(0, 255) for _ in range(3)] for name in names}
+	# colors = {name: [104, 184, 82] for name in names} # green
+
+	output_dir = 'data/responses'
+	if args.save:
+		# exist_ok avoids the check-then-create race of exists() followed by makedirs()
+		makedirs(output_dir, exist_ok=True)
+
+	# For each image, plot the results
+	print('Plotting results...', flush=True)
+	# NOTE(review): only element [0] of ratio/name is read per batch and the source image
+	# is looked up by batch index, so this loop appears to assume --batch 1 - confirm
+	# before running with larger batches
+	for i, output in enumerate(dict_output.values()):
+		pred = output['preds']
+		name = output['name'][0]
+		ratio = float(output['ratio'][0])
+		dwdh = float(output['dwdh'][0]), float(output['dwdh'][1])
+
+		# Load original image
+		if input_isdir:
+			image = dataset.__getsrc__(i)
+		else:
+			image = cv.imread(args.input)
+
+		# Adjust bounding box to original image
+		for prediction in pred:
+			_batch_id, x0, y0, x1, y1, cls_id, score = prediction
+			box = np.array([x0,y0,x1,y1])
+			# dwdh*2 repeats the pair so it lines up with (x0, y0, x1, y1); presumably this
+			# removes the letterbox padding before the resize ratio is undone
+			box -= np.array(dwdh*2)
+			box /= ratio
+			box = box.round().astype(np.int32).tolist()
+			cls_id = int(cls_id)
+			score = round(float(score),3)
+			label = names[cls_id]
+			color = colors[label]
+			label += ' ' + str(score)
+			plot_one_box(box, image, label=label, color=color, line_thickness=1)
+
+		if args.save:
+			cv.imwrite(f'{output_dir}/{name}', image)
+
+		if not args.dontshow:
+			show_predicted_image(image)
+		
diff --git a/utils/dataset.py b/utils/dataset.py
@@ -8,6 +8,9 @@
 import json
 import cv2 as cv
 from torch import as_tensor, float64
+from .utils import letterbox
+import numpy as np
+import os
 
 class CocoForkDataset(Dataset):
     def __init__(self, img_dir, ann_dir, transforms=None, mode='train', device='cpu'):
@@ -99,25 +102,46 @@ def read_ids(self, ann_dir, mode):
         img_ids = list(dict.fromkeys(img_ids))
         return img_ids
 
-# def show_image(img, bbox):
-#     """
-#     Draw the bbox and show the image
-#     """
-#     import numpy as np
-#     img = np.float32(img)
-#     img = cv.cvtColor(img, cv.COLOR_RGB2BGR)
-#     for box in bbox:
-#         x0, y0, x1, y1 = int(box[0]), int(box[1]), int(box[2]), int(box[3]) 
-#         cv.rectangle(img, (x0, y0), (x1, y1), (255,0,0), 2)
-#     # cv.imwrite('img_name.jpg', img*255)
-#     cv.imshow(f'IMG', img)
-#     cv.waitKey(0)
-#     cv.destroyAllWindows()
-
-# from utils import get_transforms
-
-# dataset = CocoForkDataset('../data/train', '../data/annotations', get_transforms(train=True, size=(640, 640)), 'train')
-# for k in range(20, 30):
-#     img, ann = dataset.__getitem__(k)
-#     # print(img.shape, ann)
-#     show_image(img.numpy().transpose(1, 2, 0), ann['boxes'])
+class TestDataset(Dataset):
+	"""
+	Dataset over the files of one directory, prepared for inference
+	"""
+	def __init__(self, path, shape):
+		"""
+		Initialize the dataset
+
+		Args
+			- path: Path to images
+			- shape: Input shape
+		"""
+		self.path = path
+		# os.listdir returns entries in arbitrary order; sort so that the
+		# index -> image mapping is stable across runs and platforms
+		self.imgs_list = sorted(os.listdir(path))
+		self.shape = shape
+
+	def _image_path(self, idx):
+		"""
+		Build the path of the file stored at position idx
+		"""
+		return os.path.join(self.path, self.imgs_list[idx])
+
+	def __len__(self):
+		"""
+		Return the length of the dataset
+		"""
+		return len(self.imgs_list)
+
+	def __getitem__(self, idx):
+		"""
+		Get an item from dataset by index with transformations
+
+		Returns
+			- Dict with the float32 "image" (axes reordered with (2, 0, 1)), the
+			  "ratio" and "dwdh" values returned by letterbox, and the file "name"
+
+		Raises
+			- ValueError: If OpenCV cannot read the file as an image
+		"""
+		img_path = self._image_path(idx)
+		img = cv.imread(img_path)
+		if img is None:
+			# cv.imread signals failure by returning None instead of raising
+			raise ValueError(f"Could not read image: {img_path}")
+		image = cv.cvtColor(img, cv.COLOR_BGR2RGB)
+
+		# Adjust image shape
+		image, ratio, dwdh = letterbox(image, new_shape=self.shape, auto=False)
+
+		# Move the last axis first, then make the buffer contiguous before the float32 cast
+		image = image.transpose((2, 0, 1))
+		image = np.ascontiguousarray(image)
+		im = image.astype(np.float32)
+
+		return {"image": im, "ratio": ratio,"dwdh": dwdh, "name": self.imgs_list[idx]}
+
+	def __getsrc__(self, idx):
+		"""
+		Get an item from dataset by index without transformations
+		"""
+		return cv.imread(self._image_path(idx))
diff --git a/utils/images_exploration/show_images.py b/utils/images_exploration/show_images.py
@@ -9,6 +9,16 @@
 import argparse
 from random import shuffle
 
+import sys
+from pathlib import Path
+
+# Put the repository root on sys.path so that `utils.utils` can be imported
+# when this script is run directly from utils/images_exploration/
+file = Path(__file__).resolve()
+# parents[2] is the third ancestor of this file:
+# images_exploration/ -> utils/ -> repository root
+package_root_directory = file.parents[2]
+print(package_root_directory)
+sys.path.append(str(package_root_directory))
+
+from utils.utils import plot_one_box, show_predicted_image
+
 def read_json(input_name):
     """
     Read json annotations file
@@ -48,19 +58,6 @@ def find_image(coco, img_ids):
                     images[image_id]['bbox'].append(bbox)
     return images
 
-def show_image(id, dataset, file_name, bbox):
-    """
-    Draw the bbox and show the image
-    """
-    img = cv.imread(f'../../data/{dataset}/{file_name}')
-    # "bbox": [x,y,width,height]
-    for box in bbox:
-        x, y, w, h = int(box[0]), int(box[1]), int(box[2]), int(box[3])
-        cv.rectangle(img, (x, y), (x+w, y+h), (255,0,0), 2)
-    cv.imshow(f'IMG {id}', img)
-    cv.waitKey(0)
-    cv.destroyAllWindows()
-
 if __name__ == '__main__':
     # Parse command line arguments
     parser = argparse.ArgumentParser(description='Explore COCO dataset.')
@@ -86,4 +83,12 @@ def show_image(id, dataset, file_name, bbox):
     # For each image, show the bbox
     print('Loading images...')
     for k in images.keys():
-        show_image(k, dataset, images[k]['name'], images[k]['bbox'])
+        image = images[k]['name']
+        img = cv.imread(f'../../data/{dataset}/{image}')
+
+        for j in images[k]['bbox']:
+            x, y, w, h = int(j[0]), int(j[1]), int(j[2]), int(j[3])
+            box = [x, y, x+w, y+h]
+            plot_one_box(box, img, label='fork', color=[104, 184, 82], line_thickness=1)
+        
+        show_predicted_image(img)
diff --git a/utils/utils.py b/utils/utils.py