ckpt to pth file
- app.py +9 -14
- config.py +176 -0
- utils.py +2 -59
- epoch=36-step=19166.ckpt → yolov3.pth +2 -2
app.py
CHANGED
@@ -1,6 +1,5 @@
 import gradio as gr
 import torch
-from PIL import Image
 import cv2
 import albumentations as A
 from albumentations.pytorch import ToTensorV2
@@ -8,6 +7,7 @@ import matplotlib.pyplot as plt
 import matplotlib
 matplotlib.use('agg')
 
+import config
 from model import YOLOv3
 from utils import (
     cells_to_bboxes,
@@ -15,23 +15,18 @@ from utils import (
     plot_image
 )
 
-
-ANCHORS = [
-    [(0.28, 0.22), (0.38, 0.48), (0.9, 0.78)],
-    [(0.07, 0.15), (0.15, 0.11), (0.14, 0.29)],
-    [(0.02, 0.03), (0.04, 0.07), (0.08, 0.06)],
-]  # Note these have been rescaled to be between [0, 1]
-
-fname = 'epoch=36-step=19166.ckpt'
-checkpoint = torch.load(fname, map_location=torch.device('cpu'))
-model_state_dict = checkpoint['state_dict']
+# fname = 'epoch=36-step=19166.ckpt'
+fname = 'yolov3.pth'
+# checkpoint = torch.load(fname, map_location=torch.device('cpu'))
+# model_state_dict = checkpoint['state_dict']
+# torch.save(model.state_dict(), 'yolov3.pth')
 model = YOLOv3(num_classes=20)
-model.load_state_dict(model_state_dict)
+model.load_state_dict(torch.load(fname))
 
 IMAGE_SIZE = 416
 S = [IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8]
-anchors = ( torch.tensor(ANCHORS)
-            * torch.tensor(S).unsqueeze(1)\
+anchors = ( torch.tensor(config.ANCHORS)
+            * torch.tensor(config.S).unsqueeze(1)\
             .unsqueeze(1).repeat(1, 3, 2)
           )
 
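For context, the commented-out lines above record the one-off conversion this commit performs: the Lightning checkpoint is opened once, its 'state_dict' is loaded into YOLOv3, and the plain weights are re-saved as yolov3.pth, which app.py now loads directly. A minimal sketch of that conversion step, assuming the checkpoint keys already match the model's parameter names (if Lightning had prefixed them, they would need to be stripped first):

import torch
from model import YOLOv3

# One-off conversion: Lightning .ckpt -> plain PyTorch .pth (weights only).
ckpt = torch.load('epoch=36-step=19166.ckpt', map_location=torch.device('cpu'))
state_dict = ckpt['state_dict']              # Lightning stores the model weights under 'state_dict'

model = YOLOv3(num_classes=20)
model.load_state_dict(state_dict)            # assumes key names line up with YOLOv3's modules
torch.save(model.state_dict(), 'yolov3.pth') # the file the Space now ships and loads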
config.py
ADDED
@@ -0,0 +1,176 @@
+import albumentations as A
+import cv2
+
+from albumentations.pytorch import ToTensorV2
+
+DATASET = 'PASCAL_VOC'
+DEVICE = "cpu"
+NUM_WORKERS = 0
+BATCH_SIZE = 16
+IMAGE_SIZE = 416
+NUM_CLASSES = 20
+CONF_THRESHOLD = 0.05
+MAP_IOU_THRESH = 0.5
+NMS_IOU_THRESH = 0.45
+S = [IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8]
+PIN_MEMORY = True
+LOAD_MODEL = False
+SAVE_MODEL = True
+
+ANCHORS = [
+    [(0.28, 0.22), (0.38, 0.48), (0.9, 0.78)],
+    [(0.07, 0.15), (0.15, 0.11), (0.14, 0.29)],
+    [(0.02, 0.03), (0.04, 0.07), (0.08, 0.06)],
+]  # Note these have been rescaled to be between [0, 1]
+
+means = [0.485, 0.456, 0.406]
+
+scale = 1.1
+train_transforms = A.Compose(
+    [
+        A.LongestMaxSize(max_size=int(IMAGE_SIZE * scale)),
+        A.PadIfNeeded(
+            min_height=int(IMAGE_SIZE * scale),
+            min_width=int(IMAGE_SIZE * scale),
+            border_mode=cv2.BORDER_CONSTANT,
+        ),
+        A.Rotate(limit=10, interpolation=1, border_mode=4),
+        A.RandomCrop(width=IMAGE_SIZE, height=IMAGE_SIZE),
+        A.ColorJitter(brightness=0.6, contrast=0.6, saturation=0.6, hue=0.6, p=0.4),
+        A.OneOf(
+            [
+                A.ShiftScaleRotate(
+                    rotate_limit=20, p=0.5, border_mode=cv2.BORDER_CONSTANT
+                ),
+                # A.Affine(shear=15, p=0.5, mode="constant"),
+            ],
+            p=1.0,
+        ),
+        A.HorizontalFlip(p=0.5),
+        A.Blur(p=0.1),
+        A.CLAHE(p=0.1),
+        A.Posterize(p=0.1),
+        A.ToGray(p=0.1),
+        A.ChannelShuffle(p=0.05),
+        A.Normalize(mean=[0, 0, 0], std=[1, 1, 1], max_pixel_value=255,),
+        ToTensorV2(),
+    ],
+    bbox_params=A.BboxParams(format="yolo", min_visibility=0.4, label_fields=[],),
+)
+test_transforms = A.Compose(
+    [
+        A.LongestMaxSize(max_size=IMAGE_SIZE),
+        A.PadIfNeeded(
+            min_height=IMAGE_SIZE, min_width=IMAGE_SIZE, border_mode=cv2.BORDER_CONSTANT
+        ),
+        A.Normalize(mean=[0, 0, 0], std=[1, 1, 1], max_pixel_value=255,),
+        ToTensorV2(),
+    ],
+    bbox_params=A.BboxParams(format="yolo", min_visibility=0.4, label_fields=[]),
+)
+
+PASCAL_CLASSES = [
+    "aeroplane",
+    "bicycle",
+    "bird",
+    "boat",
+    "bottle",
+    "bus",
+    "car",
+    "cat",
+    "chair",
+    "cow",
+    "diningtable",
+    "dog",
+    "horse",
+    "motorbike",
+    "person",
+    "pottedplant",
+    "sheep",
+    "sofa",
+    "train",
+    "tvmonitor"
+]
+
+COCO_LABELS = ['person',
+    'bicycle',
+    'car',
+    'motorcycle',
+    'airplane',
+    'bus',
+    'train',
+    'truck',
+    'boat',
+    'traffic light',
+    'fire hydrant',
+    'stop sign',
+    'parking meter',
+    'bench',
+    'bird',
+    'cat',
+    'dog',
+    'horse',
+    'sheep',
+    'cow',
+    'elephant',
+    'bear',
+    'zebra',
+    'giraffe',
+    'backpack',
+    'umbrella',
+    'handbag',
+    'tie',
+    'suitcase',
+    'frisbee',
+    'skis',
+    'snowboard',
+    'sports ball',
+    'kite',
+    'baseball bat',
+    'baseball glove',
+    'skateboard',
+    'surfboard',
+    'tennis racket',
+    'bottle',
+    'wine glass',
+    'cup',
+    'fork',
+    'knife',
+    'spoon',
+    'bowl',
+    'banana',
+    'apple',
+    'sandwich',
+    'orange',
+    'broccoli',
+    'carrot',
+    'hot dog',
+    'pizza',
+    'donut',
+    'cake',
+    'chair',
+    'couch',
+    'potted plant',
+    'bed',
+    'dining table',
+    'toilet',
+    'tv',
+    'laptop',
+    'mouse',
+    'remote',
+    'keyboard',
+    'cell phone',
+    'microwave',
+    'oven',
+    'toaster',
+    'sink',
+    'refrigerator',
+    'book',
+    'clock',
+    'vase',
+    'scissors',
+    'teddy bear',
+    'hair drier',
+    'toothbrush'
+]
+
utils.py
CHANGED
@@ -7,7 +7,6 @@ import random
 import torch
 
 from collections import Counter
-from torch.utils.data import DataLoader
 from tqdm import tqdm
 
 
@@ -235,7 +234,8 @@ def mean_average_precision(
 def plot_image(image, boxes, return_fig=False):
     """Plots predicted bounding boxes on the image"""
     cmap = plt.get_cmap("tab20b")
-    class_labels = config.COCO_LABELS if config.DATASET=='COCO'
+    class_labels = config.COCO_LABELS if config.DATASET=='COCO' \
+                        else config.PASCAL_CLASSES
     colors = [cmap(i) for i in np.linspace(0, 1, len(class_labels))]
     im = np.array(image)
     height, width, _ = im.shape
@@ -446,63 +446,6 @@ def load_checkpoint(checkpoint_file, model, optimizer, lr, device):
     for param_group in optimizer.param_groups:
         param_group["lr"] = lr
 
-
-def get_loaders(train_csv_path, test_csv_path):
-    from dataset import YOLODataset
-
-    IMAGE_SIZE = config.IMAGE_SIZE
-    train_dataset = YOLODataset(
-        train_csv_path,
-        transform=config.train_transforms,
-        S=[IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8],
-        img_dir=config.IMG_DIR,
-        label_dir=config.LABEL_DIR,
-        anchors=config.ANCHORS,
-    )
-    test_dataset = YOLODataset(
-        test_csv_path,
-        transform=config.test_transforms,
-        S=[IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8],
-        img_dir=config.IMG_DIR,
-        label_dir=config.LABEL_DIR,
-        anchors=config.ANCHORS,
-    )
-    train_loader = DataLoader(
-        dataset=train_dataset,
-        batch_size=config.BATCH_SIZE,
-        num_workers=config.NUM_WORKERS,
-        pin_memory=config.PIN_MEMORY,
-        shuffle=True,
-        drop_last=False,
-    )
-    test_loader = DataLoader(
-        dataset=test_dataset,
-        batch_size=config.BATCH_SIZE,
-        num_workers=config.NUM_WORKERS,
-        pin_memory=config.PIN_MEMORY,
-        shuffle=False,
-        drop_last=False,
-    )
-
-    train_eval_dataset = YOLODataset(
-        train_csv_path,
-        transform=config.test_transforms,
-        S=[IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8],
-        img_dir=config.IMG_DIR,
-        label_dir=config.LABEL_DIR,
-        anchors=config.ANCHORS,
-    )
-    train_eval_loader = DataLoader(
-        dataset=train_eval_dataset,
-        batch_size=config.BATCH_SIZE,
-        num_workers=config.NUM_WORKERS,
-        pin_memory=config.PIN_MEMORY,
-        shuffle=False,
-        drop_last=False,
-    )
-
-    return train_loader, test_loader, train_eval_loader
-
 def plot_couple_examples(model, batch, thresh, iou_thresh, anchors):
     model.eval()
     x, _ = batch
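The two lines added to plot_image simply pick the label set from the new config module; the same selection shown in isolation:

import config

# COCO names only when DATASET == 'COCO'; this Space defaults to the 20 PASCAL VOC classes.
class_labels = config.COCO_LABELS if config.DATASET == 'COCO' else config.PASCAL_CLASSES
print(len(class_labels))  # 20 for 'PASCAL_VOC', 80 for 'COCO'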
epoch=36-step=19166.ckpt → yolov3.pth
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:af069adc24fec136b92b068e6e6c1361dd4b9dba7797dac7798489e8181d021c
+size 246865311
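The renamed entry is a Git LFS pointer, so the weights themselves are addressed by the sha256 and size above. A small sketch for verifying a locally downloaded yolov3.pth against that pointer:

import hashlib
import os

# Values taken from the LFS pointer above.
expected_oid = 'af069adc24fec136b92b068e6e6c1361dd4b9dba7797dac7798489e8181d021c'
expected_size = 246865311

h = hashlib.sha256()
with open('yolov3.pth', 'rb') as f:
    for chunk in iter(lambda: f.read(1 << 20), b''):
        h.update(chunk)

print(os.path.getsize('yolov3.pth') == expected_size and h.hexdigest() == expected_oid)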