This code is compatible with the following versions, libraries, and SSD model.

Versions,
- python 3.8
- tensorflow 2.2.0

Libraries,
- `object_detection` library (TensorFlow Object Detection API)
- Protobuf library from Google
- os, cv2 (OpenCV), numpy

SSD Model,
- ssd_mobilenet_v2_fpn_keras

The data and trained model are available on Google Drive:
- TODO: add the Google Drive link

In order to train our model, we labelled the objects using labelImg
- https://github.com/tzutalin/labelImg/

# Setting up the Paths

In [13]:
# Root locations for this project. These are absolute, machine-specific paths;
# edit the three roots below when running on another machine.
WORKSPACE_PATH        = '/Users/jai/SSD_RealTime/Tensorflow/workspace/'
SCRIPTS_PATH          = '/Users/jai/SSD_RealTime/Tensorflow/scripts'
APIMODEL_PATH         = '/Users/jai/SSD_RealTime/Tensorflow/models/'

# Derived locations. WORKSPACE_PATH and MODEL_PATH already end with '/', so the
# suffixes must not start with one (otherwise every path contains '//').
# Directory paths keep their trailing '/' so later cells can append file names.
ANNOTATION_PATH       = WORKSPACE_PATH + 'annotations/'
IMAGE_PATH            = WORKSPACE_PATH + 'images/'
MODEL_PATH            = WORKSPACE_PATH + 'models/'
PRETRAINED_MODEL_PATH = WORKSPACE_PATH + 'pre-trained-models/'
CONFIG_PATH           = MODEL_PATH     + 'my_ssd_mobnet/pipeline.config'
CHECKPOINT_PATH       = MODEL_PATH     + 'my_ssd_mobnet/'

# Creating a Label Map

In [14]:
# Classes the detector is trained on; ids start at 1.
labels = [{'name':'car', 'id':1}]

# Render one pbtxt `item` entry per label, then write the whole label map in
# a single call.
label_map_text = ''.join(
    'item { \n'
    + '\tname:\'{}\'\n'.format(entry['name'])
    + '\tid:{}\n'.format(entry['id'])
    + '}\n'
    for entry in labels
)

with open(ANNOTATION_PATH + 'label_map.pbtxt', 'w') as label_map_file:
    label_map_file.write(label_map_text)

# Creating TF Records

In [15]:
!python {SCRIPTS_PATH + '/generate_tfrecord.py'} -x {IMAGE_PATH + '/train'} -l {ANNOTATION_PATH + '/label_map.pbtxt'} -o {ANNOTATION_PATH + '/train.record'}
!python {SCRIPTS_PATH + '/generate_tfrecord.py'} -x {IMAGE_PATH + '/test'} -l {ANNOTATION_PATH + '/label_map.pbtxt'} -o {ANNOTATION_PATH + '/test.record'}

Successfully created the TFRecord file: /Users/jai/SSD_RealTime/Tensorflow/workspace//annotations//train.record
Successfully created the TFRecord file: /Users/jai/SSD_RealTime/Tensorflow/workspace//annotations//test.record


# Copy Model Config to Training Folder

In [16]:
# Name of the sub-directory under MODEL_PATH that holds this model's
# pipeline.config (and is passed as the training --model_dir below).
CUSTOM_MODEL_NAME = 'my_ssd_mobnet' 

In [17]:
!mkdir {'/Users/jai/SSD_RealTime/Tensorflow/workspace/models//'+CUSTOM_MODEL_NAME}
!cp {PRETRAINED_MODEL_PATH+'/ssd_mobilenet_v2_fpnlite_320x320_coco17_tpu-8/pipeline.config'} {MODEL_PATH+'/'+CUSTOM_MODEL_NAME}

# Updating Config For Transfer Learning

In [18]:
import tensorflow as tf
from google.protobuf import text_format
from object_detection.utils import config_util
from object_detection.protos import pipeline_pb2

In [19]:
# Re-derive the config path from CUSTOM_MODEL_NAME; this overrides the
# CONFIG_PATH set in the path-setup cell, which spells the model name out.
CONFIG_PATH = MODEL_PATH+'/'+CUSTOM_MODEL_NAME+'/pipeline.config'

In [20]:
# Parse the copied pipeline.config with the Object Detection API helper
# (used here only for inspection in the next cell).
config = config_util.get_configs_from_pipeline_file(CONFIG_PATH)

In [21]:
# Display the parsed configuration as the cell output.
config

{'model': ssd {
   num_classes: 90
   image_resizer {
     fixed_shape_resizer {
       height: 320
       width: 320
     }
   }
   feature_extractor {
     type: "ssd_mobilenet_v2_fpn_keras"
     depth_multiplier: 1.0
     min_depth: 16
     conv_hyperparams {
       regularizer {
         l2_regularizer {
           weight: 3.9999998989515007e-05
         }
       }
       initializer {
         random_normal_initializer {
           mean: 0.0
           stddev: 0.009999999776482582
         }
       }
       activation: RELU_6
       batch_norm {
         decay: 0.996999979019165
         scale: true
         epsilon: 0.0010000000474974513
       }
     }
     use_depthwise: true
     override_base_feature_extractor_hyperparams: true
     fpn {
       min_level: 3
       max_level: 7
       additional_layer_depth: 128
     }
   }
   box_coder {
     faster_rcnn_box_coder {
       y_scale: 10.0
       x_scale: 10.0
       height_scale: 5.0
       width_scale: 5.0
     }
   }
   matc

In [22]:
# Read the raw pipeline.config text first, then merge it into an empty
# TrainEvalPipelineConfig message that the following cells edit in place.
with tf.io.gfile.GFile(CONFIG_PATH, "r") as config_file:
    raw_config_text = config_file.read()

pipeline_config = pipeline_pb2.TrainEvalPipelineConfig()
text_format.Merge(raw_config_text, pipeline_config)

In [23]:
# Point the copied pipeline at this dataset and at the pre-trained checkpoint.
#
# num_classes is derived from `labels` (the list the label map was written
# from) so the two cannot drift apart; it was previously hard-coded to 2 even
# though the label map defines a single class.
# NOTE(review): checkpoints already trained with the old value are not expected
# to match the new class head - retrain into a clean model directory.
pipeline_config.model.ssd.num_classes                   = len(labels)
pipeline_config.train_config.batch_size                 = 4
# Start from the pre-trained detection checkpoint (transfer learning).
pipeline_config.train_config.fine_tune_checkpoint       = PRETRAINED_MODEL_PATH+'/ssd_mobilenet_v2_fpnlite_320x320_coco17_tpu-8/checkpoint/ckpt-0'
pipeline_config.train_config.fine_tune_checkpoint_type  = "detection"
# Training input: label map + train TFRecord.
pipeline_config.train_input_reader.label_map_path       = ANNOTATION_PATH + '/label_map.pbtxt'
pipeline_config.train_input_reader.tf_record_input_reader.input_path[:]   = [ANNOTATION_PATH + '/train.record']
# Evaluation input: label map + test TFRecord.
pipeline_config.eval_input_reader[0].label_map_path     = ANNOTATION_PATH + '/label_map.pbtxt'
pipeline_config.eval_input_reader[0].tf_record_input_reader.input_path[:] = [ANNOTATION_PATH + '/test.record']

In [24]:
# Serialise the edited proto to text format, then overwrite pipeline.config
# with it so training picks up the changes.
serialized_config = text_format.MessageToString(pipeline_config)
with tf.io.gfile.GFile(CONFIG_PATH, "wb") as config_file:
    config_file.write(serialized_config)

# Train the model

In [25]:
# Show the exact training command for this model directory so it can also be
# copied into a terminal.
train_command_template = """python {}/research/object_detection/model_main_tf2.py --model_dir={}/{} --pipeline_config_path={}/{}/pipeline.config --num_train_steps=5000"""
model_dir_parts = (MODEL_PATH, CUSTOM_MODEL_NAME)
print(train_command_template.format(APIMODEL_PATH, *model_dir_parts, *model_dir_parts))

python /Users/jai/SSD_RealTime/Tensorflow/models//research/object_detection/model_main_tf2.py --model_dir=/Users/jai/SSD_RealTime/Tensorflow/workspace//models//my_ssd_mobnet --pipeline_config_path=/Users/jai/SSD_RealTime/Tensorflow/workspace//models//my_ssd_mobnet/pipeline.config --num_train_steps=5000


In [26]:
!python /Users/jai/SSD_RealTime/Tensorflow/models//research/object_detection/model_main_tf2.py --model_dir=/Users/jai/SSD_RealTime/Tensorflow/workspace//models//my_ssd_mobnet --pipeline_config_path=/Users/jai/SSD_RealTime/Tensorflow/workspace//models//my_ssd_mobnet/pipeline.config --num_train_steps=5000

2021-12-10 00:29:42.547265: I tensorflow/core/platform/cpu_feature_guard.cc:151] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 FMA
To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.
W1210 00:29:42.572417 4680873472 cross_device_ops.py:1387] There are non-GPU devices in `tf.distribute.Strategy`, not using nccl allreduce.
INFO:tensorflow:Using MirroredStrategy with devices ('/job:localhost/replica:0/task:0/device:CPU:0',)
I1210 00:29:42.594134 4680873472 mirrored_strategy.py:376] Using MirroredStrategy with devices ('/job:localhost/replica:0/task:0/device:CPU:0',)
INFO:tensorflow:Maybe overwriting train_steps: 5000
I1210 00:29:42.627459 4680873472 config_util.py:552] Maybe overwriting train_steps: 5000
INFO:tensorflow:Maybe overwriting use_bfloat16: False
I1210 00:29:42.627708 4680873472 config_util.py:552] Maybe overwriting use_b

# Load Trained Model From Checkpoint

In [27]:
import os
from object_detection.utils import label_map_util
from object_detection.builders import model_builder
from object_detection.utils import visualization_utils as viz_utils

In [28]:
# Load pipeline config and build a detection model (inference mode)
configs = config_util.get_configs_from_pipeline_file(CONFIG_PATH)
detection_model = model_builder.build(model_config = configs['model'], is_training = False)

# Restore checkpoint.
# Prefer the most recent checkpoint recorded in CHECKPOINT_PATH so this cell
# keeps working when the number of training steps (and therefore the checkpoint
# index) changes. If no checkpoint state file is found, fall back to the
# previously hard-coded 'ckpt-6'.
ckpt = tf.compat.v2.train.Checkpoint(model = detection_model)
latest_ckpt_path = tf.train.latest_checkpoint(CHECKPOINT_PATH)
if latest_ckpt_path is None:
    latest_ckpt_path = os.path.join(CHECKPOINT_PATH, 'ckpt-6')
ckpt.restore(latest_ckpt_path).expect_partial()

@tf.function
def detect_fn(image):
    """Run the restored detection model on `image` and return its detections.

    The input is passed through the model's preprocess, predict and
    postprocess stages in order; the output of postprocess is returned as-is.
    """
    preprocessed, true_shapes = detection_model.preprocess(image)
    raw_predictions = detection_model.predict(preprocessed, true_shapes)
    return detection_model.postprocess(raw_predictions, true_shapes)

2021-12-10 02:18:32.193470: I tensorflow/core/platform/cpu_feature_guard.cc:151] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 FMA
To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.


# Detect in Real-Time

In [29]:
import cv2 
import numpy as np

In [30]:
# Build the class-id -> category mapping from the label map; it is passed to
# the visualisation helper below to label the drawn boxes.
category_index = label_map_util.create_category_index_from_labelmap(ANNOTATION_PATH+'/label_map.pbtxt')

In [31]:
# Display the mapping as the cell output.
category_index

{1: {'id': 1, 'name': 'car'}}

In [32]:
# Setup capture
cap = cv2.VideoCapture(0)
# Fail here with a clear message if device 0 cannot be opened, rather than
# later when the first frame read returns nothing.
if not cap.isOpened():
    raise RuntimeError('Could not open video capture device 0.')
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))

In [33]:
# Real-time detection loop: grab a frame, run the detector, draw the boxes and
# show the result until 'q' is pressed or the capture stops delivering frames.
# The try/finally guarantees the camera and the display window are released
# even if a frame fails to process or the cell is interrupted.
label_id_offset = 1  # added to the model's class indices before the category_index lookup

try:
    while True:
        ret, frame = cap.read()
        if not ret:
            # No frame was delivered; stop instead of feeding an empty frame
            # to the model.
            print('Failed to read a frame from the capture device; stopping.')
            break

        # NOTE(review): OpenCV delivers frames in BGR channel order; confirm
        # whether the model expects RGB and a cv2.cvtColor call is needed here.
        image_np       = np.array(frame)

        # Add a leading batch dimension and run detection.
        input_tensor   = tf.convert_to_tensor(np.expand_dims(image_np, 0), dtype=tf.float32)
        detections     = detect_fn(input_tensor)

        # Drop the batch dimension and keep only the first num_detections
        # entries of every output, converted to NumPy arrays.
        num_detections = int(detections.pop('num_detections'))
        detections     = {key: value[0, :num_detections].numpy()
                          for key, value in detections.items()}
        detections['num_detections']    = num_detections

        # detection_classes should be ints.
        detections['detection_classes'] = detections['detection_classes'].astype(np.int64)

        # Draw on a copy so the raw frame stays untouched.
        image_np_with_detections = image_np.copy()

        viz_utils.visualize_boxes_and_labels_on_image_array(
                    image_np_with_detections,
                    detections['detection_boxes'],
                    detections['detection_classes']+label_id_offset,
                    detections['detection_scores'],
                    category_index,
                    use_normalized_coordinates=True,
                    max_boxes_to_draw = 5,
                    min_score_thresh = .5,
                    agnostic_mode = False)

        cv2.imshow('object detection',  cv2.resize(image_np_with_detections, (800, 600)))

        # Quit when the user presses 'q' in the display window.
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
finally:
    cap.release()
    cv2.destroyAllWindows()

In [35]:
# Marker printed once the detection loop above has exited.
print("hey its done")

hey its done
