# Setting Up Paths

In [None]:
# Importing the os module for operating system-related functionality
import os

In [None]:
# Relative locations of the files this notebook refers to, keyed by a short
# symbolic name. Each path is assembled from its components with os.path.join.
files = {
    key: os.path.join(*components)
    for key, components in (
        # Pipeline configuration file
        ('PIPELINE_CONFIG', ('Model', 'pipeline.config')),
        # Script for generating TFRecord
        ('TF_RECORD_SCRIPT', ('Tensorflow', 'scripts', 'generate_tfrecord.py')),
        # Label map file name
        ('LABELMAP', ('Tensorflow', 'workspace', 'annotations', 'label_map.pbtxt')),
    )
}

# Importing Modules

In [None]:
import tensorflow as tf
from object_detection.utils import label_map_util
from object_detection.utils import visualization_utils as viz_utils
from object_detection.builders import model_builder
from object_detection.utils import config_util

import cv2 
import numpy as np
from matplotlib import pyplot as plt
%matplotlib inline

In [None]:
# Build the category index from the label map file listed under files['LABELMAP'];
# the visualisation step later uses it to look up the label for each class id.
category_index = label_map_util.create_category_index_from_labelmap(
    label_map_path=files['LABELMAP']
)


# Loading the Saved Model

In [None]:
# Parse the pipeline configuration file and build the detection model from its
# 'model' section with is_training=False.
configs = config_util.get_configs_from_pipeline_file(files['PIPELINE_CONFIG'])
detection_model = model_builder.build(
    is_training=False,
    model_config=configs['model'],
)

# Wrap the model in a checkpoint object and restore the saved weights from
# Model/checkpoint/ckpt-0. expect_partial() is called on the returned status
# object -- presumably to silence warnings about checkpoint values that are
# not used by this model (TODO confirm against the TensorFlow docs).
ckpt = tf.compat.v2.train.Checkpoint(model=detection_model)
ckpt.restore(
    os.path.join('Model', 'checkpoint', 'ckpt-0')
).expect_partial()

@tf.function
def detect_fn(image):
    """Run the module-level ``detection_model`` on ``image``.

    The input goes through the model's three stages in order:
    ``preprocess`` -> ``predict`` -> ``postprocess``.

    Args:
        image: Input handed straight to ``detection_model.preprocess``. The
            caller in this notebook passes a float32 tensor made from a
            single frame with one extra leading axis.

    Returns:
        The value returned by ``detection_model.postprocess``. The caller in
        this notebook treats it as a dict and reads the keys
        ``num_detections``, ``detection_boxes``, ``detection_classes`` and
        ``detection_scores``.
    """
    # preprocess() returns the prepared input and a second value that both
    # later stages also need.
    preprocessed, true_shapes = detection_model.preprocess(image)

    # Raw model outputs, before they are turned into final detections.
    raw_predictions = detection_model.predict(preprocessed, true_shapes)

    return detection_model.postprocess(raw_predictions, true_shapes)

# Detecting Objects

In [None]:
# Open a connection to the webcam (assuming webcam index 0)
cap = cv2.VideoCapture(0)

try:
    # Frame dimensions reported by the capture device. They are not used in
    # this cell; kept as module-level names in case other cells read them.
    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))

    # Continuously process frames from the webcam. If the device could not be
    # opened, isOpened() is False and the loop body never runs.
    while cap.isOpened():
        # Read a frame from the webcam
        ret, frame = cap.read()
        if not ret:
            # The grab failed (e.g. camera unplugged or stream ended), so there
            # is no frame to process. Stop here rather than passing an empty
            # frame on to the tensor conversion below.
            break
        image_np = np.array(frame)

        # Add a leading axis of size 1 and convert the frame to a float32 tensor
        input_tensor = tf.convert_to_tensor(np.expand_dims(image_np, 0), dtype=tf.float32)

        # Perform object detection on the frame
        detections = detect_fn(input_tensor)

        # Take the first (only) entry along the leading axis of every output,
        # keep the first num_detections rows, and convert to NumPy arrays.
        num_detections = int(detections.pop('num_detections'))
        detections = {key: value[0, :num_detections].numpy() for key, value in detections.items()}
        detections['num_detections'] = num_detections

        # Ensure detection classes are integers
        detections['detection_classes'] = detections['detection_classes'].astype(np.int64)

        # Draw on a copy so the original frame stays untouched
        image_np_with_detections = image_np.copy()

        # Visualize the detected boxes, labels, and scores on the frame
        viz_utils.visualize_boxes_and_labels_on_image_array(
            image_np_with_detections,
            detections['detection_boxes'],
            # Shift class ids by one before the category_index lookup --
            # presumably the model emits 0-based ids while label-map ids start
            # at 1 (TODO confirm against label_map.pbtxt).
            detections['detection_classes'] + 1,
            detections['detection_scores'],
            category_index,
            use_normalized_coordinates=True,
            max_boxes_to_draw=5,  # Maximum number of boxes to draw on the frame
            min_score_thresh=0.8,  # Minimum confidence score to consider a detection
            agnostic_mode=False  # If True, treat all classes as one (agnostic to class)
        )

        # Display the frame with visualized detections
        cv2.imshow('object detection', cv2.resize(image_np_with_detections, (800, 600)))

        # Check for the 'q' key to exit the loop
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break
finally:
    # Always free the camera and close the preview window, whether the loop
    # ended via 'q', a failed read, an exception, or a kernel interrupt.
    # Otherwise the device stays locked until the kernel is restarted.
    cap.release()
    cv2.destroyAllWindows()