# 1. Import Dependencies

In [1]:
!pip install opencv-python

Collecting opencv-python
  Obtaining dependency information for opencv-python from https://files.pythonhosted.org/packages/a6/08/583e1d8d589e80a702815f58daa317bd469a32c7dc339394e2a0dc14318b/opencv_python-4.8.0.74-cp37-abi3-win_amd64.whl.metadata
  Using cached opencv_python-4.8.0.74-cp37-abi3-win_amd64.whl.metadata (19 kB)
Collecting numpy>=1.21.2 (from opencv-python)
  Obtaining dependency information for numpy>=1.21.2 from https://files.pythonhosted.org/packages/b7/db/4d37359e2c9cf8bf071c08b8a6f7374648a5ab2e76e2e22e3b808f81d507/numpy-1.25.2-cp310-cp310-win_amd64.whl.metadata
  Downloading numpy-1.25.2-cp310-cp310-win_amd64.whl.metadata (5.7 kB)
Using cached opencv_python-4.8.0.74-cp37-abi3-win_amd64.whl (38.1 MB)
Downloading numpy-1.25.2-cp310-cp310-win_amd64.whl (15.6 MB)
   ---------------------------------------- 0.0/15.6 MB ? eta -:--:--
   ---------------------------------------- 0.1/15.6 MB 4.3 MB/s eta 0:00:04
   - -------------------------------------- 0.7/15.6 MB 8.3 MB/s et

In [2]:
# Import opencv
import cv2 

# Import uuid
import uuid

# Import Operating System
import os

# Import time
import time

# 2. Define Images to Collect

In [3]:
# Object classes to collect images for; a sub-folder is created per label.
labels = ['emblem', 'title', 'name', 'signature']
# Number of frames captured from the camera for each label.
number_imgs = 5

In [8]:
import os
import shutil

def rename_files(folder_path, new_name):
    """Rename every JPG in ``folder_path`` to ``<new_name><index>.jpg``.

    Entries whose name ends with ``.jpg`` (case-insensitive) are taken in
    sorted (lexicographic) name order and numbered starting at 1. Other
    entries in the folder are left untouched.

    The rename is done in two phases (source -> temporary name -> final
    name) so that a file which already carries one of the target names
    (e.g. ``title1.jpg``) is never overwritten by an earlier rename.

    Args:
        folder_path: Directory whose JPG files should be renamed.
        new_name: Prefix for the new file names.

    Raises:
        OSError: Propagated from ``os.listdir`` / ``shutil.move`` (for
            example when ``folder_path`` does not exist).
    """
    import uuid  # local import: only needed for collision-free staging names

    # os.listdir returns entries in arbitrary order; sort so the numbering
    # is deterministic from run to run.
    jpg_files = sorted(
        file for file in os.listdir(folder_path) if file.lower().endswith(".jpg")
    )

    # Phase 1: park every source file under a unique temporary name. The
    # temporary names do not end in ".jpg", so they can never collide with a
    # source or a target name.
    token = uuid.uuid4().hex
    staged = []
    for index, jpg_file in enumerate(jpg_files, start=1):
        old_file_path = os.path.join(folder_path, jpg_file)
        temp_file_path = os.path.join(folder_path, f".{token}.{index}.renaming")
        new_file_path = os.path.join(folder_path, f"{new_name}{index}.jpg")
        shutil.move(old_file_path, temp_file_path)
        staged.append((temp_file_path, new_file_path))

    # Phase 2: every original JPG name is now free, so the final names can
    # be assigned without clobbering anything.
    for temp_file_path, new_file_path in staged:
        shutil.move(temp_file_path, new_file_path)

if __name__ == "__main__":
    # Built relative to the notebook's working directory, like the other
    # paths in this notebook, instead of a machine-specific absolute path.
    # NOTE(review): assumes the notebook is run from the folder that
    # contains `Tensorflow/` - confirm.
    folder_path = os.path.join('Tensorflow', 'workspace', 'images', 'collectedimages', 'title')  # Replace with your actual folder path
    new_name = "title"  # Replace with the desired new name

    # The folder may not exist yet (e.g. on a fresh run, before any images
    # were collected); skip instead of raising from os.listdir.
    if os.path.isdir(folder_path):
        rename_files(folder_path, new_name)
    else:
        print('Skipping rename: {} does not exist'.format(folder_path))


# 3. Setup Folders 

In [4]:
# Root folder for the captured images, relative to the working directory.
IMAGES_PATH = os.path.join('Tensorflow', 'workspace', 'images', 'collectedimages')

In [5]:
# Create the collection root and one sub-folder per label.
# os.makedirs creates missing parent folders, is a no-op when the folder
# already exists (exist_ok=True), and behaves the same on every platform,
# so no OS-specific shell `mkdir` is needed.
os.makedirs(IMAGES_PATH, exist_ok=True)
for label in labels:
    path = os.path.join(IMAGES_PATH, label)
    os.makedirs(path, exist_ok=True)

# 4. Capture Images

In [18]:
# Capture `number_imgs` frames per label from the default camera and save
# each one as <IMAGES_PATH>/<label>/<label>.<uuid>.jpg.
for label in labels:
    # A capture handle is opened for every label, so it must also be released
    # for every label (the `finally` below), not just once after the loop.
    cap = cv2.VideoCapture(0)
    try:
        if not cap.isOpened():
            print('Could not open camera, skipping {}'.format(label))
            continue
        print('Collecting images for {}'.format(label))
        # Pause so the next object can be positioned in front of the camera.
        time.sleep(5)
        for imgnum in range(number_imgs):
            print('Collecting image {}'.format(imgnum))
            ret, frame = cap.read()
            if not ret:
                # No frame was grabbed; do not hand an empty frame to
                # imwrite/imshow.
                print('Failed to read frame for image {}'.format(imgnum))
                continue
            imgname = os.path.join(IMAGES_PATH,label,label+'.'+'{}.jpg'.format(str(uuid.uuid1())))
            cv2.imwrite(imgname, frame)
            cv2.imshow('frame', frame)
            time.sleep(2)

            # Pressing 'q' stops collecting for the current label only.
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
    finally:
        cap.release()
cv2.destroyAllWindows()

Collecting images for thumbsup
Collecting image 0
Collecting image 1
Collecting image 2
Collecting image 3
Collecting image 4


# 5. Image Labelling

In [9]:
!pip install --upgrade pyqt5 lxml

Collecting pyqt5
  Using cached PyQt5-5.15.9-cp37-abi3-win_amd64.whl (6.8 MB)
Collecting lxml
  Obtaining dependency information for lxml from https://files.pythonhosted.org/packages/50/ba/cb7bc9728a3be4e00dfd658fc76dc64fd9dbc3d5492ff44cda70574329c6/lxml-4.9.3-cp310-cp310-win_amd64.whl.metadata
  Using cached lxml-4.9.3-cp310-cp310-win_amd64.whl.metadata (3.9 kB)
Collecting PyQt5-sip<13,>=12.11 (from pyqt5)
  Obtaining dependency information for PyQt5-sip<13,>=12.11 from https://files.pythonhosted.org/packages/9e/d1/2865085040c7bc553298553f51d6ac46b5051481b5c3eb8aad4bb5b63497/PyQt5_sip-12.12.2-cp310-cp310-win_amd64.whl.metadata
  Using cached PyQt5_sip-12.12.2-cp310-cp310-win_amd64.whl.metadata (524 bytes)
Collecting PyQt5-Qt5>=5.15.2 (from pyqt5)
  Using cached PyQt5_Qt5-5.15.2-py3-none-win_amd64.whl (50.1 MB)
Using cached lxml-4.9.3-cp310-cp310-win_amd64.whl (3.8 MB)
Using cached PyQt5_sip-12.12.2-cp310-cp310-win_amd64.whl (78 kB)
Installing collected packages: PyQt5-Qt5, PyQt5-sip, 

In [10]:
# Folder the labelImg repository is cloned into, relative to the working directory.
LABELIMG_PATH = os.path.join('Tensorflow', 'labelimg')

In [11]:
# Clone labelImg only when its folder is not present yet, so re-running
# this cell does not attempt a second clone.
if not os.path.exists(LABELIMG_PATH):
    !mkdir {LABELIMG_PATH}
    !git clone https://github.com/tzutalin/labelImg {LABELIMG_PATH}

Cloning into 'Tensorflow\labelimg'...


In [12]:
if os.name == 'posix':
    !make qt5py3
if os.name =='nt':
    !cd {LABELIMG_PATH} && pyrcc5 -o libs/resources.py resources.qrc

In [None]:
# Run labelImg.py from inside the labelImg checkout.
!cd {LABELIMG_PATH} && python labelImg.py

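# 6. Move the Labelled Images into Training and Testing Partitions

No code cell is provided for this step: split the labelled images (together with any annotation files saved next to them) between `Tensorflow/workspace/images/train` and `Tensorflow/workspace/images/test` before continuing.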

# OPTIONAL - 7. Compress them for Colab Training

In [20]:
# Train/test partition folders and the archive that is built from them.
TRAIN_PATH = os.path.join('Tensorflow', 'workspace', 'images', 'train')
TEST_PATH = os.path.join('Tensorflow', 'workspace', 'images', 'test')
ARCHIVE_PATH = os.path.join('Tensorflow', 'workspace', 'images', 'archive.tar.gz')

In [21]:
# Pack the train and test folders into a single gzip-compressed tar archive.
!tar -czf {ARCHIVE_PATH} {TRAIN_PATH} {TEST_PATH}