# 1. Import Dependencies

In [1]:
!pip install opencv-python

Collecting opencv-python
  Downloading opencv_python-4.7.0.68-cp37-abi3-win_amd64.whl (38.2 MB)
     ---------------------------------------- 38.2/38.2 MB 4.5 MB/s eta 0:00:00
Collecting numpy>=1.19.3
  Downloading numpy-1.24.1-cp310-cp310-win_amd64.whl (14.8 MB)
     ---------------------------------------- 14.8/14.8 MB 4.8 MB/s eta 0:00:00
Installing collected packages: numpy, opencv-python
Successfully installed numpy-1.24.1 opencv-python-4.7.0.68


In [1]:
# Import Operating System
import os

# Import sys (used to locate the kernel's Python interpreter)
import sys

# Import time
import time

# Import uuid
import uuid

# Import opencv
import cv2

# 2. Define Images to Collect

In [3]:
# Label sets for image collection.
# NOTE(review): `labells` (double "l") is the list the folder-setup and capture
# cells iterate over; `labels` is only echoed in the next cell.
labels = [
    'thumbsup',
    'thumbsdown',
    'thankyou',
    'livelong',
]
labells = [
    'violetbottle',
    'papercup',
    'laptop',
]

# Number of frames to capture for each label.
number_imgs = 10

In [4]:
# Echo the `labels` list so its contents appear as the cell output.
labels

['thumbsup', 'thumbsdown', 'thankyou', 'livelong']

# 3. Set Up Folders

In [5]:
# Folder that receives the captured images, assembled from its components so
# the path separator matches the host operating system.
_collected_parts = ('Tensorflow', 'workspace', 'images', 'collectedimages')
IMAGES_PATH = os.path.join(*_collected_parts)

In [6]:
# Create the image root and one sub-folder per label.
# os.makedirs replaces the per-OS shell `mkdir` calls: it creates missing
# parent folders on every platform, copes with spaces in the path, and
# exist_ok=True makes the cell safe to re-run.
os.makedirs(IMAGES_PATH, exist_ok=True)
for label in labells:
    path = os.path.join(IMAGES_PATH, label)
    os.makedirs(path, exist_ok=True)

# 4. Capture Images

In [14]:
# Capture `number_imgs` frames per label from the camera and save each one as
# <IMAGES_PATH>/<label>/<label>.<uuid1>.jpg.

# Device index handed to cv2.VideoCapture; change it if the wrong camera
# (or no camera) is opened on this machine.
CAMERA_INDEX = 1

try:
    for label in labells:
        cap = cv2.VideoCapture(CAMERA_INDEX)
        try:
            if not cap.isOpened():
                raise RuntimeError('Could not open camera {}'.format(CAMERA_INDEX))
            print('Collecting images for {}'.format(label))
            time.sleep(10)  # pause before the first capture of each label
            for imgnum in range(number_imgs):
                print('Collecting image {}'.format(imgnum))
                ret, frame = cap.read()
                if not ret:
                    # read() reported failure, so `frame` must not be passed
                    # to imwrite/imshow; skip this capture instead.
                    print('Failed to read frame {} for {}, skipping'.format(imgnum, label))
                    continue
                imgname = os.path.join(IMAGES_PATH, label, '{}.{}.jpg'.format(label, uuid.uuid1()))
                cv2.imwrite(imgname, frame)
                cv2.imshow('frame', frame)
                time.sleep(5)  # pause between consecutive captures

                # 'q' ends collection for the current label only; the outer
                # loop then continues with the next label.
                if cv2.waitKey(1) & 0xFF == ord('q'):
                    break
        finally:
            # Release the device for every label, including on errors, so the
            # next VideoCapture does not compete with a still-open handle.
            cap.release()
finally:
    # Close the preview window even when the cell is interrupted or fails.
    cv2.destroyAllWindows()

Collecting images for violetbottle
Collecting image 0
Collecting image 1
Collecting image 2
Collecting image 3
Collecting image 4
Collecting images for papercup
Collecting image 0
Collecting image 1
Collecting image 2
Collecting image 3
Collecting image 4
Collecting images for laptop
Collecting image 0
Collecting image 1
Collecting image 2
Collecting image 3
Collecting image 4


# 5. Image Labelling

In [9]:
!pip install --upgrade pyqt5 lxml

Collecting pyqt5
  Downloading PyQt5-5.15.8-cp37-abi3-win_amd64.whl (6.8 MB)
     ---------------------------------------- 6.8/6.8 MB 4.3 MB/s eta 0:00:00
Collecting lxml
  Using cached lxml-4.9.2-cp310-cp310-win_amd64.whl (3.8 MB)
Collecting PyQt5-Qt5>=5.15.2
  Downloading PyQt5_Qt5-5.15.2-py3-none-win_amd64.whl (50.1 MB)
     ---------------------------------------- 50.1/50.1 MB 7.6 MB/s eta 0:00:00
Collecting PyQt5-sip<13,>=12.11
  Downloading PyQt5_sip-12.11.1-cp310-cp310-win_amd64.whl (78 kB)
     ---------------------------------------- 78.4/78.4 kB ? eta 0:00:00
Installing collected packages: PyQt5-Qt5, PyQt5-sip, lxml, pyqt5
Successfully installed PyQt5-Qt5-5.15.2 PyQt5-sip-12.11.1 lxml-4.9.2 pyqt5-5.15.8


In [4]:
# Folder the labelImg repository is cloned into, assembled from its components
# so the path separator matches the host operating system.
_labelimg_parts = ('Tensorflow', 'labelimg')
LABELIMG_PATH = os.path.join(*_labelimg_parts)

In [5]:
if not os.path.exists(LABELIMG_PATH):
    !mkdir {LABELIMG_PATH}
    !git clone https://github.com/tzutalin/labelImg {LABELIMG_PATH}

In [6]:
if os.name == 'posix':
    !make qt5py3
if os.name =='nt':
    !cd {LABELIMG_PATH} && pyrcc5 -o libs/resources.py resources.qrc

'pyrcc5' is not recognized as an internal or external command,
operable program or batch file.


In [7]:
!cd {LABELIMG_PATH} && python labelImg.py

Traceback (most recent call last):
  File "c:\Users\Owner\Desktop\Hackathon\TFODCourse\Tensorflow\labelimg\labelImg.py", line 13, in <module>
    from PyQt5.QtGui import *
ModuleNotFoundError: No module named 'PyQt5'

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "c:\Users\Owner\Desktop\Hackathon\TFODCourse\Tensorflow\labelimg\labelImg.py", line 22, in <module>
    import sip
ModuleNotFoundError: No module named 'sip'


# 6. Move them into a Training and Testing Partition

# OPTIONAL - 7. Compress them for Colab Training

In [20]:
# Locations of the train/test image folders and of the archive built from
# them; all three sit under the same images folder.
_images_root = os.path.join('Tensorflow', 'workspace', 'images')
TRAIN_PATH, TEST_PATH, ARCHIVE_PATH = (
    os.path.join(_images_root, leaf)
    for leaf in ('train', 'test', 'archive.tar.gz')
)

In [21]:
# Pack the TRAIN_PATH and TEST_PATH folders into one gzip-compressed tarball
# at ARCHIVE_PATH (-c create, -z gzip, -f output file).
# NOTE(review): no visible cell creates or fills the train/test folders, so
# they presumably have to be populated by hand first; confirm.
!tar -czf {ARCHIVE_PATH} {TRAIN_PATH} {TEST_PATH}