# 1. Import Dependencies

In [1]:
!pip install opencv-python

Collecting opencv-python
  Using cached opencv_python-4.5.3.56-cp37-cp37m-win_amd64.whl (34.9 MB)
Collecting numpy>=1.14.5
  Using cached numpy-1.21.1-cp37-cp37m-win_amd64.whl (14.0 MB)
Installing collected packages: numpy, opencv-python
Successfully installed numpy-1.21.1 opencv-python-4.5.3.56


In [2]:
# Import opencv
import cv2 

# Import uuid
import uuid

# Import Operating System
import os

# Import time
import time

# 2. Define Images to Collect

In [1]:
# Capture settings: how many frames to grab per class, and the class names.
# Each name in `labels` is also used as a sub-folder name and file-name prefix.
number_imgs = 10
labels = ["IDcard"]

# 3. Set Up Folders

In [3]:
# Root folder (relative to the notebook's working directory) that receives the
# captured images; one sub-folder per label is created beneath it.
IMAGES_PATH = os.path.join(
    os.path.join('Tensorflow', 'workspace', 'images'),
    'collectedimages',
)

In [4]:
# Create the collection root and one sub-folder per label.
# os.makedirs replaces the per-OS `!mkdir` shell calls: it creates missing
# parent folders on every platform, is unaffected by spaces in the path, and
# exist_ok=True makes the cell safe to re-run.
os.makedirs(IMAGES_PATH, exist_ok=True)
for label in labels:
    path = os.path.join(IMAGES_PATH, label)
    os.makedirs(path, exist_ok=True)

# 4. Capture Images

In [6]:
# Capture `number_imgs` webcam frames for every label and save each frame as
# <IMAGES_PATH>/<label>/<label>.<uuid1>.jpg. Pressing 'q' in the preview window
# stops collection for the current label.
try:
    for label in labels:
        cap = cv2.VideoCapture(0)
        try:
            if not cap.isOpened():
                raise RuntimeError('Could not open the webcam (device 0)')
            print('Collecting images for {}'.format(label))
            # Pause before the first capture (presumably to position the object).
            time.sleep(5)
            for imgnum in range(number_imgs):
                print('Collecting image {}'.format(imgnum))
                ret, frame = cap.read()
                if not ret:
                    # A failed read returns no frame; imwrite/imshow would raise on it.
                    print('Failed to read frame {} for {}, skipping'.format(imgnum, label))
                    continue
                imgname = os.path.join(IMAGES_PATH,label,label+'.'+'{}.jpg'.format(str(uuid.uuid1())))
                cv2.imwrite(imgname, frame)
                cv2.imshow('frame', frame)
                time.sleep(2)

                if cv2.waitKey(1) & 0xFF == ord('q'):
                    break
        finally:
            # Each label opens its own capture handle, so release it per label
            # instead of only once after the outer loop.
            cap.release()
finally:
    # Close the preview window even if capturing was interrupted by an error.
    cv2.destroyAllWindows()

Collecting images for IDcard
Collecting image 0
Collecting image 1
Collecting image 2
Collecting image 3
Collecting image 4
Collecting image 5
Collecting image 6
Collecting image 7
Collecting image 8
Collecting image 9


# 5. Image Labelling

In [9]:
!pip install --upgrade pyqt5 lxml

Collecting pyqt5
  Downloading PyQt5-5.15.4-cp36.cp37.cp38.cp39-none-win_amd64.whl (6.8 MB)
Collecting lxml
  Downloading lxml-4.6.3-cp37-cp37m-win_amd64.whl (3.5 MB)
Collecting PyQt5-Qt5>=5.15
  Downloading PyQt5_Qt5-5.15.2-py3-none-win_amd64.whl (50.1 MB)
Collecting PyQt5-sip<13,>=12.8
  Downloading PyQt5_sip-12.9.0-cp37-cp37m-win_amd64.whl (62 kB)
Installing collected packages: PyQt5-sip, PyQt5-Qt5, pyqt5, lxml
Successfully installed PyQt5-Qt5-5.15.2 PyQt5-sip-12.9.0 lxml-4.6.3 pyqt5-5.15.4


In [7]:
# Folder (relative to the notebook's working directory) that holds the
# labelImg checkout.
LABELIMG_PATH = os.sep.join(('Tensorflow', 'labelimg'))

In [11]:
if not os.path.exists(LABELIMG_PATH):
    !mkdir {LABELIMG_PATH}
    !git clone https://github.com/tzutalin/labelImg {LABELIMG_PATH}

Cloning into 'Tensorflow\labelimg'...


In [8]:
if os.name == 'posix':
    !make qt5py3
if os.name =='nt':
    !cd {LABELIMG_PATH} && pyrcc5 -o libs/resources.py resources.qrc

In [9]:
# Start the labelImg GUI by running labelImg.py from inside LABELIMG_PATH.
# NOTE(review): `python` is whatever interpreter is first on PATH; confirm it
# is the environment that has pyqt5 and lxml installed.
!cd {LABELIMG_PATH} && python labelImg.py

Image:D:\Data Science\Jupyter\ID card detection and OCR\TFODCourse\Tensorflow\workspace\images\collectedimages\IDcard\IDcard.8a2e6f68-f5ae-11eb-89c6-f0038c43e360.jpg -> Annotation:D:/Data Science/Jupyter/ID card detection and OCR/TFODCourse/Tensorflow/workspace/images/collectedimages/IDcard/IDcard.8a2e6f68-f5ae-11eb-89c6-f0038c43e360.xml
Image:D:\Data Science\Jupyter\ID card detection and OCR\TFODCourse\Tensorflow\workspace\images\collectedimages\IDcard\IDcard.b131247e-f5ae-11eb-aae3-f0038c43e360.jpg -> Annotation:D:/Data Science/Jupyter/ID card detection and OCR/TFODCourse/Tensorflow/workspace/images/collectedimages/IDcard/IDcard.b131247e-f5ae-11eb-aae3-f0038c43e360.xml
Image:D:\Data Science\Jupyter\ID card detection and OCR\TFODCourse\Tensorflow\workspace\images\collectedimages\IDcard\IDcard.b266f476-f5ae-11eb-b43e-f0038c43e360.jpg -> Annotation:D:/Data Science/Jupyter/ID card detection and OCR/TFODCourse/Tensorflow/workspace/images/collectedimages/IDcard/IDcard.b266f476-f5ae-11eb-b4

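# 6. Move the Labelled Images into Training and Testing Partitions

Manually copy each image together with its `.xml` annotation file into `Tensorflow/workspace/images/train` or `Tensorflow/workspace/images/test` before continuing.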

# OPTIONAL - 7. Compress them for Colab Training

In [20]:
# Train/test image folders and the tarball that bundles them, all located
# under Tensorflow/workspace/images.
TRAIN_PATH, TEST_PATH, ARCHIVE_PATH = (
    os.path.join('Tensorflow', 'workspace', 'images', leaf)
    for leaf in ('train', 'test', 'archive.tar.gz')
)

In [21]:
# Pack the train and test folders into a single gzip-compressed tarball at
# ARCHIVE_PATH (tar flags: c = create, z = gzip, f = archive file name).
# NOTE(review): assumes TRAIN_PATH and TEST_PATH already exist and are
# populated; nothing in this notebook creates them.
!tar -czf {ARCHIVE_PATH} {TRAIN_PATH} {TEST_PATH}