# How to Use The Pre-Trained VGG Model to Classify Objects in Photographs

- VGG = [Oxford Visual Geometry Group](https://www.robots.ox.ac.uk/~vgg/)
- Source tutorial: https://machinelearningmastery.com/use-pre-trained-vgg-model-classify-objects-photographs/

In [8]:
import os

# for load_img, img_to_array
from keras import utils
from keras.applications.vgg16 import preprocess_input
from keras.applications.vgg16 import decode_predictions
from keras.applications.vgg16 import VGG16

from keras.applications.vgg19 import preprocess_input
from keras.applications.vgg19 import decode_predictions
from keras.applications.vgg19 import VGG19

In [2]:
# Root of the local development tree. The default is the original
# machine-specific location; set the VGG_DEMO_BASE environment variable before
# running this cell to point the notebook at a different checkout.
BASE = os.environ.get('VGG_DEMO_BASE') or '/Users/brinkley97/Documents/development/'
# Paths are assembled by plain string concatenation further down, so BASE has
# to end with a slash.
if not BASE.endswith('/'):
    BASE += '/'
# Course folder, appended to BASE.
CLASS_PATH = 'classes/csci_535_multimodal_probabilistic_learning/'
# Dataset folder, appended to CLASS_PATH.
DATASET_PATH = 'datasets/'

In [3]:
def simple_photo_classifier(model, image):
    """
    Classify a single photo and print the most likely label.

    model -- keras (VGG16, VGG19); its predict() is called on the prepared batch
    image -- str (of image with path to it)

    Nothing is returned; the class name and its probability (as a percentage
    with two decimals) are written to stdout.
    """
    # Read the file resized to 224x224 and turn the pixels into a numpy array.
    pixels = utils.img_to_array(utils.load_img(image, target_size=(224, 224)))

    # Prepend a batch axis of length 1, then apply the VGG input preprocessing.
    batch = preprocess_input(pixels.reshape((1, *pixels.shape)))

    # Probabilities across all output classes for the one image in the batch.
    probabilities = model.predict(batch)

    # Decode to class labels and keep the most likely entry of the only image.
    top_hit = decode_predictions(probabilities)[0][0]
    class_name, score = top_hit[1], top_hit[2]

    # Report the classification.
    print('%s (%.2f%%)' % (class_name, score * 100))

In [4]:
# Full path of the sample photo, built from the configured path pieces.
image = ''.join([BASE, CLASS_PATH, DATASET_PATH, 'misc/mug.jpg'])

# Load Models
- VGG16
- VGG19

In [5]:
# Instantiate VGG16 with its default arguments.
vgg16_model = VGG16()
# summary() prints the layer table itself and returns None, so wrapping it in
# print() only appends a stray "None" line to the output.
vgg16_model.summary()

2023-05-02 12:05:07.848535: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  SSE4.1 SSE4.2 AVX AVX2 FMA
To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.


Model: "vgg16"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0     

In [6]:
# Classify the sample photo with VGG16; the top label is printed.
simple_photo_classifier(model=vgg16_model, image=image)

coffee_mug (70.11%)


In [9]:
# Instantiate VGG19 with its default arguments.
vgg19_model = VGG19()
# summary() prints the layer table itself and returns None, so wrapping it in
# print() only appends a stray "None" line to the output.
vgg19_model.summary()

Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/vgg19/vgg19_weights_tf_dim_ordering_tf_kernels.h5
Model: "vgg19"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_2 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     14758

In [10]:
# Classify the same photo with VGG19; the top label is printed.
simple_photo_classifier(model=vgg19_model, image=image)

coffee_mug (85.46%)


In [None]:
# NOTE(review): this cell repeats the VGG19 load cell above and rebuilds the
# model a second time; consider removing it.
vgg19_model = VGG19()
# summary() prints the layer table itself and returns None, so it is called
# directly rather than through print().
vgg19_model.summary()

In [None]:
# Classify the sample photo with VGG19; the top label is printed.
simple_photo_classifier(model=vgg19_model, image=image)