## Test the Retrieval Latency of Approximate vs Exact Matching 

In [None]:
import tensorflow as tf
import time

In [None]:
# Project identifier and Cloud Storage bucket name used by this notebook.
PROJECT_ID = 'ksalama-cloudml'
BUCKET = 'ksalama-cloudml'

# Every artifact referenced below sits under the same gs://<bucket>/bqml prefix.
_BQML_ROOT = 'gs://' + BUCKET + '/bqml'

# Passed to ScaNNMatcher for approximate matching.
INDEX_DIR = _BQML_ROOT + '/scann_index'
# Passed to ExactMatcher for exact matching.
BQML_MODEL_DIR = _BQML_ROOT + '/item_matching_model'
# Loaded with tf.saved_model.load to obtain the embedding lookup callable.
LOOKUP_MODEL_DIR = _BQML_ROOT + '/embedding_lookup_model'

In [None]:
# Query items used by both benchmarks below, keyed by item ID.
# Keys are numeric strings: the exact matcher converts them with int(), while
# the embedding lookup receives them as strings.
# NOTE(review): despite the name `songs`, the values read like apparel product
# titles; the name is kept because later cells refer to it.
songs = {
    # Low-numbered item IDs.
    '1': "Seven7 Women's Long Sleeve Stripe Belted Top",
    '2': "Calvin Klein Women's MSY Crew Neck Roll Sleeve",
    '3': "Calvin Klein Women's MSY Crew Neck Roll Sleeve",
    '4': "Bailey 44 Women's Undertow Top",
    '5': "Anne Klein Women's Plus-Size Button Front Blouse",
    '6': "Wilt Women's Color Blocked Big Mixed Slant Top",
    '7': "Lucky Brand Women's Riad Tee",
    '8': "Ella Moss Women's Stella Button Up Shirt",
    '9': "Alternative Women's Alice Drop Shoulder V-Neck",
    '10': "Calvin Klein Women's Plus-Size Print Drape Top",
    # Higher-numbered item IDs.
    '4096': "AX Paris Strapless Spot Print Orange Romper",
    '5120': "Lee Women's Plus-Size Comfort Fit Straight Leg Pant",
    '7424': "Allegra K Woman Plaid Elastic Waist Preppy Above Knee Skirt Gray Black S",
    '4352': "Silver Jeans Juniors Suki Surplus Mid Rise Bootcut Jean",
}

## Exact Matching

In [None]:
class ExactMatcher:
  """Exact item matcher backed by a TensorFlow SavedModel.

  The model is loaded once when the matcher is constructed and is queried
  through its 'serving_default' signature.
  """

  def __init__(self, model_dir):
    """Load the SavedModel used for matching.

    Args:
      model_dir: Location of the SavedModel; passed to tf.saved_model.load.
    """
    print("Loading exact matching model...")
    self.model = tf.saved_model.load(model_dir)
    print("Exact matching model is loaded.")

  def match(self, instances):
    """Run the serving signature on the given item IDs.

    Args:
      instances: Integer item IDs; they are converted to an int64 tensor
        before being handed to the model.

    Returns:
      The signature's 'predicted_item2_Id' output converted with .numpy().
      NOTE(review): callers index the result per input instance; the exact
      shape depends on the exported model - confirm against the model.
    """
    serving_fn = self.model.signatures['serving_default']
    outputs = serving_fn(tf.constant(instances, dtype=tf.dtypes.int64))
    return outputs['predicted_item2_Id'].numpy()

In [None]:
# Build the exact matcher; its constructor loads the SavedModel from
# BQML_MODEL_DIR and prints progress messages while doing so.
exact_matcher = ExactMatcher(model_dir=BQML_MODEL_DIR)

In [None]:
# Benchmark exact matching: query every item one at a time, repeat the whole
# pass several times, and report total and per-query latency.
exact_num_rounds = 100  # number of full passes over `songs`
exact_matches = {}  # item ID -> first row of the most recent match result

# perf_counter() is a monotonic, high-resolution clock meant for measuring
# intervals; time.time() follows the wall clock and can jump if it is adjusted.
# NOTE(review): the first query may include one-time warm-up cost inside
# TensorFlow - consider issuing an untimed warm-up call if that matters.
start_time = time.perf_counter()
for _ in range(exact_num_rounds):
  for song in songs:
    # The model takes integer IDs, so the string key is converted first.
    matches = exact_matcher.match([int(song)])
    exact_matches[song] = matches.tolist()[0]
end_time = time.perf_counter()
exact_elapsed_time = end_time - start_time

exact_num_queries = exact_num_rounds * len(songs)
print(f'Elapsed time: {round(exact_elapsed_time, 3)} seconds - average time: {exact_elapsed_time / exact_num_queries} seconds')

## Approximate Matching (ScaNN)

In [None]:
from index_server.matching import ScaNNMatcher
# Build the approximate matcher from the artifacts stored under INDEX_DIR.
# NOTE(review): presumably this loads a ScaNN index - confirm in
# index_server.matching.
scann_matcher = ScaNNMatcher(INDEX_DIR)
# Load the SavedModel at LOOKUP_MODEL_DIR. It is later called directly with a
# list of item-ID strings, and rows of its .numpy() result serve as query
# vectors for the approximate matcher.
embedding_lookup = tf.saved_model.load(LOOKUP_MODEL_DIR)

In [None]:
# Benchmark approximate matching: for every item, look up its embedding and
# query the ScaNN matcher; repeat the whole pass several times and report
# total and per-query latency. The timing includes the embedding lookup.
scann_num_rounds = 100  # number of full passes over `songs`
approx_matches = {}  # item ID -> most recent result of scann_matcher.match

# perf_counter() is a monotonic, high-resolution clock meant for measuring
# intervals; time.time() follows the wall clock and can jump if it is adjusted.
start_time = time.perf_counter()
for _ in range(scann_num_rounds):
  for song in songs:
    # The lookup model is given the item ID as a string and returns a batch;
    # take the single row as the query vector.
    vector = embedding_lookup([song]).numpy()[0]
    # NOTE(review): 50 is presumably the number of matches requested -
    # confirm against ScaNNMatcher.match.
    matches = scann_matcher.match(vector, 50)
    approx_matches[song] = matches
end_time = time.perf_counter()
scann_elapsed_time = end_time - start_time

scann_num_queries = scann_num_rounds * len(songs)
print(f'Elapsed time: {round(scann_elapsed_time, 3)} seconds - average time: {scann_elapsed_time / scann_num_queries} seconds')

In [None]:
# How many times faster the ScaNN run was than the exact run, based on the
# total elapsed times. Despite the `_percent` suffix, the value is a plain
# ratio (a multiplier), rounded to one decimal place.
speedup_ratio = exact_elapsed_time / scann_elapsed_time
speedup_percent = round(speedup_ratio, 1)
print(f'ScaNN speedup: {speedup_percent}x')

## License

Copyright 2020 Google LLC

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License. You may obtain a copy of the License at: http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 

See the License for the specific language governing permissions and limitations under the License.

**This is not an official Google product but sample code provided for an educational purpose**