# GCP Courses/Videos Analysis

In [1]:
import pandas as pd

## Load Data

In [2]:
# Only these columns are used by the analysis below.
cols = ['format', 'name', 'credits', 'link']

# .copy() detaches the column subset from the frame returned by read_json, so
# later column assignments act on an independent frame instead of a derived
# selection (which is what triggers pandas' SettingWithCopyWarning).
# NOTE(review): orient='split' presumably mirrors how the checkpoint was written
# (DataFrame.to_json(orient='split')) — confirm against the export step.
catalog_data = pd.read_json(
    '../data/gcp_resources_chkp_230620.json', orient='split')[cols].copy()

## Preprocessing

In [3]:
def _as_anchor(url):
    """Wrap a URL in an HTML anchor that opens in a new tab.

    Values that already start with an anchor tag are returned unchanged, so
    executing this cell more than once does not nest one anchor inside another.
    """
    text = str(url)
    if text.startswith('<a href="'):
        # Already converted by a previous run of this cell.
        return text
    return f'<a href="{text}" target="_blank">link</a>'


# Replace the raw URL with a short clickable "link" for the styled tables below.
catalog_data['link'] = catalog_data['link'].apply(_as_anchor)

## Most expensive resources

In [4]:
# Number of rows shown in the table below.
limit = 10

# Order by format (A-Z), then credits (highest first), then name (A-Z).
# The sorted frame is bound back to `catalog_data`, so every later cell sees
# the rows in this order as well.
catalog_data = catalog_data.sort_values(
    by=['format', 'credits', 'name'],
    ascending=[True, False, True],
)

catalog_data.head(limit).style.format()

Unnamed: 0,format,name,credits,link
148,Course,Serverless Data Processing with Dataflow: Develop Pipelines,70,link
26,Course,Building Scalable Java Microservices with Spring Boot and Spring Cloud,55,link
55,Course,Enterprise Database Migration,55,link
13,Course,Architecting with Google Kubernetes Engine: Workloads,45,link
20,Course,Building Batch Data Pipelines on Google Cloud,45,link
111,Course,"Logging, Monitoring and Observability in Google Cloud",45,link
8,Course,Application Development with Cloud Run,40,link
30,Course,Computer Vision Fundamentals with Google Cloud,40,link
142,Course,Production Machine Learning Systems,40,link
1,Course,API Development on Google Cloud's Apigee API Platform,35,link


## Search resources

In [5]:
def contains(sentence):
    """Return a boolean mask of catalog rows whose name contains ``sentence``.

    The comparison is a case-insensitive, literal substring test against
    ``catalog_data['name']``.

    Parameters
    ----------
    sentence : str
        Text to look for. It is treated as plain text, not as a regular
        expression, and is lower-cased before matching.

    Returns
    -------
    pandas.Series
        Boolean Series aligned with ``catalog_data``. Rows whose name is
        missing are reported as ``False``.
    """
    names = catalog_data['name'].str.lower()
    # regex=False: search terms are plain phrases, so characters such as
    # '+', '(' or '.' must be matched literally rather than parsed as a pattern.
    # na=False: keeps the mask strictly boolean so it can be combined with
    # `|`, `&` and `~` even when some names are missing.
    return names.str.contains(sentence.lower(), regex=False, na=False)

def check_sentences(sentences):
    """Return a mask of catalog rows whose name matches ANY of ``sentences``.

    Parameters
    ----------
    sentences : sequence of str
        Search terms; each one is evaluated with ``contains`` and the
        individual masks are OR-ed together.

    Returns
    -------
    pandas.Series
        Boolean Series aligned with ``catalog_data``. An empty ``sentences``
        sequence matches nothing, so the mask is all ``False``.
    """
    if len(sentences) == 0:
        # No terms to look for: nothing can match (previously an IndexError).
        return pd.Series(False, index=catalog_data.index)

    check = contains(sentences[0])

    for sentence in sentences[1:]:
        # Rebind instead of `|=` so the mask returned by `contains` is never
        # modified in place.
        check = check | contains(sentence)

    return check

In [6]:
# Terms that mark a resource as relevant when they appear in its name.
valid_sentences = [
    'machine learning', 'ml', 'vertex', 'data science', 'tensorflow',
    'feature engineering', 'computer vision', 'natural language',
    'recommendation system', 'forecast',
]

# Terms that exclude a resource even when one of the valid terms matched
# (for example, 'lookml' contains the valid term 'ml').
invalid_sentences = ['lookml', 'bigquery']

valid_filter = check_sentences(valid_sentences)
invalid_filter = check_sentences(invalid_sentences)

# Keep rows that hit at least one valid term and none of the invalid ones.
# NOTE(review): `filter` shadows the Python builtin; the name is kept because
# cells outside this view may still read it.
filter = valid_filter & ~invalid_filter

# Apply the mask once and reuse the result for both the count and the table.
selected = catalog_data[filter]

print(f'{len(selected)} resources')

selected.style.format()

69 resources


Unnamed: 0,format,name,credits,link
30,Course,Computer Vision Fundamentals with Google Cloud,40,link
142,Course,Production Machine Learning Systems,40,link
112,Course,ML Pipelines on Google Cloud,30,link
114,Course,Machine Learning in the Enterprise,26,link
143,Course,Recommendation Systems on Google Cloud,25,link
154,Course,"Smart Analytics, Machine Learning, and AI on Google Cloud",25,link
155,Course,TensorFlow on Google Cloud,25,link
127,Course,Natural Language Processing on Google Cloud,21,link
9,Course,Applying Machine Learning to your Data with Google Cloud,20,link
59,Course,Feature Engineering,20,link
